diff --git "a/wandb/run-20220302_154455-17zs7rwf/files/wandb-summary.json" "b/wandb/run-20220302_154455-17zs7rwf/files/wandb-summary.json" --- "a/wandb/run-20220302_154455-17zs7rwf/files/wandb-summary.json" +++ "b/wandb/run-20220302_154455-17zs7rwf/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 5.1519, "train/learning_rate": 1.741654571843251e-06, "train/epoch": 1.0, "train/global_step": 1189, "_runtime": 8088, "_timestamp": 1646243983, "_step": 1192, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 39.0, 666.0, 303.0, 7.0, 1.0, 0.0, 1.0], "bins": [-403.2832946777344, -396.4258117675781, -389.5683288574219, -382.7108459472656, -375.8533630371094, -368.9958801269531, -362.138427734375, -355.28094482421875, -348.4234619140625, -341.56597900390625, -334.70849609375, -327.85101318359375, -320.9935302734375, -314.13604736328125, -307.278564453125, -300.42108154296875, -293.5635986328125, -286.70611572265625, -279.8486328125, -272.99114990234375, -266.1336669921875, -259.27618408203125, -252.41871643066406, -245.5612335205078, -238.70376586914062, -231.84628295898438, -224.98880004882812, -218.13131713867188, -211.2738494873047, -204.41636657714844, -197.5588836669922, -190.70140075683594, -183.84393310546875, -176.9864501953125, -170.12896728515625, -163.271484375, -156.4140167236328, -149.55653381347656, -142.6990509033203, -135.84156799316406, -128.9840850830078, -122.12660217285156, -115.26912689208984, -108.4116439819336, -101.55416107177734, -94.69668579101562, -87.83920288085938, -80.98171997070312, -74.12423706054688, -67.26675415039062, -60.40927505493164, -53.551795959472656, -46.694313049316406, -39.83683395385742, -32.97935485839844, -26.121871948242188, -19.264392852783203, -12.406911849975586, -5.549431800842285, 1.3080482482910156, 8.165529251098633, 15.02301025390625, 21.880489349365234, 28.737972259521484, 35.59545135498047]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 2.0, 4.0, 10.0, 8.0, 12.0, 10.0, 11.0, 23.0, 12.0, 16.0, 20.0, 30.0, 24.0, 30.0, 35.0, 37.0, 35.0, 57.0, 39.0, 42.0, 42.0, 43.0, 40.0, 36.0, 42.0, 36.0, 30.0, 32.0, 24.0, 31.0, 28.0, 17.0, 24.0, 21.0, 15.0, 14.0, 14.0, 13.0, 6.0, 5.0, 4.0, 8.0, 3.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-56.051300048828125, -54.218135833740234, -52.384971618652344, -50.55180740356445, -48.71864318847656, -46.88547897338867, -45.05231475830078, -43.21915054321289, -41.385986328125, -39.55282211303711, -37.71965789794922, -35.88649368286133, -34.05332946777344, -32.22016525268555, -30.387001037597656, -28.553836822509766, -26.720674514770508, -24.887510299682617, -23.054346084594727, -21.221181869506836, -19.388017654418945, -17.554855346679688, -15.72169017791748, -13.88852596282959, -12.0553617477417, -10.222197532653809, -8.389033317565918, -6.5558695793151855, -4.722705364227295, -2.8895416259765625, -1.0563774108886719, 0.7767868041992188, 2.6099510192871094, 4.443115234375, 6.276279449462891, 8.109443664550781, 9.942607879638672, 11.775771141052246, 13.608935356140137, 15.442099571228027, 17.275264739990234, 19.108428955078125, 20.941593170166016, 22.774757385253906, 24.607921600341797, 26.441085815429688, 28.274250030517578, 30.10741424560547, 31.940576553344727, 33.773738861083984, 35.606903076171875, 37.440067291259766, 39.273231506347656, 41.10639572143555, 42.93955993652344, 44.77272415161133, 46.60588836669922, 48.43905258178711, 50.272216796875, 52.10538101196289, 53.93854522705078, 55.77170944213867, 57.60487365722656, 59.43803787231445, 61.271202087402344]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 15.0, 13.0, 14.0, 33.0, 29.0, 41.0, 51.0, 70.0, 70.0, 74.0, 85.0, 77.0, 74.0, 68.0, 60.0, 59.0, 45.0, 45.0, 27.0, 15.0, 14.0, 7.0, 7.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.728515625, -3.641937255859375, -3.55535888671875, -3.468780517578125, -3.3822021484375, -3.295623779296875, -3.20904541015625, -3.122467041015625, -3.035888671875, -2.949310302734375, -2.86273193359375, -2.776153564453125, -2.6895751953125, -2.602996826171875, -2.51641845703125, -2.429840087890625, -2.34326171875, -2.256683349609375, -2.17010498046875, -2.083526611328125, -1.9969482421875, -1.910369873046875, -1.82379150390625, -1.737213134765625, -1.650634765625, -1.564056396484375, -1.47747802734375, -1.390899658203125, -1.3043212890625, -1.217742919921875, -1.13116455078125, -1.044586181640625, -0.9580078125, -0.871429443359375, -0.78485107421875, -0.698272705078125, -0.6116943359375, -0.525115966796875, -0.43853759765625, -0.351959228515625, -0.265380859375, -0.178802490234375, -0.09222412109375, -0.005645751953125, 0.0809326171875, 0.167510986328125, 0.25408935546875, 0.340667724609375, 0.42724609375, 0.513824462890625, 0.60040283203125, 0.686981201171875, 0.7735595703125, 0.860137939453125, 0.94671630859375, 1.033294677734375, 1.119873046875, 1.206451416015625, 1.29302978515625, 1.379608154296875, 1.4661865234375, 1.552764892578125, 1.63934326171875, 1.725921630859375, 1.8125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 0.0, 10.0, 11.0, 23.0, 29.0, 64.0, 77.0, 120.0, 228.0, 450.0, 833.0, 2069.0, 6217.0, 47833.0, 3781207.0, 334939.0, 14092.0, 3323.0, 1314.0, 631.0, 346.0, 189.0, 111.0, 59.0, 35.0, 33.0, 18.0, 9.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-24.46875, -23.882568359375, -23.29638671875, -22.710205078125, -22.1240234375, -21.537841796875, -20.95166015625, -20.365478515625, -19.779296875, -19.193115234375, -18.60693359375, -18.020751953125, -17.4345703125, -16.848388671875, -16.26220703125, -15.676025390625, -15.08984375, -14.503662109375, -13.91748046875, -13.331298828125, -12.7451171875, -12.158935546875, -11.57275390625, -10.986572265625, -10.400390625, -9.814208984375, -9.22802734375, -8.641845703125, -8.0556640625, -7.469482421875, -6.88330078125, -6.297119140625, -5.7109375, -5.124755859375, -4.53857421875, -3.952392578125, -3.3662109375, -2.780029296875, -2.19384765625, -1.607666015625, -1.021484375, -0.435302734375, 0.15087890625, 0.737060546875, 1.3232421875, 1.909423828125, 2.49560546875, 3.081787109375, 3.66796875, 4.254150390625, 4.84033203125, 5.426513671875, 6.0126953125, 6.598876953125, 7.18505859375, 7.771240234375, 8.357421875, 8.943603515625, 9.52978515625, 10.115966796875, 10.7021484375, 11.288330078125, 11.87451171875, 12.460693359375, 13.046875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 3.0, 6.0, 12.0, 23.0, 34.0, 64.0, 139.0, 237.0, 451.0, 822.0, 948.0, 613.0, 318.0, 179.0, 94.0, 63.0, 28.0, 21.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-17.90625, -17.5263671875, -17.146484375, -16.7666015625, -16.38671875, -16.0068359375, -15.626953125, -15.2470703125, -14.8671875, -14.4873046875, -14.107421875, -13.7275390625, -13.34765625, -12.9677734375, -12.587890625, -12.2080078125, -11.828125, -11.4482421875, -11.068359375, -10.6884765625, -10.30859375, -9.9287109375, -9.548828125, -9.1689453125, -8.7890625, -8.4091796875, -8.029296875, -7.6494140625, -7.26953125, -6.8896484375, -6.509765625, -6.1298828125, -5.75, -5.3701171875, -4.990234375, -4.6103515625, -4.23046875, -3.8505859375, -3.470703125, -3.0908203125, -2.7109375, -2.3310546875, -1.951171875, -1.5712890625, -1.19140625, -0.8115234375, -0.431640625, -0.0517578125, 0.328125, 0.7080078125, 1.087890625, 1.4677734375, 1.84765625, 2.2275390625, 2.607421875, 2.9873046875, 3.3671875, 3.7470703125, 4.126953125, 4.5068359375, 4.88671875, 5.2666015625, 5.646484375, 6.0263671875, 6.40625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 8.0, 9.0, 10.0, 27.0, 50.0, 123.0, 263.0, 691.0, 3128.0, 691723.0, 3491822.0, 4969.0, 883.0, 330.0, 129.0, 62.0, 27.0, 12.0, 8.0, 10.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.28125, -44.79248046875, -43.3037109375, -41.81494140625, -40.326171875, -38.83740234375, -37.3486328125, -35.85986328125, -34.37109375, -32.88232421875, -31.3935546875, -29.90478515625, -28.416015625, -26.92724609375, -25.4384765625, -23.94970703125, -22.4609375, -20.97216796875, -19.4833984375, -17.99462890625, -16.505859375, -15.01708984375, -13.5283203125, -12.03955078125, -10.55078125, -9.06201171875, -7.5732421875, -6.08447265625, -4.595703125, -3.10693359375, -1.6181640625, -0.12939453125, 1.359375, 2.84814453125, 4.3369140625, 5.82568359375, 7.314453125, 8.80322265625, 10.2919921875, 11.78076171875, 13.26953125, 14.75830078125, 16.2470703125, 17.73583984375, 19.224609375, 20.71337890625, 22.2021484375, 23.69091796875, 25.1796875, 26.66845703125, 28.1572265625, 29.64599609375, 31.134765625, 32.62353515625, 34.1123046875, 35.60107421875, 37.08984375, 38.57861328125, 40.0673828125, 41.55615234375, 43.044921875, 44.53369140625, 46.0224609375, 47.51123046875, 49.0]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 11.0, 67.0, 329.0, 452.0, 125.0, 25.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-148.87753295898438, -146.17604064941406, -143.47454833984375, -140.77305603027344, -138.07156372070312, -135.3700714111328, -132.6685791015625, -129.9670867919922, -127.26558685302734, -124.56409454345703, -121.86260223388672, -119.1611099243164, -116.4596176147461, -113.75811767578125, -111.05662536621094, -108.35513305664062, -105.65364074707031, -102.9521484375, -100.25065612792969, -97.54916381835938, -94.84767150878906, -92.14617919921875, -89.44468688964844, -86.7431869506836, -84.04170227050781, -81.3402099609375, -78.63871765136719, -75.93722534179688, -73.23573303222656, -70.53424072265625, -67.83274841308594, -65.1312484741211, -62.42975616455078, -59.72826385498047, -57.026771545410156, -54.325279235839844, -51.623783111572266, -48.92229080200195, -46.22079849243164, -43.51930236816406, -40.81781005859375, -38.11631774902344, -35.414825439453125, -32.71333312988281, -30.011837005615234, -27.310344696044922, -24.60885238647461, -21.907358169555664, -19.20586585998535, -16.50437355041504, -13.802879333496094, -11.101387023925781, -8.399893760681152, -5.698400497436523, -2.996908187866211, -0.2954139709472656, 2.406078338623047, 5.107571601867676, 7.8090643882751465, 10.510557174682617, 13.212050437927246, 15.913543701171875, 18.615036010742188, 21.316530227661133, 24.018022537231445]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 3.0, 8.0, 12.0, 7.0, 6.0, 13.0, 15.0, 12.0, 24.0, 22.0, 26.0, 29.0, 29.0, 27.0, 36.0, 46.0, 44.0, 44.0, 49.0, 51.0, 54.0, 36.0, 35.0, 48.0, 35.0, 30.0, 32.0, 35.0, 40.0, 24.0, 18.0, 22.0, 11.0, 18.0, 13.0, 15.0, 5.0, 7.0, 5.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0], "bins": [-29.539199829101562, -28.756149291992188, -27.973098754882812, -27.190048217773438, -26.406997680664062, -25.623945236206055, -24.84089469909668, -24.057844161987305, -23.27479362487793, -22.491743087768555, -21.70869255065918, -20.925642013549805, -20.142589569091797, -19.359539031982422, -18.576488494873047, -17.793437957763672, -17.010387420654297, -16.227336883544922, -15.444286346435547, -14.661234855651855, -13.87818431854248, -13.095133781433105, -12.312082290649414, -11.529031753540039, -10.745981216430664, -9.962930679321289, -9.179880142211914, -8.396828651428223, -7.613778114318848, -6.830727577209473, -6.0476765632629395, -5.264625549316406, -4.481575012207031, -3.698524236679077, -2.915473461151123, -2.132422685623169, -1.3493719100952148, -0.5663211345672607, 0.21672964096069336, 0.9997806549072266, 1.7828311920166016, 2.5658819675445557, 3.3489327430725098, 4.131983757019043, 4.915034294128418, 5.698084831237793, 6.481135845184326, 7.264186859130859, 8.047237396240234, 8.83028793334961, 9.613338470458984, 10.396389961242676, 11.17944049835205, 11.962491035461426, 12.745542526245117, 13.528593063354492, 14.311643600463867, 15.094694137573242, 15.877744674682617, 16.660795211791992, 17.44384765625, 18.226898193359375, 19.00994873046875, 19.792999267578125, 20.5760498046875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 7.0, 4.0, 4.0, 18.0, 14.0, 25.0, 21.0, 20.0, 31.0, 48.0, 49.0, 40.0, 65.0, 68.0, 56.0, 69.0, 63.0, 62.0, 65.0, 53.0, 43.0, 38.0, 40.0, 28.0, 22.0, 10.0, 17.0, 6.0, 10.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0], "bins": [-3.1328125, -3.0621490478515625, -2.991485595703125, -2.9208221435546875, -2.85015869140625, -2.7794952392578125, -2.708831787109375, -2.6381683349609375, -2.5675048828125, -2.4968414306640625, -2.426177978515625, -2.3555145263671875, -2.28485107421875, -2.2141876220703125, -2.143524169921875, -2.0728607177734375, -2.002197265625, -1.9315338134765625, -1.860870361328125, -1.7902069091796875, -1.71954345703125, -1.6488800048828125, -1.578216552734375, -1.5075531005859375, -1.4368896484375, -1.3662261962890625, -1.295562744140625, -1.2248992919921875, -1.15423583984375, -1.0835723876953125, -1.012908935546875, -0.9422454833984375, -0.87158203125, -0.8009185791015625, -0.730255126953125, -0.6595916748046875, -0.58892822265625, -0.5182647705078125, -0.447601318359375, -0.3769378662109375, -0.3062744140625, -0.2356109619140625, -0.164947509765625, -0.0942840576171875, -0.02362060546875, 0.0470428466796875, 0.117706298828125, 0.1883697509765625, 0.259033203125, 0.3296966552734375, 0.400360107421875, 0.4710235595703125, 0.54168701171875, 0.6123504638671875, 0.683013916015625, 0.7536773681640625, 0.8243408203125, 0.8950042724609375, 0.965667724609375, 1.0363311767578125, 1.10699462890625, 1.1776580810546875, 1.248321533203125, 1.3189849853515625, 1.3896484375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 6.0, 6.0, 8.0, 5.0, 8.0, 11.0, 9.0, 11.0, 25.0, 35.0, 64.0, 97.0, 178.0, 414.0, 866.0, 1655.0, 3606.0, 7591.0, 16643.0, 38682.0, 103024.0, 415424.0, 311612.0, 87079.0, 33793.0, 14710.0, 6696.0, 3208.0, 1515.0, 746.0, 369.0, 179.0, 80.0, 60.0, 41.0, 23.0, 11.0, 8.0, 10.0, 13.0, 6.0, 11.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0218048095703125, -0.02114248275756836, -0.02048015594482422, -0.019817829132080078, -0.019155502319335938, -0.018493175506591797, -0.017830848693847656, -0.017168521881103516, -0.016506195068359375, -0.015843868255615234, -0.015181541442871094, -0.014519214630126953, -0.013856887817382812, -0.013194561004638672, -0.012532234191894531, -0.01186990737915039, -0.01120758056640625, -0.01054525375366211, -0.009882926940917969, -0.009220600128173828, -0.008558273315429688, -0.007895946502685547, -0.007233619689941406, -0.006571292877197266, -0.005908966064453125, -0.005246639251708984, -0.004584312438964844, -0.003921985626220703, -0.0032596588134765625, -0.002597332000732422, -0.0019350051879882812, -0.0012726783752441406, -0.0006103515625, 5.1975250244140625e-05, 0.0007143020629882812, 0.0013766288757324219, 0.0020389556884765625, 0.002701282501220703, 0.0033636093139648438, 0.004025936126708984, 0.004688262939453125, 0.005350589752197266, 0.006012916564941406, 0.006675243377685547, 0.0073375701904296875, 0.007999897003173828, 0.008662223815917969, 0.00932455062866211, 0.00998687744140625, 0.01064920425415039, 0.011311531066894531, 0.011973857879638672, 0.012636184692382812, 0.013298511505126953, 0.013960838317871094, 0.014623165130615234, 0.015285491943359375, 0.015947818756103516, 0.016610145568847656, 0.017272472381591797, 0.017934799194335938, 0.018597126007080078, 0.01925945281982422, 0.01992177963256836, 0.0205841064453125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 4.0, 0.0, 3.0, 5.0, 4.0, 6.0, 2.0, 13.0, 15.0, 11.0, 20.0, 17.0, 14.0, 23.0, 20.0, 18.0, 30.0, 27.0, 31.0, 32.0, 51.0, 49.0, 46.0, 45.0, 1061.0, 42.0, 41.0, 41.0, 35.0, 42.0, 32.0, 36.0, 32.0, 28.0, 22.0, 16.0, 25.0, 18.0, 13.0, 9.0, 16.0, 8.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.97998046875, -0.9477157592773438, -0.9154510498046875, -0.8831863403320312, -0.850921630859375, -0.8186569213867188, -0.7863922119140625, -0.7541275024414062, -0.72186279296875, -0.6895980834960938, -0.6573333740234375, -0.6250686645507812, -0.592803955078125, -0.5605392456054688, -0.5282745361328125, -0.49600982666015625, -0.4637451171875, -0.43148040771484375, -0.3992156982421875, -0.36695098876953125, -0.334686279296875, -0.30242156982421875, -0.2701568603515625, -0.23789215087890625, -0.20562744140625, -0.17336273193359375, -0.1410980224609375, -0.10883331298828125, -0.076568603515625, -0.04430389404296875, -0.0120391845703125, 0.02022552490234375, 0.052490234375, 0.08475494384765625, 0.1170196533203125, 0.14928436279296875, 0.181549072265625, 0.21381378173828125, 0.2460784912109375, 0.27834320068359375, 0.31060791015625, 0.34287261962890625, 0.3751373291015625, 0.40740203857421875, 0.439666748046875, 0.47193145751953125, 0.5041961669921875, 0.5364608764648438, 0.5687255859375, 0.6009902954101562, 0.6332550048828125, 0.6655197143554688, 0.697784423828125, 0.7300491333007812, 0.7623138427734375, 0.7945785522460938, 0.82684326171875, 0.8591079711914062, 0.8913726806640625, 0.9236373901367188, 0.955902099609375, 0.9881668090820312, 1.0204315185546875, 1.0526962280273438, 1.0849609375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 11.0, 28.0, 25.0, 39.0, 62.0, 109.0, 153.0, 231.0, 326.0, 383.0, 684.0, 969.0, 1480.0, 2228.0, 3402.0, 5230.0, 8127.0, 12528.0, 20118.0, 32612.0, 54585.0, 100946.0, 231085.0, 1334619.0, 122295.0, 63595.0, 37380.0, 23019.0, 14390.0, 9155.0, 5922.0, 3817.0, 2544.0, 1692.0, 1116.0, 682.0, 471.0, 355.0, 230.0, 133.0, 108.0, 74.0, 47.0, 40.0, 20.0, 26.0, 9.0, 9.0, 7.0, 5.0, 0.0, 3.0, 5.0], "bins": [-0.006641387939453125, -0.00644683837890625, -0.006252288818359375, -0.0060577392578125, -0.005863189697265625, -0.00566864013671875, -0.005474090576171875, -0.005279541015625, -0.005084991455078125, -0.00489044189453125, -0.004695892333984375, -0.0045013427734375, -0.004306793212890625, -0.00411224365234375, -0.003917694091796875, -0.00372314453125, -0.003528594970703125, -0.00333404541015625, -0.003139495849609375, -0.0029449462890625, -0.002750396728515625, -0.00255584716796875, -0.002361297607421875, -0.002166748046875, -0.001972198486328125, -0.00177764892578125, -0.001583099365234375, -0.0013885498046875, -0.001194000244140625, -0.00099945068359375, -0.000804901123046875, -0.0006103515625, -0.000415802001953125, -0.00022125244140625, -2.6702880859375e-05, 0.0001678466796875, 0.000362396240234375, 0.00055694580078125, 0.000751495361328125, 0.000946044921875, 0.001140594482421875, 0.00133514404296875, 0.001529693603515625, 0.0017242431640625, 0.001918792724609375, 0.00211334228515625, 0.002307891845703125, 0.00250244140625, 0.002696990966796875, 0.00289154052734375, 0.003086090087890625, 0.0032806396484375, 0.003475189208984375, 0.00366973876953125, 0.003864288330078125, 0.004058837890625, 0.004253387451171875, 0.00444793701171875, 0.004642486572265625, 0.0048370361328125, 0.005031585693359375, 0.00522613525390625, 0.005420684814453125, 0.005615234375, 0.005809783935546875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1005.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [6.0, 1.0, 0.0, 3.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 2222.0, 0.0, 1043919.0, 2264.0, 0.0, 40.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 3.0, 0.0, 2.0, 10.0], "bins": [-1.0728836059570312e-06, -1.039355993270874e-06, -1.0058283805847168e-06, -9.723007678985596e-07, -9.387731552124023e-07, -9.052455425262451e-07, -8.717179298400879e-07, -8.381903171539307e-07, -8.046627044677734e-07, -7.711350917816162e-07, -7.37607479095459e-07, -7.040798664093018e-07, -6.705522537231445e-07, -6.370246410369873e-07, -6.034970283508301e-07, -5.699694156646729e-07, -5.364418029785156e-07, -5.029141902923584e-07, -4.6938657760620117e-07, -4.3585896492004395e-07, -4.023313522338867e-07, -3.688037395477295e-07, -3.3527612686157227e-07, -3.0174851417541504e-07, -2.682209014892578e-07, -2.3469328880310059e-07, -2.0116567611694336e-07, -1.6763806343078613e-07, -1.341104507446289e-07, -1.0058283805847168e-07, -6.705522537231445e-08, -3.3527612686157227e-08, 0.0, 3.3527612686157227e-08, 6.705522537231445e-08, 1.0058283805847168e-07, 1.341104507446289e-07, 1.6763806343078613e-07, 2.0116567611694336e-07, 2.3469328880310059e-07, 2.682209014892578e-07, 3.0174851417541504e-07, 3.3527612686157227e-07, 3.688037395477295e-07, 4.023313522338867e-07, 4.3585896492004395e-07, 4.6938657760620117e-07, 5.029141902923584e-07, 5.364418029785156e-07, 5.699694156646729e-07, 6.034970283508301e-07, 6.370246410369873e-07, 6.705522537231445e-07, 7.040798664093018e-07, 7.37607479095459e-07, 7.711350917816162e-07, 8.046627044677734e-07, 8.381903171539307e-07, 8.717179298400879e-07, 9.052455425262451e-07, 9.387731552124023e-07, 9.723007678985596e-07, 1.0058283805847168e-06, 1.039355993270874e-06, 1.0728836059570312e-06]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 7.0, 4.0, 4.0, 18.0, 14.0, 25.0, 21.0, 20.0, 31.0, 48.0, 49.0, 40.0, 65.0, 68.0, 56.0, 69.0, 63.0, 62.0, 65.0, 53.0, 43.0, 38.0, 40.0, 28.0, 22.0, 10.0, 17.0, 6.0, 10.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0], "bins": [-3.1328125, -3.0621490478515625, -2.991485595703125, -2.9208221435546875, -2.85015869140625, -2.7794952392578125, -2.708831787109375, -2.6381683349609375, -2.5675048828125, -2.4968414306640625, -2.426177978515625, -2.3555145263671875, -2.28485107421875, -2.2141876220703125, -2.143524169921875, -2.0728607177734375, -2.002197265625, -1.9315338134765625, -1.860870361328125, -1.7902069091796875, -1.71954345703125, -1.6488800048828125, -1.578216552734375, -1.5075531005859375, -1.4368896484375, -1.3662261962890625, -1.295562744140625, -1.2248992919921875, -1.15423583984375, -1.0835723876953125, -1.012908935546875, -0.9422454833984375, -0.87158203125, -0.8009185791015625, -0.730255126953125, -0.6595916748046875, -0.58892822265625, -0.5182647705078125, -0.447601318359375, -0.3769378662109375, -0.3062744140625, -0.2356109619140625, -0.164947509765625, -0.0942840576171875, -0.02362060546875, 0.0470428466796875, 0.117706298828125, 0.1883697509765625, 0.259033203125, 0.3296966552734375, 0.400360107421875, 0.4710235595703125, 0.54168701171875, 0.6123504638671875, 0.683013916015625, 0.7536773681640625, 0.8243408203125, 0.8950042724609375, 0.965667724609375, 1.0363311767578125, 1.10699462890625, 1.1776580810546875, 1.248321533203125, 1.3189849853515625, 1.3896484375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 6.0, 7.0, 13.0, 14.0, 19.0, 30.0, 55.0, 75.0, 110.0, 193.0, 329.0, 510.0, 819.0, 1398.0, 2368.0, 4388.0, 8947.0, 22532.0, 128773.0, 746617.0, 93907.0, 19680.0, 8056.0, 4058.0, 2233.0, 1332.0, 792.0, 437.0, 307.0, 182.0, 127.0, 70.0, 48.0, 34.0, 27.0, 16.0, 11.0, 5.0, 6.0, 3.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0], "bins": [-9.8984375, -9.62677001953125, -9.3551025390625, -9.08343505859375, -8.811767578125, -8.54010009765625, -8.2684326171875, -7.99676513671875, -7.72509765625, -7.45343017578125, -7.1817626953125, -6.91009521484375, -6.638427734375, -6.36676025390625, -6.0950927734375, -5.82342529296875, -5.5517578125, -5.28009033203125, -5.0084228515625, -4.73675537109375, -4.465087890625, -4.19342041015625, -3.9217529296875, -3.65008544921875, -3.37841796875, -3.10675048828125, -2.8350830078125, -2.56341552734375, -2.291748046875, -2.02008056640625, -1.7484130859375, -1.47674560546875, -1.205078125, -0.93341064453125, -0.6617431640625, -0.39007568359375, -0.118408203125, 0.15325927734375, 0.4249267578125, 0.69659423828125, 0.96826171875, 1.23992919921875, 1.5115966796875, 1.78326416015625, 2.054931640625, 2.32659912109375, 2.5982666015625, 2.86993408203125, 3.1416015625, 3.41326904296875, 3.6849365234375, 3.95660400390625, 4.228271484375, 4.49993896484375, 4.7716064453125, 5.04327392578125, 5.31494140625, 5.58660888671875, 5.8582763671875, 6.12994384765625, 6.401611328125, 6.67327880859375, 6.9449462890625, 7.21661376953125, 7.48828125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 5.0, 1.0, 7.0, 17.0, 11.0, 12.0, 17.0, 24.0, 26.0, 19.0, 29.0, 25.0, 28.0, 36.0, 30.0, 45.0, 43.0, 73.0, 134.0, 1474.0, 376.0, 144.0, 58.0, 58.0, 52.0, 40.0, 42.0, 29.0, 31.0, 19.0, 19.0, 18.0, 20.0, 20.0, 16.0, 8.0, 8.0, 7.0, 12.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.70703125, -4.5640869140625, -4.421142578125, -4.2781982421875, -4.13525390625, -3.9923095703125, -3.849365234375, -3.7064208984375, -3.5634765625, -3.4205322265625, -3.277587890625, -3.1346435546875, -2.99169921875, -2.8487548828125, -2.705810546875, -2.5628662109375, -2.419921875, -2.2769775390625, -2.134033203125, -1.9910888671875, -1.84814453125, -1.7052001953125, -1.562255859375, -1.4193115234375, -1.2763671875, -1.1334228515625, -0.990478515625, -0.8475341796875, -0.70458984375, -0.5616455078125, -0.418701171875, -0.2757568359375, -0.1328125, 0.0101318359375, 0.153076171875, 0.2960205078125, 0.43896484375, 0.5819091796875, 0.724853515625, 0.8677978515625, 1.0107421875, 1.1536865234375, 1.296630859375, 1.4395751953125, 1.58251953125, 1.7254638671875, 1.868408203125, 2.0113525390625, 2.154296875, 2.2972412109375, 2.440185546875, 2.5831298828125, 2.72607421875, 2.8690185546875, 3.011962890625, 3.1549072265625, 3.2978515625, 3.4407958984375, 3.583740234375, 3.7266845703125, 3.86962890625, 4.0125732421875, 4.155517578125, 4.2984619140625, 4.44140625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 12.0, 7.0, 8.0, 7.0, 10.0, 18.0, 16.0, 12.0, 19.0, 21.0, 22.0, 24.0, 42.0, 45.0, 65.0, 107.0, 213.0, 723.0, 9179.0, 3094224.0, 39200.0, 965.0, 284.0, 113.0, 73.0, 54.0, 28.0, 25.0, 22.0, 23.0, 25.0, 23.0, 20.0, 16.0, 8.0, 14.0, 11.0, 5.0, 2.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.734375, -19.068359375, -18.40234375, -17.736328125, -17.0703125, -16.404296875, -15.73828125, -15.072265625, -14.40625, -13.740234375, -13.07421875, -12.408203125, -11.7421875, -11.076171875, -10.41015625, -9.744140625, -9.078125, -8.412109375, -7.74609375, -7.080078125, -6.4140625, -5.748046875, -5.08203125, -4.416015625, -3.75, -3.083984375, -2.41796875, -1.751953125, -1.0859375, -0.419921875, 0.24609375, 0.912109375, 1.578125, 2.244140625, 2.91015625, 3.576171875, 4.2421875, 4.908203125, 5.57421875, 6.240234375, 6.90625, 7.572265625, 8.23828125, 8.904296875, 9.5703125, 10.236328125, 10.90234375, 11.568359375, 12.234375, 12.900390625, 13.56640625, 14.232421875, 14.8984375, 15.564453125, 16.23046875, 16.896484375, 17.5625, 18.228515625, 18.89453125, 19.560546875, 20.2265625, 20.892578125, 21.55859375, 22.224609375, 22.890625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 197.0, 784.0, 33.0, 1.0, 1.0, 0.0, 1.0], "bins": [-141.17442321777344, -138.7506103515625, -136.3267822265625, -133.90296936035156, -131.47914123535156, -129.05532836914062, -126.63150024414062, -124.20768737792969, -121.78385925292969, -119.36003875732422, -116.93621826171875, -114.51239776611328, -112.08857727050781, -109.66475677490234, -107.24093627929688, -104.81712341308594, -102.39330291748047, -99.969482421875, -97.54566192626953, -95.12184143066406, -92.6980209350586, -90.27420043945312, -87.85037994384766, -85.42655944824219, -83.00274658203125, -80.57892608642578, -78.15510559082031, -75.73128509521484, -73.30746459960938, -70.8836441040039, -68.45982360839844, -66.0360107421875, -63.612186431884766, -61.1883659362793, -58.76454544067383, -56.34072494506836, -53.916908264160156, -51.49308776855469, -49.06926727294922, -46.64544677734375, -44.22162628173828, -41.79780578613281, -39.373985290527344, -36.950164794921875, -34.526344299316406, -32.10252380371094, -29.678707122802734, -27.254886627197266, -24.831066131591797, -22.407245635986328, -19.98342514038086, -17.559606552124023, -15.135786056518555, -12.711965560913086, -10.288146018981934, -7.864326477050781, -5.440506935119629, -3.0166869163513184, -0.5928668975830078, 1.8309531211853027, 4.254773139953613, 6.678593635559082, 9.102413177490234, 11.526232719421387, 13.950053215026855]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 9.0, 3.0, 5.0, 7.0, 17.0, 15.0, 32.0, 19.0, 26.0, 19.0, 23.0, 30.0, 35.0, 31.0, 32.0, 36.0, 44.0, 34.0, 47.0, 35.0, 42.0, 42.0, 45.0, 36.0, 27.0, 32.0, 35.0, 31.0, 31.0, 22.0, 22.0, 24.0, 20.0, 16.0, 15.0, 9.0, 10.0, 12.0, 7.0, 8.0, 5.0, 1.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.92745590209961, -16.432964324951172, -15.938474655151367, -15.443984031677246, -14.949493408203125, -14.455002784729004, -13.960512161254883, -13.466020584106445, -12.97153091430664, -12.47704029083252, -11.982549667358398, -11.488059043884277, -10.993568420410156, -10.499077796936035, -10.004587173461914, -9.510095596313477, -9.015604972839355, -8.521114349365234, -8.026623725891113, -7.532133102416992, -7.037642478942871, -6.54315185546875, -6.048660755157471, -5.55417013168335, -5.0596795082092285, -4.565188884735107, -4.070698261260986, -3.576207399368286, -3.081716775894165, -2.587226152420044, -2.0927352905273438, -1.5982446670532227, -1.1037540435791016, -0.6092633605003357, -0.11477267742156982, 0.3797180652618408, 0.8742086887359619, 1.368699312210083, 1.8631901741027832, 2.3576807975769043, 2.8521714210510254, 3.3466620445251465, 3.8411526679992676, 4.335643768310547, 4.830134391784668, 5.324625015258789, 5.81911563873291, 6.313606262207031, 6.808096885681152, 7.302587509155273, 7.7970781326293945, 8.291568756103516, 8.786059379577637, 9.280550003051758, 9.775041580200195, 10.26953125, 10.764022827148438, 11.258513450622559, 11.75300407409668, 12.2474946975708, 12.741985321044922, 13.236475944519043, 13.730966567993164, 14.225458145141602, 14.719947814941406]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 6.0, 14.0, 12.0, 24.0, 18.0, 22.0, 15.0, 42.0, 42.0, 48.0, 58.0, 61.0, 57.0, 55.0, 70.0, 70.0, 68.0, 52.0, 51.0, 37.0, 44.0, 35.0, 22.0, 20.0, 16.0, 11.0, 12.0, 5.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0], "bins": [-3.15234375, -3.080780029296875, -3.00921630859375, -2.937652587890625, -2.8660888671875, -2.794525146484375, -2.72296142578125, -2.651397705078125, -2.579833984375, -2.508270263671875, -2.43670654296875, -2.365142822265625, -2.2935791015625, -2.222015380859375, -2.15045166015625, -2.078887939453125, -2.00732421875, -1.935760498046875, -1.86419677734375, -1.792633056640625, -1.7210693359375, -1.649505615234375, -1.57794189453125, -1.506378173828125, -1.434814453125, -1.363250732421875, -1.29168701171875, -1.220123291015625, -1.1485595703125, -1.076995849609375, -1.00543212890625, -0.933868408203125, -0.8623046875, -0.790740966796875, -0.71917724609375, -0.647613525390625, -0.5760498046875, -0.504486083984375, -0.43292236328125, -0.361358642578125, -0.289794921875, -0.218231201171875, -0.14666748046875, -0.075103759765625, -0.0035400390625, 0.068023681640625, 0.13958740234375, 0.211151123046875, 0.28271484375, 0.354278564453125, 0.42584228515625, 0.497406005859375, 0.5689697265625, 0.640533447265625, 0.71209716796875, 0.783660888671875, 0.855224609375, 0.926788330078125, 0.99835205078125, 1.069915771484375, 1.1414794921875, 1.213043212890625, 1.28460693359375, 1.356170654296875, 1.427734375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 8.0, 8.0, 5.0, 17.0, 17.0, 38.0, 31.0, 61.0, 92.0, 162.0, 315.0, 552.0, 1474.0, 7353.0, 115096.0, 3709689.0, 341748.0, 13941.0, 2092.0, 704.0, 353.0, 197.0, 120.0, 78.0, 40.0, 25.0, 33.0, 18.0, 8.0, 3.0, 2.0, 6.0, 5.0, 3.0, 1.0, 1.0], "bins": [-20.015625, -19.5570068359375, -19.098388671875, -18.6397705078125, -18.18115234375, -17.7225341796875, -17.263916015625, -16.8052978515625, -16.3466796875, -15.8880615234375, -15.429443359375, -14.9708251953125, -14.51220703125, -14.0535888671875, -13.594970703125, -13.1363525390625, -12.677734375, -12.2191162109375, -11.760498046875, -11.3018798828125, -10.84326171875, -10.3846435546875, -9.926025390625, -9.4674072265625, -9.0087890625, -8.5501708984375, -8.091552734375, -7.6329345703125, -7.17431640625, -6.7156982421875, -6.257080078125, -5.7984619140625, -5.33984375, -4.8812255859375, -4.422607421875, -3.9639892578125, -3.50537109375, -3.0467529296875, -2.588134765625, -2.1295166015625, -1.6708984375, -1.2122802734375, -0.753662109375, -0.2950439453125, 0.16357421875, 0.6221923828125, 1.080810546875, 1.5394287109375, 1.998046875, 2.4566650390625, 2.915283203125, 3.3739013671875, 3.83251953125, 4.2911376953125, 4.749755859375, 5.2083740234375, 5.6669921875, 6.1256103515625, 6.584228515625, 7.0428466796875, 7.50146484375, 7.9600830078125, 8.418701171875, 8.8773193359375, 9.3359375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 4.0, 6.0, 16.0, 29.0, 21.0, 57.0, 75.0, 160.0, 235.0, 375.0, 573.0, 760.0, 631.0, 420.0, 290.0, 179.0, 104.0, 63.0, 30.0, 12.0, 15.0, 1.0, 6.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.78125, -8.494384765625, -8.20751953125, -7.920654296875, -7.6337890625, -7.346923828125, -7.06005859375, -6.773193359375, -6.486328125, -6.199462890625, -5.91259765625, -5.625732421875, -5.3388671875, -5.052001953125, -4.76513671875, -4.478271484375, -4.19140625, -3.904541015625, -3.61767578125, -3.330810546875, -3.0439453125, -2.757080078125, -2.47021484375, -2.183349609375, -1.896484375, -1.609619140625, -1.32275390625, -1.035888671875, -0.7490234375, -0.462158203125, -0.17529296875, 0.111572265625, 0.3984375, 0.685302734375, 0.97216796875, 1.259033203125, 1.5458984375, 1.832763671875, 2.11962890625, 2.406494140625, 2.693359375, 2.980224609375, 3.26708984375, 3.553955078125, 3.8408203125, 4.127685546875, 4.41455078125, 4.701416015625, 4.98828125, 5.275146484375, 5.56201171875, 5.848876953125, 6.1357421875, 6.422607421875, 6.70947265625, 6.996337890625, 7.283203125, 7.570068359375, 7.85693359375, 8.143798828125, 8.4306640625, 8.717529296875, 9.00439453125, 9.291259765625, 9.578125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 4.0, 9.0, 13.0, 12.0, 29.0, 29.0, 38.0, 68.0, 93.0, 150.0, 276.0, 541.0, 1037.0, 2743.0, 14790.0, 260557.0, 3580244.0, 311548.0, 16687.0, 2978.0, 1072.0, 569.0, 291.0, 188.0, 102.0, 85.0, 44.0, 28.0, 22.0, 18.0, 9.0, 7.0, 6.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.421875, -15.84619140625, -15.2705078125, -14.69482421875, -14.119140625, -13.54345703125, -12.9677734375, -12.39208984375, -11.81640625, -11.24072265625, -10.6650390625, -10.08935546875, -9.513671875, -8.93798828125, -8.3623046875, -7.78662109375, -7.2109375, -6.63525390625, -6.0595703125, -5.48388671875, -4.908203125, -4.33251953125, -3.7568359375, -3.18115234375, -2.60546875, -2.02978515625, -1.4541015625, -0.87841796875, -0.302734375, 0.27294921875, 0.8486328125, 1.42431640625, 2.0, 2.57568359375, 3.1513671875, 3.72705078125, 4.302734375, 4.87841796875, 5.4541015625, 6.02978515625, 6.60546875, 7.18115234375, 7.7568359375, 8.33251953125, 8.908203125, 9.48388671875, 10.0595703125, 10.63525390625, 11.2109375, 11.78662109375, 12.3623046875, 12.93798828125, 13.513671875, 14.08935546875, 14.6650390625, 15.24072265625, 15.81640625, 16.39208984375, 16.9677734375, 17.54345703125, 18.119140625, 18.69482421875, 19.2705078125, 19.84619140625, 20.421875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 10.0, 32.0, 162.0, 313.0, 323.0, 133.0, 34.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.589736938476562, -16.253463745117188, -13.91718864440918, -11.580914497375488, -9.244640350341797, -6.9083662033081055, -4.572092056274414, -2.2358169555664062, 0.10045623779296875, 2.43673038482666, 4.773004531860352, 7.109278678894043, 9.445552825927734, 11.781826972961426, 14.118101119995117, 16.454376220703125, 18.7906494140625, 21.126922607421875, 23.463197708129883, 25.79947280883789, 28.135746002197266, 30.47201919555664, 32.80829620361328, 35.144569396972656, 37.48084259033203, 39.817115783691406, 42.15338897705078, 44.48966598510742, 46.8259391784668, 49.16221237182617, 51.49848937988281, 53.83476257324219, 56.17103576660156, 58.50730895996094, 60.84358215332031, 63.17985916137695, 65.51612854003906, 67.85240936279297, 70.18868255615234, 72.52495574951172, 74.8612289428711, 77.19750213623047, 79.53377532958984, 81.87004852294922, 84.20632934570312, 86.5426025390625, 88.87887573242188, 91.21514892578125, 93.55142211914062, 95.8876953125, 98.22396850585938, 100.56024169921875, 102.89651489257812, 105.23279571533203, 107.5690689086914, 109.90534210205078, 112.24161529541016, 114.57788848876953, 116.9141616821289, 119.25043487548828, 121.58671569824219, 123.92298889160156, 126.25926208496094, 128.5955352783203, 130.9318084716797]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 8.0, 9.0, 6.0, 10.0, 17.0, 10.0, 26.0, 10.0, 20.0, 21.0, 22.0, 35.0, 26.0, 34.0, 32.0, 34.0, 33.0, 54.0, 39.0, 34.0, 37.0, 34.0, 40.0, 36.0, 40.0, 35.0, 36.0, 28.0, 33.0, 24.0, 21.0, 18.0, 17.0, 15.0, 17.0, 16.0, 11.0, 8.0, 14.0, 6.0, 9.0, 5.0, 3.0, 5.0, 4.0, 1.0, 2.0, 3.0, 3.0], "bins": [-20.789962768554688, -20.206619262695312, -19.623275756835938, -19.03993034362793, -18.456586837768555, -17.87324333190918, -17.289897918701172, -16.706554412841797, -16.123210906982422, -15.539867401123047, -14.956522941589355, -14.373178482055664, -13.789834976196289, -13.206491470336914, -12.623147010803223, -12.039802551269531, -11.456459045410156, -10.873115539550781, -10.28977108001709, -9.706426620483398, -9.123083114624023, -8.539739608764648, -7.956395149230957, -7.373051166534424, -6.789707183837891, -6.206363201141357, -5.623019218444824, -5.039675235748291, -4.456331253051758, -3.8729872703552246, -3.2896432876586914, -2.706299304962158, -2.122955322265625, -1.5396113395690918, -0.9562673568725586, -0.3729233741760254, 0.2104206085205078, 0.793764591217041, 1.3771085739135742, 1.9604525566101074, 2.5437965393066406, 3.127140522003174, 3.710484504699707, 4.29382848739624, 4.877172470092773, 5.460516452789307, 6.04386043548584, 6.627204418182373, 7.210548400878906, 7.7938923835754395, 8.377236366271973, 8.960580825805664, 9.543924331665039, 10.127267837524414, 10.710612297058105, 11.293956756591797, 11.877300262451172, 12.460643768310547, 13.043988227844238, 13.62733268737793, 14.210676193237305, 14.79401969909668, 15.377364158630371, 15.960708618164062, 16.544052124023438]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 10.0, 12.0, 12.0, 16.0, 25.0, 25.0, 38.0, 35.0, 37.0, 43.0, 43.0, 69.0, 64.0, 67.0, 59.0, 62.0, 67.0, 55.0, 39.0, 42.0, 41.0, 29.0, 24.0, 16.0, 20.0, 13.0, 8.0, 5.0, 10.0, 2.0, 3.0, 4.0, 0.0, 0.0, 4.0], "bins": [-3.064453125, -2.99285888671875, -2.9212646484375, -2.84967041015625, -2.778076171875, -2.70648193359375, -2.6348876953125, -2.56329345703125, -2.49169921875, -2.42010498046875, -2.3485107421875, -2.27691650390625, -2.205322265625, -2.13372802734375, -2.0621337890625, -1.99053955078125, -1.9189453125, -1.84735107421875, -1.7757568359375, -1.70416259765625, -1.632568359375, -1.56097412109375, -1.4893798828125, -1.41778564453125, -1.34619140625, -1.27459716796875, -1.2030029296875, -1.13140869140625, -1.059814453125, -0.98822021484375, -0.9166259765625, -0.84503173828125, -0.7734375, -0.70184326171875, -0.6302490234375, -0.55865478515625, -0.487060546875, -0.41546630859375, -0.3438720703125, -0.27227783203125, -0.20068359375, -0.12908935546875, -0.0574951171875, 0.01409912109375, 0.085693359375, 0.15728759765625, 0.2288818359375, 0.30047607421875, 0.3720703125, 0.44366455078125, 0.5152587890625, 0.58685302734375, 0.658447265625, 0.73004150390625, 0.8016357421875, 0.87322998046875, 0.94482421875, 1.01641845703125, 1.0880126953125, 1.15960693359375, 1.231201171875, 1.30279541015625, 1.3743896484375, 1.44598388671875, 1.517578125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 5.0, 12.0, 14.0, 18.0, 29.0, 48.0, 85.0, 144.0, 277.0, 450.0, 980.0, 1990.0, 4413.0, 10226.0, 24121.0, 61967.0, 190593.0, 522948.0, 144393.0, 50174.0, 19938.0, 8507.0, 3760.0, 1698.0, 797.0, 428.0, 220.0, 123.0, 67.0, 48.0, 18.0, 16.0, 15.0, 4.0, 5.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.023162841796875, -0.02250838279724121, -0.021853923797607422, -0.021199464797973633, -0.020545005798339844, -0.019890546798706055, -0.019236087799072266, -0.018581628799438477, -0.017927169799804688, -0.0172727108001709, -0.01661825180053711, -0.01596379280090332, -0.015309333801269531, -0.014654874801635742, -0.014000415802001953, -0.013345956802368164, -0.012691497802734375, -0.012037038803100586, -0.011382579803466797, -0.010728120803833008, -0.010073661804199219, -0.00941920280456543, -0.00876474380493164, -0.008110284805297852, -0.0074558258056640625, -0.0068013668060302734, -0.006146907806396484, -0.005492448806762695, -0.004837989807128906, -0.004183530807495117, -0.003529071807861328, -0.002874612808227539, -0.00222015380859375, -0.001565694808959961, -0.0009112358093261719, -0.0002567768096923828, 0.00039768218994140625, 0.0010521411895751953, 0.0017066001892089844, 0.0023610591888427734, 0.0030155181884765625, 0.0036699771881103516, 0.004324436187744141, 0.00497889518737793, 0.005633354187011719, 0.006287813186645508, 0.006942272186279297, 0.007596731185913086, 0.008251190185546875, 0.008905649185180664, 0.009560108184814453, 0.010214567184448242, 0.010869026184082031, 0.01152348518371582, 0.01217794418334961, 0.012832403182983398, 0.013486862182617188, 0.014141321182250977, 0.014795780181884766, 0.015450239181518555, 0.016104698181152344, 0.016759157180786133, 0.017413616180419922, 0.01806807518005371, 0.0187225341796875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 4.0, 4.0, 10.0, 7.0, 13.0, 8.0, 21.0, 25.0, 12.0, 17.0, 25.0, 30.0, 31.0, 34.0, 33.0, 27.0, 28.0, 49.0, 41.0, 49.0, 1061.0, 48.0, 42.0, 33.0, 41.0, 25.0, 33.0, 34.0, 31.0, 32.0, 30.0, 30.0, 15.0, 20.0, 11.0, 13.0, 15.0, 5.0, 7.0, 11.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0], "bins": [-1.1044921875, -1.0704803466796875, -1.036468505859375, -1.0024566650390625, -0.96844482421875, -0.9344329833984375, -0.900421142578125, -0.8664093017578125, -0.8323974609375, -0.7983856201171875, -0.764373779296875, -0.7303619384765625, -0.69635009765625, -0.6623382568359375, -0.628326416015625, -0.5943145751953125, -0.560302734375, -0.5262908935546875, -0.492279052734375, -0.4582672119140625, -0.42425537109375, -0.3902435302734375, -0.356231689453125, -0.3222198486328125, -0.2882080078125, -0.2541961669921875, -0.220184326171875, -0.1861724853515625, -0.15216064453125, -0.1181488037109375, -0.084136962890625, -0.0501251220703125, -0.01611328125, 0.0178985595703125, 0.051910400390625, 0.0859222412109375, 0.11993408203125, 0.1539459228515625, 0.187957763671875, 0.2219696044921875, 0.2559814453125, 0.2899932861328125, 0.324005126953125, 0.3580169677734375, 0.39202880859375, 0.4260406494140625, 0.460052490234375, 0.4940643310546875, 0.528076171875, 0.5620880126953125, 0.596099853515625, 0.6301116943359375, 0.66412353515625, 0.6981353759765625, 0.732147216796875, 0.7661590576171875, 0.8001708984375, 0.8341827392578125, 0.868194580078125, 0.9022064208984375, 0.93621826171875, 0.9702301025390625, 1.004241943359375, 1.0382537841796875, 1.072265625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 6.0, 0.0, 1.0, 7.0, 5.0, 6.0, 19.0, 35.0, 42.0, 58.0, 71.0, 142.0, 201.0, 291.0, 394.0, 648.0, 994.0, 1505.0, 2182.0, 3416.0, 5195.0, 8100.0, 13052.0, 20452.0, 32921.0, 54282.0, 92404.0, 202912.0, 1345625.0, 129312.0, 69463.0, 42111.0, 25838.0, 16266.0, 10303.0, 6585.0, 4212.0, 2731.0, 1811.0, 1121.0, 802.0, 558.0, 358.0, 219.0, 125.0, 117.0, 93.0, 51.0, 37.0, 25.0, 9.0, 8.0, 14.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006343841552734375, -0.0061408281326293945, -0.005937814712524414, -0.005734801292419434, -0.005531787872314453, -0.005328774452209473, -0.005125761032104492, -0.004922747611999512, -0.004719734191894531, -0.004516720771789551, -0.00431370735168457, -0.00411069393157959, -0.003907680511474609, -0.003704667091369629, -0.0035016536712646484, -0.003298640251159668, -0.0030956268310546875, -0.002892613410949707, -0.0026895999908447266, -0.002486586570739746, -0.0022835731506347656, -0.002080559730529785, -0.0018775463104248047, -0.0016745328903198242, -0.0014715194702148438, -0.0012685060501098633, -0.0010654926300048828, -0.0008624792098999023, -0.0006594657897949219, -0.0004564523696899414, -0.00025343894958496094, -5.042552947998047e-05, 0.000152587890625, 0.00035560131072998047, 0.0005586147308349609, 0.0007616281509399414, 0.0009646415710449219, 0.0011676549911499023, 0.0013706684112548828, 0.0015736818313598633, 0.0017766952514648438, 0.0019797086715698242, 0.0021827220916748047, 0.002385735511779785, 0.0025887489318847656, 0.002791762351989746, 0.0029947757720947266, 0.003197789192199707, 0.0034008026123046875, 0.003603816032409668, 0.0038068294525146484, 0.004009842872619629, 0.004212856292724609, 0.00441586971282959, 0.00461888313293457, 0.004821896553039551, 0.005024909973144531, 0.005227923393249512, 0.005430936813354492, 0.005633950233459473, 0.005836963653564453, 0.006039977073669434, 0.006242990493774414, 0.0064460039138793945, 0.006649017333984375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [18.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 990.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 0.0, 13.0, 0.0, 29.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.0, 0.0, 486.0, 0.0, 7355.0, 0.0, 1032694.0, 0.0, 7334.0, 0.0, 505.0, 0.0, 45.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 28.0, 0.0, 10.0, 0.0, 6.0, 4.0], "bins": [-9.5367431640625e-07, -9.238719940185547e-07, -8.940696716308594e-07, -8.642673492431641e-07, -8.344650268554688e-07, -8.046627044677734e-07, -7.748603820800781e-07, -7.450580596923828e-07, -7.152557373046875e-07, -6.854534149169922e-07, -6.556510925292969e-07, -6.258487701416016e-07, -5.960464477539062e-07, -5.662441253662109e-07, -5.364418029785156e-07, -5.066394805908203e-07, -4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07, 8.642673492431641e-07, 8.940696716308594e-07, 9.238719940185547e-07, 9.5367431640625e-07]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 10.0, 12.0, 12.0, 16.0, 25.0, 25.0, 38.0, 35.0, 37.0, 43.0, 43.0, 69.0, 64.0, 67.0, 59.0, 62.0, 67.0, 55.0, 39.0, 42.0, 41.0, 29.0, 24.0, 16.0, 20.0, 13.0, 8.0, 5.0, 10.0, 2.0, 3.0, 4.0, 0.0, 0.0, 4.0], "bins": [-3.064453125, -2.99285888671875, -2.9212646484375, -2.84967041015625, -2.778076171875, -2.70648193359375, -2.6348876953125, -2.56329345703125, -2.49169921875, -2.42010498046875, -2.3485107421875, -2.27691650390625, -2.205322265625, -2.13372802734375, -2.0621337890625, -1.99053955078125, -1.9189453125, -1.84735107421875, -1.7757568359375, -1.70416259765625, -1.632568359375, -1.56097412109375, -1.4893798828125, -1.41778564453125, -1.34619140625, -1.27459716796875, -1.2030029296875, -1.13140869140625, -1.059814453125, -0.98822021484375, -0.9166259765625, -0.84503173828125, -0.7734375, -0.70184326171875, -0.6302490234375, -0.55865478515625, -0.487060546875, -0.41546630859375, -0.3438720703125, -0.27227783203125, -0.20068359375, -0.12908935546875, -0.0574951171875, 0.01409912109375, 0.085693359375, 0.15728759765625, 0.2288818359375, 0.30047607421875, 0.3720703125, 0.44366455078125, 0.5152587890625, 0.58685302734375, 0.658447265625, 0.73004150390625, 0.8016357421875, 0.87322998046875, 0.94482421875, 1.01641845703125, 1.0880126953125, 1.15960693359375, 1.231201171875, 1.30279541015625, 1.3743896484375, 1.44598388671875, 1.517578125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 8.0, 8.0, 15.0, 24.0, 41.0, 57.0, 93.0, 157.0, 272.0, 451.0, 959.0, 1876.0, 4531.0, 14526.0, 58368.0, 308742.0, 528354.0, 96148.0, 22376.0, 6573.0, 2444.0, 1158.0, 540.0, 328.0, 217.0, 117.0, 63.0, 41.0, 31.0, 14.0, 10.0, 9.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.59765625, -2.5295867919921875, -2.461517333984375, -2.3934478759765625, -2.32537841796875, -2.2573089599609375, -2.189239501953125, -2.1211700439453125, -2.0531005859375, -1.9850311279296875, -1.916961669921875, -1.8488922119140625, -1.78082275390625, -1.7127532958984375, -1.644683837890625, -1.5766143798828125, -1.508544921875, -1.4404754638671875, -1.372406005859375, -1.3043365478515625, -1.23626708984375, -1.1681976318359375, -1.100128173828125, -1.0320587158203125, -0.9639892578125, -0.8959197998046875, -0.827850341796875, -0.7597808837890625, -0.69171142578125, -0.6236419677734375, -0.555572509765625, -0.4875030517578125, -0.41943359375, -0.3513641357421875, -0.283294677734375, -0.2152252197265625, -0.14715576171875, -0.0790863037109375, -0.011016845703125, 0.0570526123046875, 0.1251220703125, 0.1931915283203125, 0.261260986328125, 0.3293304443359375, 0.39739990234375, 0.4654693603515625, 0.533538818359375, 0.6016082763671875, 0.669677734375, 0.7377471923828125, 0.805816650390625, 0.8738861083984375, 0.94195556640625, 1.0100250244140625, 1.078094482421875, 1.1461639404296875, 1.2142333984375, 1.2823028564453125, 1.350372314453125, 1.4184417724609375, 1.48651123046875, 1.5545806884765625, 1.622650146484375, 1.6907196044921875, 1.7587890625]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 7.0, 7.0, 7.0, 10.0, 9.0, 13.0, 21.0, 19.0, 17.0, 25.0, 22.0, 23.0, 29.0, 35.0, 33.0, 32.0, 51.0, 57.0, 89.0, 371.0, 1608.0, 103.0, 44.0, 46.0, 47.0, 39.0, 41.0, 40.0, 25.0, 38.0, 20.0, 32.0, 9.0, 13.0, 20.0, 12.0, 10.0, 9.0, 7.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08984375, -4.9150390625, -4.740234375, -4.5654296875, -4.390625, -4.2158203125, -4.041015625, -3.8662109375, -3.69140625, -3.5166015625, -3.341796875, -3.1669921875, -2.9921875, -2.8173828125, -2.642578125, -2.4677734375, -2.29296875, -2.1181640625, -1.943359375, -1.7685546875, -1.59375, -1.4189453125, -1.244140625, -1.0693359375, -0.89453125, -0.7197265625, -0.544921875, -0.3701171875, -0.1953125, -0.0205078125, 0.154296875, 0.3291015625, 0.50390625, 0.6787109375, 0.853515625, 1.0283203125, 1.203125, 1.3779296875, 1.552734375, 1.7275390625, 1.90234375, 2.0771484375, 2.251953125, 2.4267578125, 2.6015625, 2.7763671875, 2.951171875, 3.1259765625, 3.30078125, 3.4755859375, 3.650390625, 3.8251953125, 4.0, 4.1748046875, 4.349609375, 4.5244140625, 4.69921875, 4.8740234375, 5.048828125, 5.2236328125, 5.3984375, 5.5732421875, 5.748046875, 5.9228515625, 6.09765625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 6.0, 4.0, 9.0, 8.0, 12.0, 21.0, 10.0, 11.0, 19.0, 20.0, 27.0, 37.0, 39.0, 39.0, 79.0, 72.0, 136.0, 224.0, 537.0, 1478.0, 14793.0, 3044403.0, 79553.0, 2659.0, 671.0, 280.0, 129.0, 91.0, 73.0, 48.0, 38.0, 23.0, 25.0, 20.0, 15.0, 21.0, 13.0, 21.0, 10.0, 6.0, 9.0, 5.0, 5.0, 8.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.546875, -11.2138671875, -10.880859375, -10.5478515625, -10.21484375, -9.8818359375, -9.548828125, -9.2158203125, -8.8828125, -8.5498046875, -8.216796875, -7.8837890625, -7.55078125, -7.2177734375, -6.884765625, -6.5517578125, -6.21875, -5.8857421875, -5.552734375, -5.2197265625, -4.88671875, -4.5537109375, -4.220703125, -3.8876953125, -3.5546875, -3.2216796875, -2.888671875, -2.5556640625, -2.22265625, -1.8896484375, -1.556640625, -1.2236328125, -0.890625, -0.5576171875, -0.224609375, 0.1083984375, 0.44140625, 0.7744140625, 1.107421875, 1.4404296875, 1.7734375, 2.1064453125, 2.439453125, 2.7724609375, 3.10546875, 3.4384765625, 3.771484375, 4.1044921875, 4.4375, 4.7705078125, 5.103515625, 5.4365234375, 5.76953125, 6.1025390625, 6.435546875, 6.7685546875, 7.1015625, 7.4345703125, 7.767578125, 8.1005859375, 8.43359375, 8.7666015625, 9.099609375, 9.4326171875, 9.765625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 19.0, 375.0, 598.0, 23.0, 0.0, 0.0, 2.0], "bins": [-67.957275390625, -66.80784606933594, -65.65841674804688, -64.50898742675781, -63.35955810546875, -62.21012878417969, -61.060699462890625, -59.91127014160156, -58.7618408203125, -57.61241149902344, -56.462982177734375, -55.31355285644531, -54.16412353515625, -53.01469421386719, -51.865264892578125, -50.71583557128906, -49.56640625, -48.41697692871094, -47.267547607421875, -46.11811828613281, -44.96868896484375, -43.81925964355469, -42.669830322265625, -41.52040100097656, -40.370967864990234, -39.22153854370117, -38.07210922241211, -36.92267990112305, -35.773250579833984, -34.62382125854492, -33.47439193725586, -32.3249626159668, -31.175533294677734, -30.026103973388672, -28.87667465209961, -27.727245330810547, -26.577816009521484, -25.428386688232422, -24.27895736694336, -23.129528045654297, -21.980098724365234, -20.830669403076172, -19.68124008178711, -18.531810760498047, -17.382381439208984, -16.232952117919922, -15.083521842956543, -13.93409252166748, -12.784662246704102, -11.635232925415039, -10.485803604125977, -9.336374282836914, -8.186944961547852, -7.037515163421631, -5.88808536529541, -4.738656044006348, -3.589226722717285, -2.4397974014282227, -1.290367841720581, -0.14093828201293945, 1.008491039276123, 2.1579203605651855, 3.3073501586914062, 4.456779479980469, 5.606208801269531]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 7.0, 8.0, 10.0, 6.0, 8.0, 13.0, 25.0, 20.0, 23.0, 18.0, 21.0, 32.0, 34.0, 33.0, 37.0, 40.0, 44.0, 44.0, 39.0, 41.0, 35.0, 36.0, 43.0, 39.0, 41.0, 40.0, 33.0, 40.0, 38.0, 25.0, 21.0, 21.0, 17.0, 16.0, 15.0, 13.0, 10.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-20.0784969329834, -19.500879287719727, -18.923263549804688, -18.345645904541016, -17.768030166625977, -17.190412521362305, -16.612796783447266, -16.035179138183594, -15.457562446594238, -14.879945755004883, -14.302329063415527, -13.724712371826172, -13.1470947265625, -12.569478988647461, -11.991861343383789, -11.414244651794434, -10.836627960205078, -10.259011268615723, -9.681394577026367, -9.103777885437012, -8.526161193847656, -7.948544025421143, -7.370926856994629, -6.793310165405273, -6.215693473815918, -5.6380767822265625, -5.060460090637207, -4.482842922210693, -3.905226230621338, -3.3276095390319824, -2.749992609024048, -2.1723756790161133, -1.594757080078125, -1.01714026927948, -0.43952345848083496, 0.13809335231781006, 0.7157101631164551, 1.2933268547058105, 1.8709437847137451, 2.4485607147216797, 3.026177406311035, 3.6037940979003906, 4.181410789489746, 4.75902795791626, 5.336644649505615, 5.914261341094971, 6.491878509521484, 7.06949520111084, 7.647111892700195, 8.22472858428955, 8.802345275878906, 9.379961967468262, 9.957578659057617, 10.535196304321289, 11.112812995910645, 11.6904296875, 12.268046379089355, 12.845663070678711, 13.423279762268066, 14.000896453857422, 14.578514099121094, 15.156129837036133, 15.733747482299805, 16.311363220214844, 16.888980865478516]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 8.0, 4.0, 10.0, 7.0, 16.0, 13.0, 17.0, 31.0, 30.0, 31.0, 41.0, 28.0, 46.0, 53.0, 65.0, 68.0, 54.0, 64.0, 70.0, 63.0, 48.0, 37.0, 47.0, 36.0, 25.0, 25.0, 14.0, 19.0, 13.0, 4.0, 8.0, 9.0, 1.0, 5.0, 1.0, 0.0, 1.0, 3.0], "bins": [-3.08203125, -3.0094451904296875, -2.936859130859375, -2.8642730712890625, -2.79168701171875, -2.7191009521484375, -2.646514892578125, -2.5739288330078125, -2.5013427734375, -2.4287567138671875, -2.356170654296875, -2.2835845947265625, -2.21099853515625, -2.1384124755859375, -2.065826416015625, -1.9932403564453125, -1.920654296875, -1.8480682373046875, -1.775482177734375, -1.7028961181640625, -1.63031005859375, -1.5577239990234375, -1.485137939453125, -1.4125518798828125, -1.3399658203125, -1.2673797607421875, -1.194793701171875, -1.1222076416015625, -1.04962158203125, -0.9770355224609375, -0.904449462890625, -0.8318634033203125, -0.75927734375, -0.6866912841796875, -0.614105224609375, -0.5415191650390625, -0.46893310546875, -0.3963470458984375, -0.323760986328125, -0.2511749267578125, -0.1785888671875, -0.1060028076171875, -0.033416748046875, 0.0391693115234375, 0.11175537109375, 0.1843414306640625, 0.256927490234375, 0.3295135498046875, 0.402099609375, 0.4746856689453125, 0.547271728515625, 0.6198577880859375, 0.69244384765625, 0.7650299072265625, 0.837615966796875, 0.9102020263671875, 0.9827880859375, 1.0553741455078125, 1.127960205078125, 1.2005462646484375, 1.27313232421875, 1.3457183837890625, 1.418304443359375, 1.4908905029296875, 1.5634765625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 10.0, 15.0, 25.0, 29.0, 27.0, 42.0, 60.0, 82.0, 174.0, 237.0, 595.0, 1720.0, 9327.0, 87901.0, 2223289.0, 1786588.0, 73295.0, 8084.0, 1585.0, 544.0, 219.0, 140.0, 88.0, 62.0, 37.0, 32.0, 18.0, 16.0, 10.0, 8.0, 4.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-12.921875, -12.6064453125, -12.291015625, -11.9755859375, -11.66015625, -11.3447265625, -11.029296875, -10.7138671875, -10.3984375, -10.0830078125, -9.767578125, -9.4521484375, -9.13671875, -8.8212890625, -8.505859375, -8.1904296875, -7.875, -7.5595703125, -7.244140625, -6.9287109375, -6.61328125, -6.2978515625, -5.982421875, -5.6669921875, -5.3515625, -5.0361328125, -4.720703125, -4.4052734375, -4.08984375, -3.7744140625, -3.458984375, -3.1435546875, -2.828125, -2.5126953125, -2.197265625, -1.8818359375, -1.56640625, -1.2509765625, -0.935546875, -0.6201171875, -0.3046875, 0.0107421875, 0.326171875, 0.6416015625, 0.95703125, 1.2724609375, 1.587890625, 1.9033203125, 2.21875, 2.5341796875, 2.849609375, 3.1650390625, 3.48046875, 3.7958984375, 4.111328125, 4.4267578125, 4.7421875, 5.0576171875, 5.373046875, 5.6884765625, 6.00390625, 6.3193359375, 6.634765625, 6.9501953125, 7.265625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 4.0, 11.0, 9.0, 19.0, 36.0, 77.0, 132.0, 248.0, 413.0, 608.0, 821.0, 647.0, 451.0, 262.0, 142.0, 83.0, 47.0, 28.0, 19.0, 11.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.06640625, -6.75360107421875, -6.4407958984375, -6.12799072265625, -5.815185546875, -5.50238037109375, -5.1895751953125, -4.87677001953125, -4.56396484375, -4.25115966796875, -3.9383544921875, -3.62554931640625, -3.312744140625, -2.99993896484375, -2.6871337890625, -2.37432861328125, -2.0615234375, -1.74871826171875, -1.4359130859375, -1.12310791015625, -0.810302734375, -0.49749755859375, -0.1846923828125, 0.12811279296875, 0.44091796875, 0.75372314453125, 1.0665283203125, 1.37933349609375, 1.692138671875, 2.00494384765625, 2.3177490234375, 2.63055419921875, 2.943359375, 3.25616455078125, 3.5689697265625, 3.88177490234375, 4.194580078125, 4.50738525390625, 4.8201904296875, 5.13299560546875, 5.44580078125, 5.75860595703125, 6.0714111328125, 6.38421630859375, 6.697021484375, 7.00982666015625, 7.3226318359375, 7.63543701171875, 7.9482421875, 8.26104736328125, 8.5738525390625, 8.88665771484375, 9.199462890625, 9.51226806640625, 9.8250732421875, 10.13787841796875, 10.45068359375, 10.76348876953125, 11.0762939453125, 11.38909912109375, 11.701904296875, 12.01470947265625, 12.3275146484375, 12.64031982421875, 12.953125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 10.0, 11.0, 11.0, 21.0, 11.0, 28.0, 43.0, 50.0, 81.0, 134.0, 193.0, 362.0, 588.0, 1349.0, 4062.0, 19563.0, 185063.0, 2816702.0, 1078819.0, 72457.0, 9911.0, 2530.0, 969.0, 488.0, 275.0, 180.0, 108.0, 59.0, 68.0, 41.0, 31.0, 13.0, 15.0, 15.0, 6.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.875, -14.421630859375, -13.96826171875, -13.514892578125, -13.0615234375, -12.608154296875, -12.15478515625, -11.701416015625, -11.248046875, -10.794677734375, -10.34130859375, -9.887939453125, -9.4345703125, -8.981201171875, -8.52783203125, -8.074462890625, -7.62109375, -7.167724609375, -6.71435546875, -6.260986328125, -5.8076171875, -5.354248046875, -4.90087890625, -4.447509765625, -3.994140625, -3.540771484375, -3.08740234375, -2.634033203125, -2.1806640625, -1.727294921875, -1.27392578125, -0.820556640625, -0.3671875, 0.086181640625, 0.53955078125, 0.992919921875, 1.4462890625, 1.899658203125, 2.35302734375, 2.806396484375, 3.259765625, 3.713134765625, 4.16650390625, 4.619873046875, 5.0732421875, 5.526611328125, 5.97998046875, 6.433349609375, 6.88671875, 7.340087890625, 7.79345703125, 8.246826171875, 8.7001953125, 9.153564453125, 9.60693359375, 10.060302734375, 10.513671875, 10.967041015625, 11.42041015625, 11.873779296875, 12.3271484375, 12.780517578125, 13.23388671875, 13.687255859375, 14.140625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 17.0, 81.0, 200.0, 310.0, 253.0, 111.0, 35.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-97.1061782836914, -94.59596252441406, -92.08575439453125, -89.5755386352539, -87.06532287597656, -84.55510711669922, -82.04489135742188, -79.53468322753906, -77.02446746826172, -74.51425170898438, -72.00404357910156, -69.49382781982422, -66.98361206054688, -64.47339630126953, -61.96318435668945, -59.452972412109375, -56.94275665283203, -54.43254089355469, -51.92232894897461, -49.41211700439453, -46.90190124511719, -44.391685485839844, -41.881473541259766, -39.37126159667969, -36.861045837402344, -34.350830078125, -31.840618133544922, -29.33040428161621, -26.8201904296875, -24.30997657775879, -21.799762725830078, -19.289548873901367, -16.77933120727539, -14.26911735534668, -11.758903503417969, -9.248689651489258, -6.738475799560547, -4.228261947631836, -1.718048095703125, 0.7921657562255859, 3.302379608154297, 5.812593460083008, 8.322807312011719, 10.83302116394043, 13.34323501586914, 15.853448867797852, 18.363662719726562, 20.873876571655273, 23.384090423583984, 25.894304275512695, 28.404518127441406, 30.914731979370117, 33.42494583129883, 35.935157775878906, 38.44537353515625, 40.955589294433594, 43.46580123901367, 45.97601318359375, 48.486228942871094, 50.99644470214844, 53.506656646728516, 56.016868591308594, 58.52708435058594, 61.03730010986328, 63.54751205444336]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 4.0, 9.0, 12.0, 13.0, 13.0, 16.0, 22.0, 28.0, 24.0, 21.0, 28.0, 16.0, 40.0, 33.0, 36.0, 36.0, 31.0, 32.0, 45.0, 25.0, 37.0, 32.0, 51.0, 32.0, 34.0, 23.0, 28.0, 26.0, 27.0, 21.0, 33.0, 16.0, 23.0, 15.0, 20.0, 19.0, 10.0, 15.0, 10.0, 5.0, 6.0, 7.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-18.29857635498047, -17.76156234741211, -17.22454833984375, -16.687536239624023, -16.150522232055664, -15.613508224487305, -15.076494216918945, -14.539480209350586, -14.002467155456543, -13.465453147888184, -12.92844009399414, -12.391426086425781, -11.854412078857422, -11.317399024963379, -10.78038501739502, -10.243371963500977, -9.706357955932617, -9.169343948364258, -8.632330894470215, -8.095316886901855, -7.558303356170654, -7.021289825439453, -6.484275817871094, -5.947262287139893, -5.410248756408691, -4.87323522567749, -4.336221694946289, -3.7992076873779297, -3.2621941566467285, -2.7251806259155273, -2.188166856765747, -1.6511530876159668, -1.1141395568847656, -0.5771259069442749, -0.04011225700378418, 0.49690139293670654, 1.0339150428771973, 1.5709285736083984, 2.1079423427581787, 2.644956111907959, 3.18196964263916, 3.7189831733703613, 4.2559967041015625, 4.793010711669922, 5.330024242401123, 5.867037773132324, 6.404051780700684, 6.941065311431885, 7.478078842163086, 8.015092849731445, 8.552105903625488, 9.089119911193848, 9.62613296508789, 10.16314697265625, 10.70016098022461, 11.237174987792969, 11.774188041687012, 12.311202049255371, 12.848215103149414, 13.385229110717773, 13.922243118286133, 14.459256172180176, 14.996270179748535, 15.533283233642578, 16.070297241210938]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 9.0, 6.0, 15.0, 9.0, 16.0, 10.0, 20.0, 19.0, 33.0, 49.0, 50.0, 35.0, 59.0, 54.0, 62.0, 57.0, 49.0, 60.0, 59.0, 68.0, 55.0, 40.0, 35.0, 29.0, 28.0, 20.0, 11.0, 18.0, 8.0, 10.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.890625, -2.8162078857421875, -2.741790771484375, -2.6673736572265625, -2.59295654296875, -2.5185394287109375, -2.444122314453125, -2.3697052001953125, -2.2952880859375, -2.2208709716796875, -2.146453857421875, -2.0720367431640625, -1.99761962890625, -1.9232025146484375, -1.848785400390625, -1.7743682861328125, -1.699951171875, -1.6255340576171875, -1.551116943359375, -1.4766998291015625, -1.40228271484375, -1.3278656005859375, -1.253448486328125, -1.1790313720703125, -1.1046142578125, -1.0301971435546875, -0.955780029296875, -0.8813629150390625, -0.80694580078125, -0.7325286865234375, -0.658111572265625, -0.5836944580078125, -0.50927734375, -0.4348602294921875, -0.360443115234375, -0.2860260009765625, -0.21160888671875, -0.1371917724609375, -0.062774658203125, 0.0116424560546875, 0.0860595703125, 0.1604766845703125, 0.234893798828125, 0.3093109130859375, 0.38372802734375, 0.4581451416015625, 0.532562255859375, 0.6069793701171875, 0.681396484375, 0.7558135986328125, 0.830230712890625, 0.9046478271484375, 0.97906494140625, 1.0534820556640625, 1.127899169921875, 1.2023162841796875, 1.2767333984375, 1.3511505126953125, 1.425567626953125, 1.4999847412109375, 1.57440185546875, 1.6488189697265625, 1.723236083984375, 1.7976531982421875, 1.8720703125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 5.0, 10.0, 10.0, 17.0, 14.0, 25.0, 53.0, 62.0, 123.0, 166.0, 323.0, 577.0, 1039.0, 2000.0, 3708.0, 7463.0, 14951.0, 32214.0, 74631.0, 207590.0, 455021.0, 143040.0, 56522.0, 24714.0, 11887.0, 5880.0, 2974.0, 1568.0, 863.0, 452.0, 254.0, 154.0, 89.0, 51.0, 41.0, 21.0, 19.0, 7.0, 4.0, 0.0, 8.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0191802978515625, -0.01862168312072754, -0.018063068389892578, -0.017504453659057617, -0.016945838928222656, -0.016387224197387695, -0.015828609466552734, -0.015269994735717773, -0.014711380004882812, -0.014152765274047852, -0.01359415054321289, -0.01303553581237793, -0.012476921081542969, -0.011918306350708008, -0.011359691619873047, -0.010801076889038086, -0.010242462158203125, -0.009683847427368164, -0.009125232696533203, -0.008566617965698242, -0.008008003234863281, -0.00744938850402832, -0.006890773773193359, -0.0063321590423583984, -0.0057735443115234375, -0.0052149295806884766, -0.004656314849853516, -0.004097700119018555, -0.0035390853881835938, -0.002980470657348633, -0.002421855926513672, -0.001863241195678711, -0.00130462646484375, -0.0007460117340087891, -0.00018739700317382812, 0.0003712177276611328, 0.0009298324584960938, 0.0014884471893310547, 0.0020470619201660156, 0.0026056766510009766, 0.0031642913818359375, 0.0037229061126708984, 0.004281520843505859, 0.00484013557434082, 0.005398750305175781, 0.005957365036010742, 0.006515979766845703, 0.007074594497680664, 0.007633209228515625, 0.008191823959350586, 0.008750438690185547, 0.009309053421020508, 0.009867668151855469, 0.01042628288269043, 0.01098489761352539, 0.011543512344360352, 0.012102127075195312, 0.012660741806030273, 0.013219356536865234, 0.013777971267700195, 0.014336585998535156, 0.014895200729370117, 0.015453815460205078, 0.01601243019104004, 0.016571044921875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 5.0, 8.0, 12.0, 8.0, 16.0, 17.0, 17.0, 13.0, 29.0, 31.0, 35.0, 22.0, 36.0, 32.0, 49.0, 35.0, 48.0, 37.0, 1074.0, 40.0, 40.0, 24.0, 29.0, 36.0, 43.0, 35.0, 30.0, 25.0, 32.0, 25.0, 33.0, 15.0, 16.0, 11.0, 16.0, 18.0, 13.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1083984375, -1.0726318359375, -1.036865234375, -1.0010986328125, -0.96533203125, -0.9295654296875, -0.893798828125, -0.8580322265625, -0.822265625, -0.7864990234375, -0.750732421875, -0.7149658203125, -0.67919921875, -0.6434326171875, -0.607666015625, -0.5718994140625, -0.5361328125, -0.5003662109375, -0.464599609375, -0.4288330078125, -0.39306640625, -0.3572998046875, -0.321533203125, -0.2857666015625, -0.25, -0.2142333984375, -0.178466796875, -0.1427001953125, -0.10693359375, -0.0711669921875, -0.035400390625, 0.0003662109375, 0.0361328125, 0.0718994140625, 0.107666015625, 0.1434326171875, 0.17919921875, 0.2149658203125, 0.250732421875, 0.2864990234375, 0.322265625, 0.3580322265625, 0.393798828125, 0.4295654296875, 0.46533203125, 0.5010986328125, 0.536865234375, 0.5726318359375, 0.6083984375, 0.6441650390625, 0.679931640625, 0.7156982421875, 0.75146484375, 0.7872314453125, 0.822998046875, 0.8587646484375, 0.89453125, 0.9302978515625, 0.966064453125, 1.0018310546875, 1.03759765625, 1.0733642578125, 1.109130859375, 1.1448974609375, 1.1806640625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 2.0, 11.0, 6.0, 17.0, 43.0, 56.0, 77.0, 119.0, 161.0, 277.0, 436.0, 619.0, 920.0, 1553.0, 2396.0, 3613.0, 5795.0, 9418.0, 14640.0, 23853.0, 38674.0, 64669.0, 112999.0, 1301692.0, 243799.0, 109072.0, 62191.0, 37528.0, 23214.0, 14306.0, 9020.0, 5639.0, 3678.0, 2279.0, 1493.0, 1033.0, 623.0, 366.0, 260.0, 194.0, 142.0, 70.0, 59.0, 30.0, 29.0, 25.0, 11.0, 14.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.006916046142578125, -0.006706297397613525, -0.006496548652648926, -0.006286799907684326, -0.0060770511627197266, -0.005867302417755127, -0.005657553672790527, -0.005447804927825928, -0.005238056182861328, -0.0050283074378967285, -0.004818558692932129, -0.004608809947967529, -0.00439906120300293, -0.00418931245803833, -0.0039795637130737305, -0.003769814968109131, -0.0035600662231445312, -0.0033503174781799316, -0.003140568733215332, -0.0029308199882507324, -0.002721071243286133, -0.002511322498321533, -0.0023015737533569336, -0.002091825008392334, -0.0018820762634277344, -0.0016723275184631348, -0.0014625787734985352, -0.0012528300285339355, -0.001043081283569336, -0.0008333325386047363, -0.0006235837936401367, -0.0004138350486755371, -0.0002040863037109375, 5.662441253662109e-06, 0.00021541118621826172, 0.00042515993118286133, 0.0006349086761474609, 0.0008446574211120605, 0.0010544061660766602, 0.0012641549110412598, 0.0014739036560058594, 0.001683652400970459, 0.0018934011459350586, 0.002103149890899658, 0.002312898635864258, 0.0025226473808288574, 0.002732396125793457, 0.0029421448707580566, 0.0031518936157226562, 0.003361642360687256, 0.0035713911056518555, 0.003781139850616455, 0.003990888595581055, 0.004200637340545654, 0.004410386085510254, 0.0046201348304748535, 0.004829883575439453, 0.005039632320404053, 0.005249381065368652, 0.005459129810333252, 0.0056688785552978516, 0.005878627300262451, 0.006088376045227051, 0.00629812479019165, 0.00650787353515625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [12.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 998.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [18.0, 0.0, 8.0, 0.0, 0.0, 11.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 52.0, 0.0, 755.0, 0.0, 0.0, 5962.0, 0.0, 0.0, 1034942.0, 0.0, 5984.0, 0.0, 0.0, 715.0, 0.0, 0.0, 59.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 10.0, 0.0, 16.0], "bins": [-7.152557373046875e-07, -6.92903995513916e-07, -6.705522537231445e-07, -6.48200511932373e-07, -6.258487701416016e-07, -6.034970283508301e-07, -5.811452865600586e-07, -5.587935447692871e-07, -5.364418029785156e-07, -5.140900611877441e-07, -4.917383193969727e-07, -4.6938657760620117e-07, -4.470348358154297e-07, -4.246830940246582e-07, -4.023313522338867e-07, -3.7997961044311523e-07, -3.5762786865234375e-07, -3.3527612686157227e-07, -3.129243850708008e-07, -2.905726432800293e-07, -2.682209014892578e-07, -2.4586915969848633e-07, -2.2351741790771484e-07, -2.0116567611694336e-07, -1.7881393432617188e-07, -1.564621925354004e-07, -1.341104507446289e-07, -1.1175870895385742e-07, -8.940696716308594e-08, -6.705522537231445e-08, -4.470348358154297e-08, -2.2351741790771484e-08, 0.0, 2.2351741790771484e-08, 4.470348358154297e-08, 6.705522537231445e-08, 8.940696716308594e-08, 1.1175870895385742e-07, 1.341104507446289e-07, 1.564621925354004e-07, 1.7881393432617188e-07, 2.0116567611694336e-07, 2.2351741790771484e-07, 2.4586915969848633e-07, 2.682209014892578e-07, 2.905726432800293e-07, 3.129243850708008e-07, 3.3527612686157227e-07, 3.5762786865234375e-07, 3.7997961044311523e-07, 4.023313522338867e-07, 4.246830940246582e-07, 4.470348358154297e-07, 4.6938657760620117e-07, 4.917383193969727e-07, 5.140900611877441e-07, 5.364418029785156e-07, 5.587935447692871e-07, 5.811452865600586e-07, 6.034970283508301e-07, 6.258487701416016e-07, 6.48200511932373e-07, 6.705522537231445e-07, 6.92903995513916e-07, 7.152557373046875e-07]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 9.0, 6.0, 15.0, 9.0, 16.0, 10.0, 20.0, 19.0, 33.0, 49.0, 50.0, 35.0, 59.0, 54.0, 62.0, 57.0, 49.0, 60.0, 59.0, 68.0, 55.0, 40.0, 35.0, 29.0, 28.0, 20.0, 11.0, 18.0, 8.0, 10.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.890625, -2.8162078857421875, -2.741790771484375, -2.6673736572265625, -2.59295654296875, -2.5185394287109375, -2.444122314453125, -2.3697052001953125, -2.2952880859375, -2.2208709716796875, -2.146453857421875, -2.0720367431640625, -1.99761962890625, -1.9232025146484375, -1.848785400390625, -1.7743682861328125, -1.699951171875, -1.6255340576171875, -1.551116943359375, -1.4766998291015625, -1.40228271484375, -1.3278656005859375, -1.253448486328125, -1.1790313720703125, -1.1046142578125, -1.0301971435546875, -0.955780029296875, -0.8813629150390625, -0.80694580078125, -0.7325286865234375, -0.658111572265625, -0.5836944580078125, -0.50927734375, -0.4348602294921875, -0.360443115234375, -0.2860260009765625, -0.21160888671875, -0.1371917724609375, -0.062774658203125, 0.0116424560546875, 0.0860595703125, 0.1604766845703125, 0.234893798828125, 0.3093109130859375, 0.38372802734375, 0.4581451416015625, 0.532562255859375, 0.6069793701171875, 0.681396484375, 0.7558135986328125, 0.830230712890625, 0.9046478271484375, 0.97906494140625, 1.0534820556640625, 1.127899169921875, 1.2023162841796875, 1.2767333984375, 1.3511505126953125, 1.425567626953125, 1.4999847412109375, 1.57440185546875, 1.6488189697265625, 1.723236083984375, 1.7976531982421875, 1.8720703125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 7.0, 16.0, 10.0, 28.0, 36.0, 100.0, 177.0, 346.0, 775.0, 1841.0, 4521.0, 11392.0, 30568.0, 105352.0, 713714.0, 124879.0, 33631.0, 12617.0, 4897.0, 1970.0, 868.0, 400.0, 178.0, 88.0, 72.0, 25.0, 11.0, 8.0, 8.0, 2.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.85546875, -2.761993408203125, -2.66851806640625, -2.575042724609375, -2.4815673828125, -2.388092041015625, -2.29461669921875, -2.201141357421875, -2.107666015625, -2.014190673828125, -1.92071533203125, -1.827239990234375, -1.7337646484375, -1.640289306640625, -1.54681396484375, -1.453338623046875, -1.35986328125, -1.266387939453125, -1.17291259765625, -1.079437255859375, -0.9859619140625, -0.892486572265625, -0.79901123046875, -0.705535888671875, -0.612060546875, -0.518585205078125, -0.42510986328125, -0.331634521484375, -0.2381591796875, -0.144683837890625, -0.05120849609375, 0.042266845703125, 0.1357421875, 0.229217529296875, 0.32269287109375, 0.416168212890625, 0.5096435546875, 0.603118896484375, 0.69659423828125, 0.790069580078125, 0.883544921875, 0.977020263671875, 1.07049560546875, 1.163970947265625, 1.2574462890625, 1.350921630859375, 1.44439697265625, 1.537872314453125, 1.63134765625, 1.724822998046875, 1.81829833984375, 1.911773681640625, 2.0052490234375, 2.098724365234375, 2.19219970703125, 2.285675048828125, 2.379150390625, 2.472625732421875, 2.56610107421875, 2.659576416015625, 2.7530517578125, 2.846527099609375, 2.94000244140625, 3.033477783203125, 3.126953125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 2.0, 6.0, 3.0, 4.0, 7.0, 4.0, 9.0, 14.0, 15.0, 17.0, 13.0, 19.0, 21.0, 20.0, 19.0, 27.0, 38.0, 34.0, 33.0, 41.0, 53.0, 74.0, 110.0, 1700.0, 242.0, 102.0, 40.0, 33.0, 32.0, 43.0, 37.0, 38.0, 24.0, 26.0, 22.0, 26.0, 10.0, 15.0, 10.0, 15.0, 7.0, 9.0, 5.0, 5.0, 5.0, 2.0, 7.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.625, -5.44256591796875, -5.2601318359375, -5.07769775390625, -4.895263671875, -4.71282958984375, -4.5303955078125, -4.34796142578125, -4.16552734375, -3.98309326171875, -3.8006591796875, -3.61822509765625, -3.435791015625, -3.25335693359375, -3.0709228515625, -2.88848876953125, -2.7060546875, -2.52362060546875, -2.3411865234375, -2.15875244140625, -1.976318359375, -1.79388427734375, -1.6114501953125, -1.42901611328125, -1.24658203125, -1.06414794921875, -0.8817138671875, -0.69927978515625, -0.516845703125, -0.33441162109375, -0.1519775390625, 0.03045654296875, 0.212890625, 0.39532470703125, 0.5777587890625, 0.76019287109375, 0.942626953125, 1.12506103515625, 1.3074951171875, 1.48992919921875, 1.67236328125, 1.85479736328125, 2.0372314453125, 2.21966552734375, 2.402099609375, 2.58453369140625, 2.7669677734375, 2.94940185546875, 3.1318359375, 3.31427001953125, 3.4967041015625, 3.67913818359375, 3.861572265625, 4.04400634765625, 4.2264404296875, 4.40887451171875, 4.59130859375, 4.77374267578125, 4.9561767578125, 5.13861083984375, 5.321044921875, 5.50347900390625, 5.6859130859375, 5.86834716796875, 6.05078125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 5.0, 3.0, 3.0, 4.0, 9.0, 7.0, 7.0, 12.0, 13.0, 19.0, 14.0, 21.0, 35.0, 29.0, 39.0, 72.0, 96.0, 138.0, 239.0, 466.0, 1604.0, 11384.0, 415481.0, 2689898.0, 22125.0, 2522.0, 599.0, 297.0, 143.0, 103.0, 68.0, 58.0, 29.0, 26.0, 19.0, 24.0, 14.0, 16.0, 15.0, 10.0, 10.0, 6.0, 4.0, 4.0, 6.0, 4.0, 4.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-10.1875, -9.8800048828125, -9.572509765625, -9.2650146484375, -8.95751953125, -8.6500244140625, -8.342529296875, -8.0350341796875, -7.7275390625, -7.4200439453125, -7.112548828125, -6.8050537109375, -6.49755859375, -6.1900634765625, -5.882568359375, -5.5750732421875, -5.267578125, -4.9600830078125, -4.652587890625, -4.3450927734375, -4.03759765625, -3.7301025390625, -3.422607421875, -3.1151123046875, -2.8076171875, -2.5001220703125, -2.192626953125, -1.8851318359375, -1.57763671875, -1.2701416015625, -0.962646484375, -0.6551513671875, -0.34765625, -0.0401611328125, 0.267333984375, 0.5748291015625, 0.88232421875, 1.1898193359375, 1.497314453125, 1.8048095703125, 2.1123046875, 2.4197998046875, 2.727294921875, 3.0347900390625, 3.34228515625, 3.6497802734375, 3.957275390625, 4.2647705078125, 4.572265625, 4.8797607421875, 5.187255859375, 5.4947509765625, 5.80224609375, 6.1097412109375, 6.417236328125, 6.7247314453125, 7.0322265625, 7.3397216796875, 7.647216796875, 7.9547119140625, 8.26220703125, 8.5697021484375, 8.877197265625, 9.1846923828125, 9.4921875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 24.0, 83.0, 151.0, 265.0, 219.0, 160.0, 79.0, 22.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9689764976501465, -4.418506622314453, -3.868037223815918, -3.3175673484802246, -2.7670977115631104, -2.216628074645996, -1.6661581993103027, -1.1156885623931885, -0.5652189254760742, -0.014749228954315186, 0.5357204675674438, 1.0861902236938477, 1.636659860610962, 2.187129497528076, 2.7375993728637695, 3.288069009780884, 3.838538646697998, 4.389008522033691, 4.939477920532227, 5.48994779586792, 6.040417671203613, 6.590887069702148, 7.141356945037842, 7.691826820373535, 8.24229621887207, 8.792765617370605, 9.343235969543457, 9.893705368041992, 10.444174766540527, 10.994644165039062, 11.545114517211914, 12.09558391571045, 12.646055221557617, 13.196524620056152, 13.746994972229004, 14.297464370727539, 14.847933769226074, 15.39840316772461, 15.948873519897461, 16.499343872070312, 17.04981231689453, 17.600282669067383, 18.1507511138916, 18.701221466064453, 19.251691818237305, 19.802160263061523, 20.352630615234375, 20.903100967407227, 21.453571319580078, 22.00404167175293, 22.55451011657715, 23.10498046875, 23.65545082092285, 24.20591926574707, 24.756389617919922, 25.306859970092773, 25.857328414916992, 26.407798767089844, 26.958267211914062, 27.508737564086914, 28.059207916259766, 28.609676361083984, 29.160146713256836, 29.710617065429688, 30.261085510253906]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 3.0, 1.0, 4.0, 5.0, 11.0, 7.0, 14.0, 25.0, 19.0, 16.0, 18.0, 22.0, 28.0, 44.0, 32.0, 36.0, 37.0, 36.0, 51.0, 33.0, 39.0, 43.0, 36.0, 44.0, 36.0, 45.0, 40.0, 26.0, 26.0, 28.0, 33.0, 26.0, 16.0, 19.0, 13.0, 24.0, 15.0, 14.0, 7.0, 8.0, 1.0, 5.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.887758255004883, -18.264698028564453, -17.641637802124023, -17.018577575683594, -16.395517349243164, -15.772457122802734, -15.149397850036621, -14.526337623596191, -13.903277397155762, -13.280217170715332, -12.657156944274902, -12.034096717834473, -11.41103744506836, -10.78797721862793, -10.1649169921875, -9.54185676574707, -8.91879653930664, -8.295736312866211, -7.672676086425781, -7.04961633682251, -6.42655611038208, -5.80349588394165, -5.180436134338379, -4.557375907897949, -3.9343156814575195, -3.31125545501709, -2.6881954669952393, -2.0651354789733887, -1.442075252532959, -0.8190150260925293, -0.1959550380706787, 0.4271049499511719, 1.0501651763916016, 1.6732252836227417, 2.296285390853882, 2.9193453788757324, 3.542405605316162, 4.165465831756592, 4.788525581359863, 5.411585807800293, 6.034646034240723, 6.657706260681152, 7.280766487121582, 7.9038262367248535, 8.526885986328125, 9.149946212768555, 9.773006439208984, 10.396066665649414, 11.019126892089844, 11.642187118530273, 12.265247344970703, 12.888307571411133, 13.511367797851562, 14.134428024291992, 14.757487297058105, 15.380547523498535, 16.00360870361328, 16.62666893005371, 17.24972915649414, 17.87278938293457, 18.495849609375, 19.11890983581543, 19.74197006225586, 20.365028381347656, 20.988088607788086]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 10.0, 13.0, 10.0, 17.0, 10.0, 13.0, 20.0, 31.0, 37.0, 55.0, 37.0, 56.0, 56.0, 51.0, 68.0, 43.0, 49.0, 67.0, 66.0, 52.0, 51.0, 38.0, 33.0, 26.0, 24.0, 16.0, 15.0, 13.0, 6.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.875, -2.7997589111328125, -2.724517822265625, -2.6492767333984375, -2.57403564453125, -2.4987945556640625, -2.423553466796875, -2.3483123779296875, -2.2730712890625, -2.1978302001953125, -2.122589111328125, -2.0473480224609375, -1.97210693359375, -1.8968658447265625, -1.821624755859375, -1.7463836669921875, -1.671142578125, -1.5959014892578125, -1.520660400390625, -1.4454193115234375, -1.37017822265625, -1.2949371337890625, -1.219696044921875, -1.1444549560546875, -1.0692138671875, -0.9939727783203125, -0.918731689453125, -0.8434906005859375, -0.76824951171875, -0.6930084228515625, -0.617767333984375, -0.5425262451171875, -0.46728515625, -0.3920440673828125, -0.316802978515625, -0.2415618896484375, -0.16632080078125, -0.0910797119140625, -0.015838623046875, 0.0594024658203125, 0.1346435546875, 0.2098846435546875, 0.285125732421875, 0.3603668212890625, 0.43560791015625, 0.5108489990234375, 0.586090087890625, 0.6613311767578125, 0.736572265625, 0.8118133544921875, 0.887054443359375, 0.9622955322265625, 1.03753662109375, 1.1127777099609375, 1.188018798828125, 1.2632598876953125, 1.3385009765625, 1.4137420654296875, 1.488983154296875, 1.5642242431640625, 1.63946533203125, 1.7147064208984375, 1.789947509765625, 1.8651885986328125, 1.9404296875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 10.0, 19.0, 16.0, 15.0, 20.0, 20.0, 26.0, 40.0, 46.0, 74.0, 105.0, 252.0, 576.0, 1598.0, 7556.0, 51914.0, 676609.0, 3194326.0, 230616.0, 24316.0, 4151.0, 1070.0, 376.0, 150.0, 93.0, 86.0, 45.0, 32.0, 29.0, 26.0, 10.0, 16.0, 8.0, 9.0, 6.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.0078125, -9.7161865234375, -9.424560546875, -9.1329345703125, -8.84130859375, -8.5496826171875, -8.258056640625, -7.9664306640625, -7.6748046875, -7.3831787109375, -7.091552734375, -6.7999267578125, -6.50830078125, -6.2166748046875, -5.925048828125, -5.6334228515625, -5.341796875, -5.0501708984375, -4.758544921875, -4.4669189453125, -4.17529296875, -3.8836669921875, -3.592041015625, -3.3004150390625, -3.0087890625, -2.7171630859375, -2.425537109375, -2.1339111328125, -1.84228515625, -1.5506591796875, -1.259033203125, -0.9674072265625, -0.67578125, -0.3841552734375, -0.092529296875, 0.1990966796875, 0.49072265625, 0.7823486328125, 1.073974609375, 1.3656005859375, 1.6572265625, 1.9488525390625, 2.240478515625, 2.5321044921875, 2.82373046875, 3.1153564453125, 3.406982421875, 3.6986083984375, 3.990234375, 4.2818603515625, 4.573486328125, 4.8651123046875, 5.15673828125, 5.4483642578125, 5.739990234375, 6.0316162109375, 6.3232421875, 6.6148681640625, 6.906494140625, 7.1981201171875, 7.48974609375, 7.7813720703125, 8.072998046875, 8.3646240234375, 8.65625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 7.0, 5.0, 8.0, 16.0, 32.0, 55.0, 103.0, 163.0, 292.0, 510.0, 844.0, 840.0, 520.0, 317.0, 171.0, 96.0, 49.0, 24.0, 10.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.375, -16.03363037109375, -15.6922607421875, -15.35089111328125, -15.009521484375, -14.66815185546875, -14.3267822265625, -13.98541259765625, -13.64404296875, -13.30267333984375, -12.9613037109375, -12.61993408203125, -12.278564453125, -11.93719482421875, -11.5958251953125, -11.25445556640625, -10.9130859375, -10.57171630859375, -10.2303466796875, -9.88897705078125, -9.547607421875, -9.20623779296875, -8.8648681640625, -8.52349853515625, -8.18212890625, -7.84075927734375, -7.4993896484375, -7.15802001953125, -6.816650390625, -6.47528076171875, -6.1339111328125, -5.79254150390625, -5.451171875, -5.10980224609375, -4.7684326171875, -4.42706298828125, -4.085693359375, -3.74432373046875, -3.4029541015625, -3.06158447265625, -2.72021484375, -2.37884521484375, -2.0374755859375, -1.69610595703125, -1.354736328125, -1.01336669921875, -0.6719970703125, -0.33062744140625, 0.0107421875, 0.35211181640625, 0.6934814453125, 1.03485107421875, 1.376220703125, 1.71759033203125, 2.0589599609375, 2.40032958984375, 2.74169921875, 3.08306884765625, 3.4244384765625, 3.76580810546875, 4.107177734375, 4.44854736328125, 4.7899169921875, 5.13128662109375, 5.47265625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 13.0, 12.0, 11.0, 25.0, 31.0, 58.0, 112.0, 146.0, 365.0, 880.0, 3783.0, 57427.0, 3360730.0, 751169.0, 16427.0, 1913.0, 551.0, 230.0, 141.0, 86.0, 32.0, 38.0, 35.0, 20.0, 13.0, 8.0, 6.0, 1.0, 7.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.359375, -16.563232421875, -15.76708984375, -14.970947265625, -14.1748046875, -13.378662109375, -12.58251953125, -11.786376953125, -10.990234375, -10.194091796875, -9.39794921875, -8.601806640625, -7.8056640625, -7.009521484375, -6.21337890625, -5.417236328125, -4.62109375, -3.824951171875, -3.02880859375, -2.232666015625, -1.4365234375, -0.640380859375, 0.15576171875, 0.951904296875, 1.748046875, 2.544189453125, 3.34033203125, 4.136474609375, 4.9326171875, 5.728759765625, 6.52490234375, 7.321044921875, 8.1171875, 8.913330078125, 9.70947265625, 10.505615234375, 11.3017578125, 12.097900390625, 12.89404296875, 13.690185546875, 14.486328125, 15.282470703125, 16.07861328125, 16.874755859375, 17.6708984375, 18.467041015625, 19.26318359375, 20.059326171875, 20.85546875, 21.651611328125, 22.44775390625, 23.243896484375, 24.0400390625, 24.836181640625, 25.63232421875, 26.428466796875, 27.224609375, 28.020751953125, 28.81689453125, 29.613037109375, 30.4091796875, 31.205322265625, 32.00146484375, 32.797607421875, 33.59375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 17.0, 25.0, 43.0, 61.0, 104.0, 152.0, 153.0, 141.0, 121.0, 83.0, 56.0, 22.0, 12.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-62.122764587402344, -60.66960525512695, -59.21644592285156, -57.763282775878906, -56.310123443603516, -54.856964111328125, -53.403804779052734, -51.950645446777344, -50.49748611450195, -49.04432678222656, -47.59116744995117, -46.13800811767578, -44.684844970703125, -43.231685638427734, -41.778526306152344, -40.32536697387695, -38.87220764160156, -37.41904830932617, -35.96588897705078, -34.512725830078125, -33.059566497802734, -31.606407165527344, -30.153247833251953, -28.700088500976562, -27.246925354003906, -25.793766021728516, -24.340604782104492, -22.8874454498291, -21.43428611755371, -19.981124877929688, -18.527965545654297, -17.074806213378906, -15.621644973754883, -14.168484687805176, -12.715325355529785, -11.262165069580078, -9.809005737304688, -8.35584545135498, -6.902685165405273, -5.449525833129883, -3.996365547180176, -2.543205738067627, -1.090045690536499, 0.3631143569946289, 1.8162741661071777, 3.2694339752197266, 4.722594261169434, 6.175753593444824, 7.628913879394531, 9.082074165344238, 10.535233497619629, 11.988393783569336, 13.441553115844727, 14.894713401794434, 16.34787368774414, 17.80103302001953, 19.254192352294922, 20.707351684570312, 22.160512924194336, 23.613672256469727, 25.066831588745117, 26.51999282836914, 27.97315216064453, 29.426311492919922, 30.879472732543945]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 3.0, 2.0, 4.0, 8.0, 9.0, 13.0, 10.0, 13.0, 11.0, 15.0, 21.0, 23.0, 24.0, 18.0, 44.0, 32.0, 35.0, 42.0, 39.0, 42.0, 43.0, 39.0, 51.0, 41.0, 51.0, 44.0, 44.0, 27.0, 42.0, 37.0, 26.0, 24.0, 30.0, 22.0, 18.0, 15.0, 11.0, 6.0, 5.0, 5.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.445066452026367, -20.74574089050293, -20.046417236328125, -19.347091674804688, -18.64776611328125, -17.948440551757812, -17.249114990234375, -16.54979133605957, -15.850465774536133, -15.151140213012695, -14.451815605163574, -13.752490997314453, -13.053165435791016, -12.353839874267578, -11.654515266418457, -10.955190658569336, -10.255865097045898, -9.556539535522461, -8.85721492767334, -8.157890319824219, -7.458564758300781, -6.759239673614502, -6.059914588928223, -5.360589504241943, -4.661264419555664, -3.9619393348693848, -3.2626142501831055, -2.563289165496826, -1.8639640808105469, -1.1646389961242676, -0.4653139114379883, 0.23401117324829102, 0.9333343505859375, 1.6326594352722168, 2.331984519958496, 3.0313096046447754, 3.7306346893310547, 4.429959774017334, 5.129284858703613, 5.828609943389893, 6.527935028076172, 7.227260112762451, 7.9265851974487305, 8.625909805297852, 9.325235366821289, 10.024560928344727, 10.723885536193848, 11.423210144042969, 12.122535705566406, 12.821861267089844, 13.521185874938965, 14.220510482788086, 14.919836044311523, 15.619161605834961, 16.318485260009766, 17.017810821533203, 17.71713638305664, 18.416461944580078, 19.115787506103516, 19.81511116027832, 20.514436721801758, 21.213762283325195, 21.9130859375, 22.612411499023438, 23.311737060546875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 4.0, 9.0, 9.0, 16.0, 7.0, 14.0, 11.0, 18.0, 16.0, 32.0, 41.0, 38.0, 41.0, 46.0, 45.0, 55.0, 47.0, 56.0, 54.0, 55.0, 52.0, 51.0, 62.0, 31.0, 31.0, 35.0, 26.0, 22.0, 24.0, 12.0, 11.0, 12.0, 4.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.71875, -2.64459228515625, -2.5704345703125, -2.49627685546875, -2.422119140625, -2.34796142578125, -2.2738037109375, -2.19964599609375, -2.12548828125, -2.05133056640625, -1.9771728515625, -1.90301513671875, -1.828857421875, -1.75469970703125, -1.6805419921875, -1.60638427734375, -1.5322265625, -1.45806884765625, -1.3839111328125, -1.30975341796875, -1.235595703125, -1.16143798828125, -1.0872802734375, -1.01312255859375, -0.93896484375, -0.86480712890625, -0.7906494140625, -0.71649169921875, -0.642333984375, -0.56817626953125, -0.4940185546875, -0.41986083984375, -0.345703125, -0.27154541015625, -0.1973876953125, -0.12322998046875, -0.049072265625, 0.02508544921875, 0.0992431640625, 0.17340087890625, 0.24755859375, 0.32171630859375, 0.3958740234375, 0.47003173828125, 0.544189453125, 0.61834716796875, 0.6925048828125, 0.76666259765625, 0.8408203125, 0.91497802734375, 0.9891357421875, 1.06329345703125, 1.137451171875, 1.21160888671875, 1.2857666015625, 1.35992431640625, 1.43408203125, 1.50823974609375, 1.5823974609375, 1.65655517578125, 1.730712890625, 1.80487060546875, 1.8790283203125, 1.95318603515625, 2.02734375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 5.0, 7.0, 7.0, 3.0, 14.0, 18.0, 27.0, 38.0, 53.0, 101.0, 151.0, 239.0, 395.0, 606.0, 997.0, 1559.0, 2846.0, 4639.0, 8287.0, 14334.0, 25620.0, 49873.0, 103556.0, 307771.0, 311669.0, 105086.0, 49890.0, 26517.0, 14373.0, 8109.0, 4662.0, 2787.0, 1647.0, 1029.0, 641.0, 379.0, 240.0, 139.0, 68.0, 57.0, 42.0, 25.0, 15.0, 14.0, 12.0, 2.0, 2.0, 4.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0162353515625, -0.01575791835784912, -0.015280485153198242, -0.014803051948547363, -0.014325618743896484, -0.013848185539245605, -0.013370752334594727, -0.012893319129943848, -0.012415885925292969, -0.01193845272064209, -0.011461019515991211, -0.010983586311340332, -0.010506153106689453, -0.010028719902038574, -0.009551286697387695, -0.009073853492736816, -0.008596420288085938, -0.008118987083435059, -0.00764155387878418, -0.007164120674133301, -0.006686687469482422, -0.006209254264831543, -0.005731821060180664, -0.005254387855529785, -0.004776954650878906, -0.004299521446228027, -0.0038220882415771484, -0.0033446550369262695, -0.0028672218322753906, -0.0023897886276245117, -0.0019123554229736328, -0.001434922218322754, -0.000957489013671875, -0.0004800558090209961, -2.6226043701171875e-06, 0.0004748106002807617, 0.0009522438049316406, 0.0014296770095825195, 0.0019071102142333984, 0.0023845434188842773, 0.0028619766235351562, 0.003339409828186035, 0.003816843032836914, 0.004294276237487793, 0.004771709442138672, 0.005249142646789551, 0.00572657585144043, 0.006204009056091309, 0.0066814422607421875, 0.007158875465393066, 0.007636308670043945, 0.008113741874694824, 0.008591175079345703, 0.009068608283996582, 0.009546041488647461, 0.01002347469329834, 0.010500907897949219, 0.010978341102600098, 0.011455774307250977, 0.011933207511901855, 0.012410640716552734, 0.012888073921203613, 0.013365507125854492, 0.013842940330505371, 0.01432037353515625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 5.0, 6.0, 5.0, 9.0, 13.0, 11.0, 15.0, 12.0, 13.0, 15.0, 17.0, 20.0, 26.0, 31.0, 41.0, 39.0, 46.0, 34.0, 44.0, 49.0, 1063.0, 45.0, 31.0, 34.0, 40.0, 42.0, 39.0, 38.0, 26.0, 33.0, 28.0, 18.0, 22.0, 21.0, 22.0, 11.0, 13.0, 6.0, 6.0, 6.0, 5.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.1953125, -1.1561279296875, -1.116943359375, -1.0777587890625, -1.03857421875, -0.9993896484375, -0.960205078125, -0.9210205078125, -0.8818359375, -0.8426513671875, -0.803466796875, -0.7642822265625, -0.72509765625, -0.6859130859375, -0.646728515625, -0.6075439453125, -0.568359375, -0.5291748046875, -0.489990234375, -0.4508056640625, -0.41162109375, -0.3724365234375, -0.333251953125, -0.2940673828125, -0.2548828125, -0.2156982421875, -0.176513671875, -0.1373291015625, -0.09814453125, -0.0589599609375, -0.019775390625, 0.0194091796875, 0.05859375, 0.0977783203125, 0.136962890625, 0.1761474609375, 0.21533203125, 0.2545166015625, 0.293701171875, 0.3328857421875, 0.3720703125, 0.4112548828125, 0.450439453125, 0.4896240234375, 0.52880859375, 0.5679931640625, 0.607177734375, 0.6463623046875, 0.685546875, 0.7247314453125, 0.763916015625, 0.8031005859375, 0.84228515625, 0.8814697265625, 0.920654296875, 0.9598388671875, 0.9990234375, 1.0382080078125, 1.077392578125, 1.1165771484375, 1.15576171875, 1.1949462890625, 1.234130859375, 1.2733154296875, 1.3125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 10.0, 7.0, 21.0, 17.0, 40.0, 74.0, 76.0, 111.0, 167.0, 271.0, 447.0, 559.0, 810.0, 1207.0, 1854.0, 2759.0, 4100.0, 6238.0, 9679.0, 15103.0, 23859.0, 39471.0, 67743.0, 127778.0, 1339385.0, 214543.0, 97302.0, 54112.0, 32442.0, 19700.0, 12684.0, 8306.0, 5345.0, 3605.0, 2449.0, 1552.0, 1084.0, 757.0, 466.0, 328.0, 231.0, 129.0, 95.0, 68.0, 45.0, 34.0, 25.0, 20.0, 11.0, 6.0, 5.0, 3.0, 1.0, 5.0, 2.0], "bins": [-0.00792694091796875, -0.007692456245422363, -0.0074579715728759766, -0.00722348690032959, -0.006989002227783203, -0.006754517555236816, -0.00652003288269043, -0.006285548210144043, -0.006051063537597656, -0.0058165788650512695, -0.005582094192504883, -0.005347609519958496, -0.005113124847412109, -0.004878640174865723, -0.004644155502319336, -0.004409670829772949, -0.0041751861572265625, -0.003940701484680176, -0.003706216812133789, -0.0034717321395874023, -0.0032372474670410156, -0.003002762794494629, -0.002768278121948242, -0.0025337934494018555, -0.0022993087768554688, -0.002064824104309082, -0.0018303394317626953, -0.0015958547592163086, -0.0013613700866699219, -0.0011268854141235352, -0.0008924007415771484, -0.0006579160690307617, -0.000423431396484375, -0.00018894672393798828, 4.553794860839844e-05, 0.00028002262115478516, 0.0005145072937011719, 0.0007489919662475586, 0.0009834766387939453, 0.001217961311340332, 0.0014524459838867188, 0.0016869306564331055, 0.0019214153289794922, 0.002155900001525879, 0.0023903846740722656, 0.0026248693466186523, 0.002859354019165039, 0.0030938386917114258, 0.0033283233642578125, 0.0035628080368041992, 0.003797292709350586, 0.004031777381896973, 0.004266262054443359, 0.004500746726989746, 0.004735231399536133, 0.0049697160720825195, 0.005204200744628906, 0.005438685417175293, 0.00567317008972168, 0.005907654762268066, 0.006142139434814453, 0.00637662410736084, 0.0066111087799072266, 0.006845593452453613, 0.007080078125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1000.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [9.0, 0.0, 6.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 20.0, 0.0, 0.0, 61.0, 0.0, 960.0, 0.0, 0.0, 5984.0, 0.0, 0.0, 1034427.0, 0.0, 6024.0, 0.0, 0.0, 944.0, 0.0, 0.0, 55.0, 0.0, 17.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 5.0, 0.0, 4.0], "bins": [-7.152557373046875e-07, -6.92903995513916e-07, -6.705522537231445e-07, -6.48200511932373e-07, -6.258487701416016e-07, -6.034970283508301e-07, -5.811452865600586e-07, -5.587935447692871e-07, -5.364418029785156e-07, -5.140900611877441e-07, -4.917383193969727e-07, -4.6938657760620117e-07, -4.470348358154297e-07, -4.246830940246582e-07, -4.023313522338867e-07, -3.7997961044311523e-07, -3.5762786865234375e-07, -3.3527612686157227e-07, -3.129243850708008e-07, -2.905726432800293e-07, -2.682209014892578e-07, -2.4586915969848633e-07, -2.2351741790771484e-07, -2.0116567611694336e-07, -1.7881393432617188e-07, -1.564621925354004e-07, -1.341104507446289e-07, -1.1175870895385742e-07, -8.940696716308594e-08, -6.705522537231445e-08, -4.470348358154297e-08, -2.2351741790771484e-08, 0.0, 2.2351741790771484e-08, 4.470348358154297e-08, 6.705522537231445e-08, 8.940696716308594e-08, 1.1175870895385742e-07, 1.341104507446289e-07, 1.564621925354004e-07, 1.7881393432617188e-07, 2.0116567611694336e-07, 2.2351741790771484e-07, 2.4586915969848633e-07, 2.682209014892578e-07, 2.905726432800293e-07, 3.129243850708008e-07, 3.3527612686157227e-07, 3.5762786865234375e-07, 3.7997961044311523e-07, 4.023313522338867e-07, 4.246830940246582e-07, 4.470348358154297e-07, 4.6938657760620117e-07, 4.917383193969727e-07, 5.140900611877441e-07, 5.364418029785156e-07, 5.587935447692871e-07, 5.811452865600586e-07, 6.034970283508301e-07, 6.258487701416016e-07, 6.48200511932373e-07, 6.705522537231445e-07, 6.92903995513916e-07, 7.152557373046875e-07]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 4.0, 9.0, 9.0, 16.0, 7.0, 14.0, 11.0, 18.0, 16.0, 32.0, 41.0, 38.0, 41.0, 46.0, 45.0, 55.0, 47.0, 56.0, 54.0, 55.0, 52.0, 51.0, 62.0, 31.0, 31.0, 35.0, 26.0, 22.0, 24.0, 12.0, 11.0, 12.0, 4.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.71875, -2.64459228515625, -2.5704345703125, -2.49627685546875, -2.422119140625, -2.34796142578125, -2.2738037109375, -2.19964599609375, -2.12548828125, -2.05133056640625, -1.9771728515625, -1.90301513671875, -1.828857421875, -1.75469970703125, -1.6805419921875, -1.60638427734375, -1.5322265625, -1.45806884765625, -1.3839111328125, -1.30975341796875, -1.235595703125, -1.16143798828125, -1.0872802734375, -1.01312255859375, -0.93896484375, -0.86480712890625, -0.7906494140625, -0.71649169921875, -0.642333984375, -0.56817626953125, -0.4940185546875, -0.41986083984375, -0.345703125, -0.27154541015625, -0.1973876953125, -0.12322998046875, -0.049072265625, 0.02508544921875, 0.0992431640625, 0.17340087890625, 0.24755859375, 0.32171630859375, 0.3958740234375, 0.47003173828125, 0.544189453125, 0.61834716796875, 0.6925048828125, 0.76666259765625, 0.8408203125, 0.91497802734375, 0.9891357421875, 1.06329345703125, 1.137451171875, 1.21160888671875, 1.2857666015625, 1.35992431640625, 1.43408203125, 1.50823974609375, 1.5823974609375, 1.65655517578125, 1.730712890625, 1.80487060546875, 1.8790283203125, 1.95318603515625, 2.02734375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 10.0, 8.0, 23.0, 19.0, 36.0, 60.0, 60.0, 115.0, 161.0, 254.0, 363.0, 587.0, 950.0, 1584.0, 2423.0, 4055.0, 6975.0, 12453.0, 24466.0, 57204.0, 192700.0, 506814.0, 141809.0, 47304.0, 21099.0, 11187.0, 6102.0, 3666.0, 2216.0, 1381.0, 893.0, 550.0, 344.0, 239.0, 156.0, 108.0, 57.0, 41.0, 29.0, 23.0, 12.0, 12.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.568359375, -1.5252685546875, -1.482177734375, -1.4390869140625, -1.39599609375, -1.3529052734375, -1.309814453125, -1.2667236328125, -1.2236328125, -1.1805419921875, -1.137451171875, -1.0943603515625, -1.05126953125, -1.0081787109375, -0.965087890625, -0.9219970703125, -0.87890625, -0.8358154296875, -0.792724609375, -0.7496337890625, -0.70654296875, -0.6634521484375, -0.620361328125, -0.5772705078125, -0.5341796875, -0.4910888671875, -0.447998046875, -0.4049072265625, -0.36181640625, -0.3187255859375, -0.275634765625, -0.2325439453125, -0.189453125, -0.1463623046875, -0.103271484375, -0.0601806640625, -0.01708984375, 0.0260009765625, 0.069091796875, 0.1121826171875, 0.1552734375, 0.1983642578125, 0.241455078125, 0.2845458984375, 0.32763671875, 0.3707275390625, 0.413818359375, 0.4569091796875, 0.5, 0.5430908203125, 0.586181640625, 0.6292724609375, 0.67236328125, 0.7154541015625, 0.758544921875, 0.8016357421875, 0.8447265625, 0.8878173828125, 0.930908203125, 0.9739990234375, 1.01708984375, 1.0601806640625, 1.103271484375, 1.1463623046875, 1.189453125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 6.0, 7.0, 9.0, 10.0, 13.0, 14.0, 19.0, 30.0, 26.0, 40.0, 42.0, 52.0, 44.0, 63.0, 93.0, 317.0, 1706.0, 97.0, 72.0, 65.0, 55.0, 51.0, 39.0, 32.0, 22.0, 20.0, 21.0, 23.0, 9.0, 11.0, 13.0, 9.0, 7.0, 2.0, 1.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.9453125, -7.6815185546875, -7.417724609375, -7.1539306640625, -6.89013671875, -6.6263427734375, -6.362548828125, -6.0987548828125, -5.8349609375, -5.5711669921875, -5.307373046875, -5.0435791015625, -4.77978515625, -4.5159912109375, -4.252197265625, -3.9884033203125, -3.724609375, -3.4608154296875, -3.197021484375, -2.9332275390625, -2.66943359375, -2.4056396484375, -2.141845703125, -1.8780517578125, -1.6142578125, -1.3504638671875, -1.086669921875, -0.8228759765625, -0.55908203125, -0.2952880859375, -0.031494140625, 0.2322998046875, 0.49609375, 0.7598876953125, 1.023681640625, 1.2874755859375, 1.55126953125, 1.8150634765625, 2.078857421875, 2.3426513671875, 2.6064453125, 2.8702392578125, 3.134033203125, 3.3978271484375, 3.66162109375, 3.9254150390625, 4.189208984375, 4.4530029296875, 4.716796875, 4.9805908203125, 5.244384765625, 5.5081787109375, 5.77197265625, 6.0357666015625, 6.299560546875, 6.5633544921875, 6.8271484375, 7.0909423828125, 7.354736328125, 7.6185302734375, 7.88232421875, 8.1461181640625, 8.409912109375, 8.6737060546875, 8.9375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 6.0, 16.0, 9.0, 10.0, 15.0, 19.0, 22.0, 28.0, 47.0, 67.0, 92.0, 147.0, 247.0, 405.0, 981.0, 3352.0, 23011.0, 2669611.0, 429122.0, 14348.0, 2339.0, 807.0, 350.0, 232.0, 119.0, 80.0, 51.0, 42.0, 30.0, 17.0, 17.0, 10.0, 11.0, 8.0, 8.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-11.25, -10.9180908203125, -10.586181640625, -10.2542724609375, -9.92236328125, -9.5904541015625, -9.258544921875, -8.9266357421875, -8.5947265625, -8.2628173828125, -7.930908203125, -7.5989990234375, -7.26708984375, -6.9351806640625, -6.603271484375, -6.2713623046875, -5.939453125, -5.6075439453125, -5.275634765625, -4.9437255859375, -4.61181640625, -4.2799072265625, -3.947998046875, -3.6160888671875, -3.2841796875, -2.9522705078125, -2.620361328125, -2.2884521484375, -1.95654296875, -1.6246337890625, -1.292724609375, -0.9608154296875, -0.62890625, -0.2969970703125, 0.034912109375, 0.3668212890625, 0.69873046875, 1.0306396484375, 1.362548828125, 1.6944580078125, 2.0263671875, 2.3582763671875, 2.690185546875, 3.0220947265625, 3.35400390625, 3.6859130859375, 4.017822265625, 4.3497314453125, 4.681640625, 5.0135498046875, 5.345458984375, 5.6773681640625, 6.00927734375, 6.3411865234375, 6.673095703125, 7.0050048828125, 7.3369140625, 7.6688232421875, 8.000732421875, 8.3326416015625, 8.66455078125, 8.9964599609375, 9.328369140625, 9.6602783203125, 9.9921875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 734.0, 282.0, 1.0], "bins": [-292.466796875, -287.7378845214844, -283.0090026855469, -278.28009033203125, -273.55120849609375, -268.8222961425781, -264.0933837890625, -259.364501953125, -254.63558959960938, -249.9066925048828, -245.17779541015625, -240.44888305664062, -235.71998596191406, -230.9910888671875, -226.26219177246094, -221.53329467773438, -216.8043975830078, -212.07550048828125, -207.3466033935547, -202.61769104003906, -197.8887939453125, -193.15989685058594, -188.43099975585938, -183.7021026611328, -178.97320556640625, -174.2443084716797, -169.51541137695312, -164.7864990234375, -160.05760192871094, -155.32870483398438, -150.5998077392578, -145.87091064453125, -141.14199829101562, -136.41310119628906, -131.6842041015625, -126.9552993774414, -122.22639465332031, -117.49749755859375, -112.76860046386719, -108.03970336914062, -103.31079864501953, -98.58190155029297, -93.85299682617188, -89.12409973144531, -84.39520263671875, -79.66629791259766, -74.9374008178711, -70.20849609375, -65.47959899902344, -60.75069808959961, -56.02179718017578, -51.29290008544922, -46.56399917602539, -41.83509826660156, -37.106201171875, -32.37730026245117, -27.648401260375977, -22.91950225830078, -18.190601348876953, -13.461701393127441, -8.73280143737793, -4.003900527954102, 0.7249984741210938, 5.453897476196289, 10.182798385620117]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 8.0, 1.0, 3.0, 7.0, 8.0, 10.0, 16.0, 14.0, 18.0, 22.0, 18.0, 22.0, 22.0, 21.0, 20.0, 22.0, 38.0, 36.0, 24.0, 42.0, 30.0, 37.0, 29.0, 46.0, 29.0, 32.0, 42.0, 43.0, 38.0, 34.0, 27.0, 27.0, 20.0, 28.0, 24.0, 26.0, 23.0, 14.0, 13.0, 15.0, 10.0, 8.0, 8.0, 5.0, 7.0, 6.0, 6.0, 5.0, 0.0, 3.0, 4.0, 0.0, 1.0], "bins": [-21.769140243530273, -21.129335403442383, -20.489532470703125, -19.849727630615234, -19.209924697875977, -18.570119857788086, -17.930316925048828, -17.290512084960938, -16.650707244873047, -16.010902404785156, -15.371099472045898, -14.731295585632324, -14.09149169921875, -13.45168685913086, -12.811882972717285, -12.172079086303711, -11.532276153564453, -10.892472267150879, -10.252668380737305, -9.61286449432373, -8.973060607910156, -8.333255767822266, -7.693451881408691, -7.053647994995117, -6.413844108581543, -5.774040222167969, -5.1342363357543945, -4.494431972503662, -3.854628086090088, -3.2148241996765137, -2.5750200748443604, -1.935215950012207, -1.2954120635986328, -0.655608057975769, -0.015804052352905273, 0.6239999532699585, 1.2638039588928223, 1.9036078453063965, 2.54341197013855, 3.183216094970703, 3.8230199813842773, 4.462823867797852, 5.102627754211426, 5.742432117462158, 6.382236003875732, 7.022039890289307, 7.661844253540039, 8.301648139953613, 8.941452026367188, 9.581255912780762, 10.221059799194336, 10.86086368560791, 11.500667572021484, 12.140472412109375, 12.78027629852295, 13.420080184936523, 14.059884071350098, 14.699687957763672, 15.339491844177246, 15.97929573059082, 16.61910057067871, 17.25890350341797, 17.89870834350586, 18.53851318359375, 19.178316116333008]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 9.0, 8.0, 10.0, 12.0, 9.0, 8.0, 8.0, 16.0, 24.0, 24.0, 29.0, 39.0, 52.0, 44.0, 42.0, 50.0, 48.0, 46.0, 65.0, 56.0, 54.0, 48.0, 48.0, 49.0, 44.0, 33.0, 20.0, 25.0, 15.0, 22.0, 14.0, 11.0, 5.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.787109375, -2.711669921875, -2.63623046875, -2.560791015625, -2.4853515625, -2.409912109375, -2.33447265625, -2.259033203125, -2.18359375, -2.108154296875, -2.03271484375, -1.957275390625, -1.8818359375, -1.806396484375, -1.73095703125, -1.655517578125, -1.580078125, -1.504638671875, -1.42919921875, -1.353759765625, -1.2783203125, -1.202880859375, -1.12744140625, -1.052001953125, -0.9765625, -0.901123046875, -0.82568359375, -0.750244140625, -0.6748046875, -0.599365234375, -0.52392578125, -0.448486328125, -0.373046875, -0.297607421875, -0.22216796875, -0.146728515625, -0.0712890625, 0.004150390625, 0.07958984375, 0.155029296875, 0.23046875, 0.305908203125, 0.38134765625, 0.456787109375, 0.5322265625, 0.607666015625, 0.68310546875, 0.758544921875, 0.833984375, 0.909423828125, 0.98486328125, 1.060302734375, 1.1357421875, 1.211181640625, 1.28662109375, 1.362060546875, 1.4375, 1.512939453125, 1.58837890625, 1.663818359375, 1.7392578125, 1.814697265625, 1.89013671875, 1.965576171875, 2.041015625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 17.0, 12.0, 13.0, 20.0, 22.0, 35.0, 66.0, 127.0, 210.0, 486.0, 1144.0, 3100.0, 9495.0, 34004.0, 150617.0, 1156212.0, 2426968.0, 324908.0, 62266.0, 16302.0, 4927.0, 1816.0, 709.0, 357.0, 171.0, 99.0, 47.0, 35.0, 26.0, 19.0, 13.0, 10.0, 3.0, 5.0, 6.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.87109375, -6.68646240234375, -6.5018310546875, -6.31719970703125, -6.132568359375, -5.94793701171875, -5.7633056640625, -5.57867431640625, -5.39404296875, -5.20941162109375, -5.0247802734375, -4.84014892578125, -4.655517578125, -4.47088623046875, -4.2862548828125, -4.10162353515625, -3.9169921875, -3.73236083984375, -3.5477294921875, -3.36309814453125, -3.178466796875, -2.99383544921875, -2.8092041015625, -2.62457275390625, -2.43994140625, -2.25531005859375, -2.0706787109375, -1.88604736328125, -1.701416015625, -1.51678466796875, -1.3321533203125, -1.14752197265625, -0.962890625, -0.77825927734375, -0.5936279296875, -0.40899658203125, -0.224365234375, -0.03973388671875, 0.1448974609375, 0.32952880859375, 0.51416015625, 0.69879150390625, 0.8834228515625, 1.06805419921875, 1.252685546875, 1.43731689453125, 1.6219482421875, 1.80657958984375, 1.9912109375, 2.17584228515625, 2.3604736328125, 2.54510498046875, 2.729736328125, 2.91436767578125, 3.0989990234375, 3.28363037109375, 3.46826171875, 3.65289306640625, 3.8375244140625, 4.02215576171875, 4.206787109375, 4.39141845703125, 4.5760498046875, 4.76068115234375, 4.9453125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 11.0, 5.0, 16.0, 21.0, 20.0, 25.0, 44.0, 69.0, 96.0, 132.0, 211.0, 343.0, 473.0, 563.0, 572.0, 432.0, 335.0, 224.0, 148.0, 94.0, 78.0, 54.0, 38.0, 20.0, 19.0, 11.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.1875, -8.9576416015625, -8.727783203125, -8.4979248046875, -8.26806640625, -8.0382080078125, -7.808349609375, -7.5784912109375, -7.3486328125, -7.1187744140625, -6.888916015625, -6.6590576171875, -6.42919921875, -6.1993408203125, -5.969482421875, -5.7396240234375, -5.509765625, -5.2799072265625, -5.050048828125, -4.8201904296875, -4.59033203125, -4.3604736328125, -4.130615234375, -3.9007568359375, -3.6708984375, -3.4410400390625, -3.211181640625, -2.9813232421875, -2.75146484375, -2.5216064453125, -2.291748046875, -2.0618896484375, -1.83203125, -1.6021728515625, -1.372314453125, -1.1424560546875, -0.91259765625, -0.6827392578125, -0.452880859375, -0.2230224609375, 0.0068359375, 0.2366943359375, 0.466552734375, 0.6964111328125, 0.92626953125, 1.1561279296875, 1.385986328125, 1.6158447265625, 1.845703125, 2.0755615234375, 2.305419921875, 2.5352783203125, 2.76513671875, 2.9949951171875, 3.224853515625, 3.4547119140625, 3.6845703125, 3.9144287109375, 4.144287109375, 4.3741455078125, 4.60400390625, 4.8338623046875, 5.063720703125, 5.2935791015625, 5.5234375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 17.0, 30.0, 38.0, 69.0, 113.0, 226.0, 363.0, 844.0, 2212.0, 8960.0, 62659.0, 813458.0, 3031703.0, 241598.0, 24755.0, 4599.0, 1402.0, 592.0, 274.0, 135.0, 92.0, 56.0, 32.0, 24.0, 10.0, 10.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.5859375, -13.1219482421875, -12.657958984375, -12.1939697265625, -11.72998046875, -11.2659912109375, -10.802001953125, -10.3380126953125, -9.8740234375, -9.4100341796875, -8.946044921875, -8.4820556640625, -8.01806640625, -7.5540771484375, -7.090087890625, -6.6260986328125, -6.162109375, -5.6981201171875, -5.234130859375, -4.7701416015625, -4.30615234375, -3.8421630859375, -3.378173828125, -2.9141845703125, -2.4501953125, -1.9862060546875, -1.522216796875, -1.0582275390625, -0.59423828125, -0.1302490234375, 0.333740234375, 0.7977294921875, 1.26171875, 1.7257080078125, 2.189697265625, 2.6536865234375, 3.11767578125, 3.5816650390625, 4.045654296875, 4.5096435546875, 4.9736328125, 5.4376220703125, 5.901611328125, 6.3656005859375, 6.82958984375, 7.2935791015625, 7.757568359375, 8.2215576171875, 8.685546875, 9.1495361328125, 9.613525390625, 10.0775146484375, 10.54150390625, 11.0054931640625, 11.469482421875, 11.9334716796875, 12.3974609375, 12.8614501953125, 13.325439453125, 13.7894287109375, 14.25341796875, 14.7174072265625, 15.181396484375, 15.6453857421875, 16.109375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 8.0, 16.0, 22.0, 51.0, 76.0, 88.0, 120.0, 135.0, 148.0, 122.0, 69.0, 63.0, 38.0, 21.0, 12.0, 8.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.174633026123047, -26.935260772705078, -25.69588851928711, -24.45651626586914, -23.217144012451172, -21.977771759033203, -20.738399505615234, -19.499027252197266, -18.259654998779297, -17.020282745361328, -15.78091049194336, -14.54153823852539, -13.302165985107422, -12.062793731689453, -10.823421478271484, -9.584049224853516, -8.344676971435547, -7.105304718017578, -5.865932464599609, -4.626560211181641, -3.387187957763672, -2.147815704345703, -0.9084434509277344, 0.3309288024902344, 1.5703010559082031, 2.809673309326172, 4.049045562744141, 5.288417816162109, 6.527790069580078, 7.767162322998047, 9.006534576416016, 10.245906829833984, 11.485282897949219, 12.724655151367188, 13.964027404785156, 15.203399658203125, 16.442771911621094, 17.682144165039062, 18.92151641845703, 20.160888671875, 21.40026092529297, 22.639633178710938, 23.879005432128906, 25.118377685546875, 26.357749938964844, 27.597122192382812, 28.83649444580078, 30.07586669921875, 31.31523895263672, 32.55461120605469, 33.793983459472656, 35.033355712890625, 36.272727966308594, 37.51210021972656, 38.75147247314453, 39.9908447265625, 41.23021697998047, 42.46958923339844, 43.708961486816406, 44.948333740234375, 46.187705993652344, 47.42707824707031, 48.66645050048828, 49.90582275390625, 51.14519500732422]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 2.0, 7.0, 6.0, 9.0, 10.0, 16.0, 15.0, 10.0, 18.0, 18.0, 22.0, 32.0, 30.0, 40.0, 29.0, 39.0, 47.0, 41.0, 36.0, 31.0, 52.0, 47.0, 50.0, 51.0, 43.0, 34.0, 40.0, 28.0, 20.0, 27.0, 27.0, 19.0, 18.0, 21.0, 12.0, 13.0, 8.0, 8.0, 11.0, 7.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.300743103027344, -20.645584106445312, -19.99042320251465, -19.335264205932617, -18.680103302001953, -18.024944305419922, -17.36978530883789, -16.71462631225586, -16.059465408325195, -15.404305458068848, -14.7491455078125, -14.093986511230469, -13.438826560974121, -12.783666610717773, -12.128507614135742, -11.473347663879395, -10.818187713623047, -10.1630277633667, -9.507867813110352, -8.85270881652832, -8.197548866271973, -7.542388916015625, -6.8872294425964355, -6.232069969177246, -5.576910018920898, -4.921750068664551, -4.266590595245361, -3.6114308834075928, -2.956271171569824, -2.3011114597320557, -1.645951747894287, -0.9907922744750977, -0.33563232421875, 0.31952738761901855, 0.9746870994567871, 1.6298468112945557, 2.285006523132324, 2.9401662349700928, 3.5953259468078613, 4.250485420227051, 4.905645370483398, 5.560805320739746, 6.2159647941589355, 6.871124267578125, 7.526284217834473, 8.18144416809082, 8.836603164672852, 9.4917631149292, 10.146923065185547, 10.802083015441895, 11.457242965698242, 12.112401962280273, 12.767561912536621, 13.422721862792969, 14.077880859375, 14.733040809631348, 15.388200759887695, 16.043359756469727, 16.69852066040039, 17.353679656982422, 18.008838653564453, 18.663999557495117, 19.31915855407715, 19.974319458007812, 20.629478454589844]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 6.0, 14.0, 11.0, 10.0, 7.0, 17.0, 19.0, 21.0, 22.0, 32.0, 39.0, 42.0, 47.0, 38.0, 43.0, 52.0, 56.0, 54.0, 56.0, 46.0, 38.0, 50.0, 40.0, 45.0, 32.0, 35.0, 22.0, 19.0, 20.0, 16.0, 12.0, 14.0, 8.0, 5.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.630859375, -2.5557861328125, -2.480712890625, -2.4056396484375, -2.33056640625, -2.2554931640625, -2.180419921875, -2.1053466796875, -2.0302734375, -1.9552001953125, -1.880126953125, -1.8050537109375, -1.72998046875, -1.6549072265625, -1.579833984375, -1.5047607421875, -1.4296875, -1.3546142578125, -1.279541015625, -1.2044677734375, -1.12939453125, -1.0543212890625, -0.979248046875, -0.9041748046875, -0.8291015625, -0.7540283203125, -0.678955078125, -0.6038818359375, -0.52880859375, -0.4537353515625, -0.378662109375, -0.3035888671875, -0.228515625, -0.1534423828125, -0.078369140625, -0.0032958984375, 0.07177734375, 0.1468505859375, 0.221923828125, 0.2969970703125, 0.3720703125, 0.4471435546875, 0.522216796875, 0.5972900390625, 0.67236328125, 0.7474365234375, 0.822509765625, 0.8975830078125, 0.97265625, 1.0477294921875, 1.122802734375, 1.1978759765625, 1.27294921875, 1.3480224609375, 1.423095703125, 1.4981689453125, 1.5732421875, 1.6483154296875, 1.723388671875, 1.7984619140625, 1.87353515625, 1.9486083984375, 2.023681640625, 2.0987548828125, 2.173828125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 8.0, 14.0, 18.0, 23.0, 28.0, 65.0, 79.0, 123.0, 213.0, 349.0, 516.0, 825.0, 1340.0, 1955.0, 3110.0, 4808.0, 7814.0, 12557.0, 20268.0, 34231.0, 59463.0, 112473.0, 320617.0, 243186.0, 94681.0, 51462.0, 30040.0, 17862.0, 11138.0, 7071.0, 4385.0, 2882.0, 1790.0, 1129.0, 733.0, 473.0, 304.0, 181.0, 112.0, 77.0, 47.0, 23.0, 29.0, 17.0, 8.0, 6.0, 2.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.01385498046875, -0.013433575630187988, -0.013012170791625977, -0.012590765953063965, -0.012169361114501953, -0.011747956275939941, -0.01132655143737793, -0.010905146598815918, -0.010483741760253906, -0.010062336921691895, -0.009640932083129883, -0.009219527244567871, -0.00879812240600586, -0.008376717567443848, -0.007955312728881836, -0.007533907890319824, -0.0071125030517578125, -0.006691098213195801, -0.006269693374633789, -0.005848288536071777, -0.005426883697509766, -0.005005478858947754, -0.004584074020385742, -0.0041626691818237305, -0.0037412643432617188, -0.003319859504699707, -0.0028984546661376953, -0.0024770498275756836, -0.002055644989013672, -0.0016342401504516602, -0.0012128353118896484, -0.0007914304733276367, -0.000370025634765625, 5.137920379638672e-05, 0.00047278404235839844, 0.0008941888809204102, 0.0013155937194824219, 0.0017369985580444336, 0.0021584033966064453, 0.002579808235168457, 0.0030012130737304688, 0.0034226179122924805, 0.003844022750854492, 0.004265427589416504, 0.004686832427978516, 0.005108237266540527, 0.005529642105102539, 0.005951046943664551, 0.0063724517822265625, 0.006793856620788574, 0.007215261459350586, 0.007636666297912598, 0.00805807113647461, 0.008479475975036621, 0.008900880813598633, 0.009322285652160645, 0.009743690490722656, 0.010165095329284668, 0.01058650016784668, 0.011007905006408691, 0.011429309844970703, 0.011850714683532715, 0.012272119522094727, 0.012693524360656738, 0.01311492919921875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 11.0, 16.0, 12.0, 12.0, 27.0, 21.0, 29.0, 30.0, 34.0, 40.0, 38.0, 36.0, 38.0, 45.0, 42.0, 1078.0, 38.0, 46.0, 50.0, 40.0, 32.0, 50.0, 44.0, 21.0, 26.0, 22.0, 27.0, 24.0, 20.0, 16.0, 8.0, 8.0, 9.0, 9.0, 6.0, 7.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0], "bins": [-1.740234375, -1.6942138671875, -1.648193359375, -1.6021728515625, -1.55615234375, -1.5101318359375, -1.464111328125, -1.4180908203125, -1.3720703125, -1.3260498046875, -1.280029296875, -1.2340087890625, -1.18798828125, -1.1419677734375, -1.095947265625, -1.0499267578125, -1.00390625, -0.9578857421875, -0.911865234375, -0.8658447265625, -0.81982421875, -0.7738037109375, -0.727783203125, -0.6817626953125, -0.6357421875, -0.5897216796875, -0.543701171875, -0.4976806640625, -0.45166015625, -0.4056396484375, -0.359619140625, -0.3135986328125, -0.267578125, -0.2215576171875, -0.175537109375, -0.1295166015625, -0.08349609375, -0.0374755859375, 0.008544921875, 0.0545654296875, 0.1005859375, 0.1466064453125, 0.192626953125, 0.2386474609375, 0.28466796875, 0.3306884765625, 0.376708984375, 0.4227294921875, 0.46875, 0.5147705078125, 0.560791015625, 0.6068115234375, 0.65283203125, 0.6988525390625, 0.744873046875, 0.7908935546875, 0.8369140625, 0.8829345703125, 0.928955078125, 0.9749755859375, 1.02099609375, 1.0670166015625, 1.113037109375, 1.1590576171875, 1.205078125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 13.0, 5.0, 8.0, 21.0, 34.0, 54.0, 69.0, 117.0, 220.0, 349.0, 589.0, 972.0, 1752.0, 2759.0, 5069.0, 8621.0, 15150.0, 27375.0, 50093.0, 95903.0, 227885.0, 1382660.0, 131264.0, 65419.0, 35183.0, 19437.0, 10828.0, 6288.0, 3648.0, 2097.0, 1246.0, 758.0, 471.0, 278.0, 174.0, 128.0, 82.0, 38.0, 22.0, 13.0, 14.0, 15.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00922393798828125, -0.0089186429977417, -0.008613348007202148, -0.008308053016662598, -0.008002758026123047, -0.007697463035583496, -0.007392168045043945, -0.0070868730545043945, -0.006781578063964844, -0.006476283073425293, -0.006170988082885742, -0.005865693092346191, -0.005560398101806641, -0.00525510311126709, -0.004949808120727539, -0.004644513130187988, -0.0043392181396484375, -0.004033923149108887, -0.003728628158569336, -0.003423333168029785, -0.0031180381774902344, -0.0028127431869506836, -0.002507448196411133, -0.002202153205871582, -0.0018968582153320312, -0.0015915632247924805, -0.0012862682342529297, -0.000980973243713379, -0.0006756782531738281, -0.00037038326263427734, -6.508827209472656e-05, 0.00024020671844482422, 0.000545501708984375, 0.0008507966995239258, 0.0011560916900634766, 0.0014613866806030273, 0.0017666816711425781, 0.002071976661682129, 0.0023772716522216797, 0.0026825666427612305, 0.0029878616333007812, 0.003293156623840332, 0.003598451614379883, 0.0039037466049194336, 0.004209041595458984, 0.004514336585998535, 0.004819631576538086, 0.005124926567077637, 0.0054302215576171875, 0.005735516548156738, 0.006040811538696289, 0.00634610652923584, 0.006651401519775391, 0.006956696510314941, 0.007261991500854492, 0.007567286491394043, 0.007872581481933594, 0.008177876472473145, 0.008483171463012695, 0.008788466453552246, 0.009093761444091797, 0.009399056434631348, 0.009704351425170898, 0.01000964641571045, 0.01031494140625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 979.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 7.0, 20.0, 1.0, 0.0, 4.0, 2.0, 5.0, 0.0, 13.0, 40.0, 55.0, 0.0, 313.0, 2397.0, 10804.0, 0.0, 1021150.0, 10988.0, 2288.0, 0.0, 315.0, 72.0, 37.0, 0.0, 24.0, 4.0, 3.0, 0.0, 3.0, 0.0, 11.0, 0.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.430511474609375e-06, -1.385807991027832e-06, -1.341104507446289e-06, -1.296401023864746e-06, -1.2516975402832031e-06, -1.2069940567016602e-06, -1.1622905731201172e-06, -1.1175870895385742e-06, -1.0728836059570312e-06, -1.0281801223754883e-06, -9.834766387939453e-07, -9.387731552124023e-07, -8.940696716308594e-07, -8.493661880493164e-07, -8.046627044677734e-07, -7.599592208862305e-07, -7.152557373046875e-07, -6.705522537231445e-07, -6.258487701416016e-07, -5.811452865600586e-07, -5.364418029785156e-07, -4.917383193969727e-07, -4.470348358154297e-07, -4.023313522338867e-07, -3.5762786865234375e-07, -3.129243850708008e-07, -2.682209014892578e-07, -2.2351741790771484e-07, -1.7881393432617188e-07, -1.341104507446289e-07, -8.940696716308594e-08, -4.470348358154297e-08, 0.0, 4.470348358154297e-08, 8.940696716308594e-08, 1.341104507446289e-07, 1.7881393432617188e-07, 2.2351741790771484e-07, 2.682209014892578e-07, 3.129243850708008e-07, 3.5762786865234375e-07, 4.023313522338867e-07, 4.470348358154297e-07, 4.917383193969727e-07, 5.364418029785156e-07, 5.811452865600586e-07, 6.258487701416016e-07, 6.705522537231445e-07, 7.152557373046875e-07, 7.599592208862305e-07, 8.046627044677734e-07, 8.493661880493164e-07, 8.940696716308594e-07, 9.387731552124023e-07, 9.834766387939453e-07, 1.0281801223754883e-06, 1.0728836059570312e-06, 1.1175870895385742e-06, 1.1622905731201172e-06, 1.2069940567016602e-06, 1.2516975402832031e-06, 1.296401023864746e-06, 1.341104507446289e-06, 1.385807991027832e-06, 1.430511474609375e-06]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 6.0, 14.0, 11.0, 10.0, 7.0, 17.0, 19.0, 21.0, 22.0, 32.0, 39.0, 42.0, 47.0, 38.0, 43.0, 52.0, 56.0, 54.0, 56.0, 46.0, 38.0, 50.0, 40.0, 45.0, 32.0, 35.0, 22.0, 19.0, 20.0, 16.0, 12.0, 14.0, 8.0, 5.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.630859375, -2.5557861328125, -2.480712890625, -2.4056396484375, -2.33056640625, -2.2554931640625, -2.180419921875, -2.1053466796875, -2.0302734375, -1.9552001953125, -1.880126953125, -1.8050537109375, -1.72998046875, -1.6549072265625, -1.579833984375, -1.5047607421875, -1.4296875, -1.3546142578125, -1.279541015625, -1.2044677734375, -1.12939453125, -1.0543212890625, -0.979248046875, -0.9041748046875, -0.8291015625, -0.7540283203125, -0.678955078125, -0.6038818359375, -0.52880859375, -0.4537353515625, -0.378662109375, -0.3035888671875, -0.228515625, -0.1534423828125, -0.078369140625, -0.0032958984375, 0.07177734375, 0.1468505859375, 0.221923828125, 0.2969970703125, 0.3720703125, 0.4471435546875, 0.522216796875, 0.5972900390625, 0.67236328125, 0.7474365234375, 0.822509765625, 0.8975830078125, 0.97265625, 1.0477294921875, 1.122802734375, 1.1978759765625, 1.27294921875, 1.3480224609375, 1.423095703125, 1.4981689453125, 1.5732421875, 1.6483154296875, 1.723388671875, 1.7984619140625, 1.87353515625, 1.9486083984375, 2.023681640625, 2.0987548828125, 2.173828125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 9.0, 7.0, 13.0, 15.0, 22.0, 27.0, 51.0, 77.0, 85.0, 107.0, 181.0, 272.0, 379.0, 552.0, 844.0, 1183.0, 1778.0, 2760.0, 4125.0, 6688.0, 10928.0, 19352.0, 35285.0, 72605.0, 188407.0, 406711.0, 155979.0, 63079.0, 31560.0, 17650.0, 10146.0, 6196.0, 3836.0, 2480.0, 1725.0, 1072.0, 728.0, 461.0, 369.0, 204.0, 176.0, 132.0, 80.0, 54.0, 53.0, 36.0, 17.0, 20.0, 9.0, 12.0, 6.0, 5.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.4365234375, -1.3907928466796875, -1.345062255859375, -1.2993316650390625, -1.25360107421875, -1.2078704833984375, -1.162139892578125, -1.1164093017578125, -1.0706787109375, -1.0249481201171875, -0.979217529296875, -0.9334869384765625, -0.88775634765625, -0.8420257568359375, -0.796295166015625, -0.7505645751953125, -0.704833984375, -0.6591033935546875, -0.613372802734375, -0.5676422119140625, -0.52191162109375, -0.4761810302734375, -0.430450439453125, -0.3847198486328125, -0.3389892578125, -0.2932586669921875, -0.247528076171875, -0.2017974853515625, -0.15606689453125, -0.1103363037109375, -0.064605712890625, -0.0188751220703125, 0.02685546875, 0.0725860595703125, 0.118316650390625, 0.1640472412109375, 0.20977783203125, 0.2555084228515625, 0.301239013671875, 0.3469696044921875, 0.3927001953125, 0.4384307861328125, 0.484161376953125, 0.5298919677734375, 0.57562255859375, 0.6213531494140625, 0.667083740234375, 0.7128143310546875, 0.758544921875, 0.8042755126953125, 0.850006103515625, 0.8957366943359375, 0.94146728515625, 0.9871978759765625, 1.032928466796875, 1.0786590576171875, 1.1243896484375, 1.1701202392578125, 1.215850830078125, 1.2615814208984375, 1.30731201171875, 1.3530426025390625, 1.398773193359375, 1.4445037841796875, 1.490234375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 5.0, 10.0, 10.0, 9.0, 13.0, 9.0, 17.0, 16.0, 25.0, 25.0, 42.0, 25.0, 31.0, 35.0, 46.0, 62.0, 75.0, 75.0, 245.0, 1613.0, 147.0, 90.0, 54.0, 47.0, 39.0, 42.0, 34.0, 25.0, 26.0, 29.0, 17.0, 20.0, 17.0, 17.0, 11.0, 9.0, 9.0, 7.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-7.8671875, -7.6383056640625, -7.409423828125, -7.1805419921875, -6.95166015625, -6.7227783203125, -6.493896484375, -6.2650146484375, -6.0361328125, -5.8072509765625, -5.578369140625, -5.3494873046875, -5.12060546875, -4.8917236328125, -4.662841796875, -4.4339599609375, -4.205078125, -3.9761962890625, -3.747314453125, -3.5184326171875, -3.28955078125, -3.0606689453125, -2.831787109375, -2.6029052734375, -2.3740234375, -2.1451416015625, -1.916259765625, -1.6873779296875, -1.45849609375, -1.2296142578125, -1.000732421875, -0.7718505859375, -0.54296875, -0.3140869140625, -0.085205078125, 0.1436767578125, 0.37255859375, 0.6014404296875, 0.830322265625, 1.0592041015625, 1.2880859375, 1.5169677734375, 1.745849609375, 1.9747314453125, 2.20361328125, 2.4324951171875, 2.661376953125, 2.8902587890625, 3.119140625, 3.3480224609375, 3.576904296875, 3.8057861328125, 4.03466796875, 4.2635498046875, 4.492431640625, 4.7213134765625, 4.9501953125, 5.1790771484375, 5.407958984375, 5.6368408203125, 5.86572265625, 6.0946044921875, 6.323486328125, 6.5523681640625, 6.78125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 11.0, 12.0, 9.0, 19.0, 11.0, 20.0, 22.0, 34.0, 37.0, 54.0, 69.0, 127.0, 167.0, 320.0, 607.0, 1645.0, 8426.0, 102324.0, 2909526.0, 110297.0, 8679.0, 1686.0, 623.0, 361.0, 186.0, 106.0, 68.0, 49.0, 49.0, 31.0, 23.0, 15.0, 15.0, 11.0, 11.0, 9.0, 11.0, 9.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-10.3125, -9.9852294921875, -9.657958984375, -9.3306884765625, -9.00341796875, -8.6761474609375, -8.348876953125, -8.0216064453125, -7.6943359375, -7.3670654296875, -7.039794921875, -6.7125244140625, -6.38525390625, -6.0579833984375, -5.730712890625, -5.4034423828125, -5.076171875, -4.7489013671875, -4.421630859375, -4.0943603515625, -3.76708984375, -3.4398193359375, -3.112548828125, -2.7852783203125, -2.4580078125, -2.1307373046875, -1.803466796875, -1.4761962890625, -1.14892578125, -0.8216552734375, -0.494384765625, -0.1671142578125, 0.16015625, 0.4874267578125, 0.814697265625, 1.1419677734375, 1.46923828125, 1.7965087890625, 2.123779296875, 2.4510498046875, 2.7783203125, 3.1055908203125, 3.432861328125, 3.7601318359375, 4.08740234375, 4.4146728515625, 4.741943359375, 5.0692138671875, 5.396484375, 5.7237548828125, 6.051025390625, 6.3782958984375, 6.70556640625, 7.0328369140625, 7.360107421875, 7.6873779296875, 8.0146484375, 8.3419189453125, 8.669189453125, 8.9964599609375, 9.32373046875, 9.6510009765625, 9.978271484375, 10.3055419921875, 10.6328125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [104.0, 905.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9601569175720215, -1.7863740921020508, 3.38740873336792, 8.56119155883789, 13.734973907470703, 18.908756256103516, 24.08254051208496, 29.256322860717773, 34.43010711669922, 39.60388946533203, 44.777671813964844, 49.951454162597656, 55.12523651123047, 60.29901885986328, 65.47280883789062, 70.64659118652344, 75.82036590576172, 80.99414825439453, 86.16793060302734, 91.34171295166016, 96.51549530029297, 101.68927764892578, 106.86306762695312, 112.03684997558594, 117.21063232421875, 122.38441467285156, 127.55819702148438, 132.7319793701172, 137.90576171875, 143.0795440673828, 148.25332641601562, 153.42710876464844, 158.6009063720703, 163.77468872070312, 168.94847106933594, 174.12225341796875, 179.29603576660156, 184.46981811523438, 189.6436004638672, 194.8173828125, 199.9911651611328, 205.16494750976562, 210.33872985839844, 215.51251220703125, 220.68629455566406, 225.86007690429688, 231.0338592529297, 236.2076416015625, 241.38143920898438, 246.5552215576172, 251.72900390625, 256.9028015136719, 262.0765686035156, 267.2503662109375, 272.42413330078125, 277.5979309082031, 282.7716979980469, 287.94549560546875, 293.1192626953125, 298.2930603027344, 303.4668273925781, 308.640625, 313.81439208984375, 318.9881896972656, 324.1619567871094]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 8.0, 14.0, 11.0, 20.0, 11.0, 23.0, 24.0, 19.0, 30.0, 32.0, 37.0, 37.0, 45.0, 35.0, 45.0, 28.0, 51.0, 45.0, 43.0, 43.0, 37.0, 36.0, 35.0, 48.0, 38.0, 30.0, 26.0, 37.0, 18.0, 16.0, 8.0, 14.0, 11.0, 11.0, 6.0, 5.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-30.54470443725586, -29.739673614501953, -28.934642791748047, -28.12961196899414, -27.324583053588867, -26.51955223083496, -25.714521408081055, -24.90949058532715, -24.104461669921875, -23.29943084716797, -22.494400024414062, -21.689369201660156, -20.884340286254883, -20.079309463500977, -19.27427864074707, -18.469247817993164, -17.664216995239258, -16.85918617248535, -16.054155349731445, -15.249125480651855, -14.444095611572266, -13.63906478881836, -12.834033966064453, -12.029003143310547, -11.223973274230957, -10.41894245147705, -9.613912582397461, -8.808881759643555, -8.003850936889648, -7.198821067810059, -6.393790245056152, -5.588759899139404, -4.783731460571289, -3.978701114654541, -3.173670530319214, -2.3686399459838867, -1.5636096000671387, -0.7585792541503906, 0.046451568603515625, 0.8514819145202637, 1.6565122604370117, 2.4615426063537598, 3.266573190689087, 4.071603775024414, 4.876634120941162, 5.68166446685791, 6.486695289611816, 7.2917256355285645, 8.096755981445312, 8.901786804199219, 9.706816673278809, 10.511847496032715, 11.316877365112305, 12.121908187866211, 12.926939010620117, 13.731969833374023, 14.536999702453613, 15.34203052520752, 16.14706039428711, 16.952091217041016, 17.757122039794922, 18.562152862548828, 19.367183685302734, 20.172212600708008, 20.977243423461914]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 1.0, 10.0, 14.0, 13.0, 12.0, 9.0, 18.0, 26.0, 22.0, 31.0, 26.0, 46.0, 53.0, 47.0, 46.0, 36.0, 56.0, 51.0, 64.0, 36.0, 46.0, 48.0, 39.0, 52.0, 37.0, 32.0, 26.0, 15.0, 13.0, 23.0, 15.0, 9.0, 4.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.646484375, -2.569000244140625, -2.49151611328125, -2.414031982421875, -2.3365478515625, -2.259063720703125, -2.18157958984375, -2.104095458984375, -2.026611328125, -1.949127197265625, -1.87164306640625, -1.794158935546875, -1.7166748046875, -1.639190673828125, -1.56170654296875, -1.484222412109375, -1.40673828125, -1.329254150390625, -1.25177001953125, -1.174285888671875, -1.0968017578125, -1.019317626953125, -0.94183349609375, -0.864349365234375, -0.786865234375, -0.709381103515625, -0.63189697265625, -0.554412841796875, -0.4769287109375, -0.399444580078125, -0.32196044921875, -0.244476318359375, -0.1669921875, -0.089508056640625, -0.01202392578125, 0.065460205078125, 0.1429443359375, 0.220428466796875, 0.29791259765625, 0.375396728515625, 0.452880859375, 0.530364990234375, 0.60784912109375, 0.685333251953125, 0.7628173828125, 0.840301513671875, 0.91778564453125, 0.995269775390625, 1.07275390625, 1.150238037109375, 1.22772216796875, 1.305206298828125, 1.3826904296875, 1.460174560546875, 1.53765869140625, 1.615142822265625, 1.692626953125, 1.770111083984375, 1.84759521484375, 1.925079345703125, 2.0025634765625, 2.080047607421875, 2.15753173828125, 2.235015869140625, 2.3125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 4.0, 5.0, 9.0, 11.0, 9.0, 11.0, 19.0, 16.0, 24.0, 23.0, 37.0, 78.0, 119.0, 228.0, 552.0, 1451.0, 4559.0, 16578.0, 70848.0, 463659.0, 2806713.0, 705475.0, 93968.0, 21088.0, 5619.0, 1841.0, 644.0, 296.0, 121.0, 77.0, 50.0, 41.0, 23.0, 14.0, 20.0, 13.0, 8.0, 12.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.44140625, -7.2322998046875, -7.023193359375, -6.8140869140625, -6.60498046875, -6.3958740234375, -6.186767578125, -5.9776611328125, -5.7685546875, -5.5594482421875, -5.350341796875, -5.1412353515625, -4.93212890625, -4.7230224609375, -4.513916015625, -4.3048095703125, -4.095703125, -3.8865966796875, -3.677490234375, -3.4683837890625, -3.25927734375, -3.0501708984375, -2.841064453125, -2.6319580078125, -2.4228515625, -2.2137451171875, -2.004638671875, -1.7955322265625, -1.58642578125, -1.3773193359375, -1.168212890625, -0.9591064453125, -0.75, -0.5408935546875, -0.331787109375, -0.1226806640625, 0.08642578125, 0.2955322265625, 0.504638671875, 0.7137451171875, 0.9228515625, 1.1319580078125, 1.341064453125, 1.5501708984375, 1.75927734375, 1.9683837890625, 2.177490234375, 2.3865966796875, 2.595703125, 2.8048095703125, 3.013916015625, 3.2230224609375, 3.43212890625, 3.6412353515625, 3.850341796875, 4.0594482421875, 4.2685546875, 4.4776611328125, 4.686767578125, 4.8958740234375, 5.10498046875, 5.3140869140625, 5.523193359375, 5.7322998046875, 5.94140625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 10.0, 7.0, 21.0, 23.0, 64.0, 85.0, 157.0, 323.0, 562.0, 812.0, 760.0, 525.0, 333.0, 175.0, 93.0, 67.0, 28.0, 12.0, 10.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.75, -11.4044189453125, -11.058837890625, -10.7132568359375, -10.36767578125, -10.0220947265625, -9.676513671875, -9.3309326171875, -8.9853515625, -8.6397705078125, -8.294189453125, -7.9486083984375, -7.60302734375, -7.2574462890625, -6.911865234375, -6.5662841796875, -6.220703125, -5.8751220703125, -5.529541015625, -5.1839599609375, -4.83837890625, -4.4927978515625, -4.147216796875, -3.8016357421875, -3.4560546875, -3.1104736328125, -2.764892578125, -2.4193115234375, -2.07373046875, -1.7281494140625, -1.382568359375, -1.0369873046875, -0.69140625, -0.3458251953125, -0.000244140625, 0.3453369140625, 0.69091796875, 1.0364990234375, 1.382080078125, 1.7276611328125, 2.0732421875, 2.4188232421875, 2.764404296875, 3.1099853515625, 3.45556640625, 3.8011474609375, 4.146728515625, 4.4923095703125, 4.837890625, 5.1834716796875, 5.529052734375, 5.8746337890625, 6.22021484375, 6.5657958984375, 6.911376953125, 7.2569580078125, 7.6025390625, 7.9481201171875, 8.293701171875, 8.6392822265625, 8.98486328125, 9.3304443359375, 9.676025390625, 10.0216064453125, 10.3671875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 12.0, 25.0, 27.0, 50.0, 86.0, 129.0, 218.0, 364.0, 592.0, 1297.0, 4021.0, 22211.0, 254842.0, 3208463.0, 647882.0, 44151.0, 6320.0, 1728.0, 792.0, 426.0, 244.0, 138.0, 98.0, 63.0, 34.0, 25.0, 20.0, 8.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.515625, -15.0255126953125, -14.535400390625, -14.0452880859375, -13.55517578125, -13.0650634765625, -12.574951171875, -12.0848388671875, -11.5947265625, -11.1046142578125, -10.614501953125, -10.1243896484375, -9.63427734375, -9.1441650390625, -8.654052734375, -8.1639404296875, -7.673828125, -7.1837158203125, -6.693603515625, -6.2034912109375, -5.71337890625, -5.2232666015625, -4.733154296875, -4.2430419921875, -3.7529296875, -3.2628173828125, -2.772705078125, -2.2825927734375, -1.79248046875, -1.3023681640625, -0.812255859375, -0.3221435546875, 0.16796875, 0.6580810546875, 1.148193359375, 1.6383056640625, 2.12841796875, 2.6185302734375, 3.108642578125, 3.5987548828125, 4.0888671875, 4.5789794921875, 5.069091796875, 5.5592041015625, 6.04931640625, 6.5394287109375, 7.029541015625, 7.5196533203125, 8.009765625, 8.4998779296875, 8.989990234375, 9.4801025390625, 9.97021484375, 10.4603271484375, 10.950439453125, 11.4405517578125, 11.9306640625, 12.4207763671875, 12.910888671875, 13.4010009765625, 13.89111328125, 14.3812255859375, 14.871337890625, 15.3614501953125, 15.8515625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 10.0, 30.0, 60.0, 86.0, 164.0, 177.0, 179.0, 136.0, 92.0, 43.0, 24.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.16366958618164, -41.268028259277344, -39.37238693237305, -37.47674560546875, -35.58110809326172, -33.68546676635742, -31.789825439453125, -29.894184112548828, -27.998544692993164, -26.102903366088867, -24.207263946533203, -22.311622619628906, -20.41598129272461, -18.520341873168945, -16.62470054626465, -14.729060173034668, -12.833419799804688, -10.937779426574707, -9.042139053344727, -7.14649772644043, -5.250857353210449, -3.3552169799804688, -1.4595756530761719, 0.4360647201538086, 2.331705093383789, 4.2273454666137695, 6.122986316680908, 8.018627166748047, 9.914267539978027, 11.809907913208008, 13.705549240112305, 15.601189613342285, 17.496826171875, 19.392467498779297, 21.28810691833496, 23.183748245239258, 25.079387664794922, 26.97502899169922, 28.870670318603516, 30.766311645507812, 32.661949157714844, 34.55759048461914, 36.45323181152344, 38.34886932373047, 40.244510650634766, 42.14015197753906, 44.03579330444336, 45.931434631347656, 47.82707595825195, 49.72271728515625, 51.61835861206055, 53.513999938964844, 55.409637451171875, 57.30527877807617, 59.20092010498047, 61.096561431884766, 62.99220275878906, 64.8878402709961, 66.78348541259766, 68.67912292480469, 70.57476806640625, 72.47040557861328, 74.36604309082031, 76.26168823242188, 78.1573257446289]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 5.0, 8.0, 10.0, 11.0, 8.0, 8.0, 16.0, 15.0, 12.0, 15.0, 26.0, 22.0, 25.0, 35.0, 27.0, 28.0, 37.0, 36.0, 30.0, 37.0, 40.0, 43.0, 33.0, 32.0, 41.0, 37.0, 42.0, 31.0, 33.0, 28.0, 31.0, 33.0, 22.0, 20.0, 15.0, 24.0, 18.0, 6.0, 8.0, 15.0, 9.0, 7.0, 4.0, 3.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-20.6429443359375, -20.021011352539062, -19.399080276489258, -18.77714729309082, -18.155216217041016, -17.533283233642578, -16.91135025024414, -16.289417266845703, -15.667486190795898, -15.045554161071777, -14.423622131347656, -13.801689147949219, -13.179757118225098, -12.557825088500977, -11.935892105102539, -11.313960075378418, -10.692028045654297, -10.070096015930176, -9.448163986206055, -8.826231002807617, -8.204298973083496, -7.582366943359375, -6.960434436798096, -6.338501930236816, -5.716569900512695, -5.094637870788574, -4.472705364227295, -3.8507730960845947, -3.2288408279418945, -2.6069085597991943, -1.9849762916564941, -1.3630437850952148, -0.7411117553710938, -0.11917948722839355, 0.5027527809143066, 1.1246850490570068, 1.746617317199707, 2.3685495853424072, 2.9904818534851074, 3.6124143600463867, 4.234346389770508, 4.856278419494629, 5.478210926055908, 6.1001434326171875, 6.722075462341309, 7.34400749206543, 7.965939998626709, 8.587872505187988, 9.20980453491211, 9.83173656463623, 10.453668594360352, 11.075601577758789, 11.69753360748291, 12.319465637207031, 12.941398620605469, 13.56333065032959, 14.185262680053711, 14.807194709777832, 15.429126739501953, 16.05105972290039, 16.672992706298828, 17.294923782348633, 17.91685676574707, 18.538787841796875, 19.160720825195312]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 3.0, 2.0, 10.0, 8.0, 7.0, 11.0, 12.0, 16.0, 18.0, 19.0, 10.0, 31.0, 30.0, 24.0, 27.0, 44.0, 39.0, 48.0, 38.0, 21.0, 42.0, 42.0, 54.0, 49.0, 44.0, 37.0, 44.0, 35.0, 31.0, 42.0, 30.0, 24.0, 20.0, 15.0, 20.0, 13.0, 10.0, 6.0, 6.0, 7.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.150390625, -2.081634521484375, -2.01287841796875, -1.944122314453125, -1.8753662109375, -1.806610107421875, -1.73785400390625, -1.669097900390625, -1.600341796875, -1.531585693359375, -1.46282958984375, -1.394073486328125, -1.3253173828125, -1.256561279296875, -1.18780517578125, -1.119049072265625, -1.05029296875, -0.981536865234375, -0.91278076171875, -0.844024658203125, -0.7752685546875, -0.706512451171875, -0.63775634765625, -0.569000244140625, -0.500244140625, -0.431488037109375, -0.36273193359375, -0.293975830078125, -0.2252197265625, -0.156463623046875, -0.08770751953125, -0.018951416015625, 0.0498046875, 0.118560791015625, 0.18731689453125, 0.256072998046875, 0.3248291015625, 0.393585205078125, 0.46234130859375, 0.531097412109375, 0.599853515625, 0.668609619140625, 0.73736572265625, 0.806121826171875, 0.8748779296875, 0.943634033203125, 1.01239013671875, 1.081146240234375, 1.14990234375, 1.218658447265625, 1.28741455078125, 1.356170654296875, 1.4249267578125, 1.493682861328125, 1.56243896484375, 1.631195068359375, 1.699951171875, 1.768707275390625, 1.83746337890625, 1.906219482421875, 1.9749755859375, 2.043731689453125, 2.11248779296875, 2.181243896484375, 2.25]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 11.0, 6.0, 17.0, 29.0, 30.0, 53.0, 89.0, 131.0, 176.0, 272.0, 434.0, 639.0, 892.0, 1519.0, 2163.0, 3397.0, 5334.0, 8162.0, 13161.0, 21160.0, 35024.0, 60665.0, 114177.0, 287264.0, 249123.0, 103140.0, 55213.0, 32581.0, 19742.0, 12276.0, 7662.0, 4870.0, 3100.0, 2091.0, 1320.0, 832.0, 609.0, 404.0, 250.0, 184.0, 118.0, 84.0, 47.0, 35.0, 21.0, 20.0, 15.0, 7.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.01360321044921875, -0.013190031051635742, -0.012776851654052734, -0.012363672256469727, -0.011950492858886719, -0.011537313461303711, -0.011124134063720703, -0.010710954666137695, -0.010297775268554688, -0.00988459587097168, -0.009471416473388672, -0.009058237075805664, -0.008645057678222656, -0.008231878280639648, -0.00781869888305664, -0.007405519485473633, -0.006992340087890625, -0.006579160690307617, -0.006165981292724609, -0.0057528018951416016, -0.005339622497558594, -0.004926443099975586, -0.004513263702392578, -0.00410008430480957, -0.0036869049072265625, -0.0032737255096435547, -0.002860546112060547, -0.002447366714477539, -0.0020341873168945312, -0.0016210079193115234, -0.0012078285217285156, -0.0007946491241455078, -0.0003814697265625, 3.170967102050781e-05, 0.0004448890686035156, 0.0008580684661865234, 0.0012712478637695312, 0.001684427261352539, 0.002097606658935547, 0.0025107860565185547, 0.0029239654541015625, 0.0033371448516845703, 0.003750324249267578, 0.004163503646850586, 0.004576683044433594, 0.0049898624420166016, 0.005403041839599609, 0.005816221237182617, 0.006229400634765625, 0.006642580032348633, 0.007055759429931641, 0.0074689388275146484, 0.007882118225097656, 0.008295297622680664, 0.008708477020263672, 0.00912165641784668, 0.009534835815429688, 0.009948015213012695, 0.010361194610595703, 0.010774374008178711, 0.011187553405761719, 0.011600732803344727, 0.012013912200927734, 0.012427091598510742, 0.01284027099609375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 10.0, 12.0, 9.0, 19.0, 13.0, 12.0, 30.0, 31.0, 26.0, 38.0, 44.0, 33.0, 46.0, 52.0, 52.0, 52.0, 1068.0, 46.0, 53.0, 42.0, 43.0, 27.0, 36.0, 35.0, 40.0, 28.0, 21.0, 19.0, 17.0, 19.0, 10.0, 9.0, 11.0, 3.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.77734375, -1.727081298828125, -1.67681884765625, -1.626556396484375, -1.5762939453125, -1.526031494140625, -1.47576904296875, -1.425506591796875, -1.375244140625, -1.324981689453125, -1.27471923828125, -1.224456787109375, -1.1741943359375, -1.123931884765625, -1.07366943359375, -1.023406982421875, -0.97314453125, -0.922882080078125, -0.87261962890625, -0.822357177734375, -0.7720947265625, -0.721832275390625, -0.67156982421875, -0.621307373046875, -0.571044921875, -0.520782470703125, -0.47052001953125, -0.420257568359375, -0.3699951171875, -0.319732666015625, -0.26947021484375, -0.219207763671875, -0.1689453125, -0.118682861328125, -0.06842041015625, -0.018157958984375, 0.0321044921875, 0.082366943359375, 0.13262939453125, 0.182891845703125, 0.233154296875, 0.283416748046875, 0.33367919921875, 0.383941650390625, 0.4342041015625, 0.484466552734375, 0.53472900390625, 0.584991455078125, 0.63525390625, 0.685516357421875, 0.73577880859375, 0.786041259765625, 0.8363037109375, 0.886566162109375, 0.93682861328125, 0.987091064453125, 1.037353515625, 1.087615966796875, 1.13787841796875, 1.188140869140625, 1.2384033203125, 1.288665771484375, 1.33892822265625, 1.389190673828125, 1.439453125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 7.0, 16.0, 12.0, 14.0, 27.0, 53.0, 85.0, 93.0, 164.0, 262.0, 428.0, 677.0, 1084.0, 1773.0, 2976.0, 4931.0, 8603.0, 14747.0, 26485.0, 47523.0, 90889.0, 219700.0, 1392243.0, 136007.0, 65163.0, 35399.0, 19828.0, 11322.0, 6542.0, 3903.0, 2375.0, 1383.0, 881.0, 532.0, 341.0, 220.0, 153.0, 103.0, 62.0, 44.0, 31.0, 16.0, 17.0, 4.0, 3.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00954437255859375, -0.009228944778442383, -0.008913516998291016, -0.008598089218139648, -0.008282661437988281, -0.007967233657836914, -0.007651805877685547, -0.00733637809753418, -0.0070209503173828125, -0.006705522537231445, -0.006390094757080078, -0.006074666976928711, -0.005759239196777344, -0.0054438114166259766, -0.005128383636474609, -0.004812955856323242, -0.004497528076171875, -0.004182100296020508, -0.0038666725158691406, -0.0035512447357177734, -0.0032358169555664062, -0.002920389175415039, -0.002604961395263672, -0.0022895336151123047, -0.0019741058349609375, -0.0016586780548095703, -0.0013432502746582031, -0.001027822494506836, -0.0007123947143554688, -0.00039696693420410156, -8.153915405273438e-05, 0.0002338886260986328, 0.00054931640625, 0.0008647441864013672, 0.0011801719665527344, 0.0014955997467041016, 0.0018110275268554688, 0.002126455307006836, 0.002441883087158203, 0.0027573108673095703, 0.0030727386474609375, 0.0033881664276123047, 0.003703594207763672, 0.004019021987915039, 0.004334449768066406, 0.0046498775482177734, 0.004965305328369141, 0.005280733108520508, 0.005596160888671875, 0.005911588668823242, 0.006227016448974609, 0.0065424442291259766, 0.006857872009277344, 0.007173299789428711, 0.007488727569580078, 0.007804155349731445, 0.008119583129882812, 0.00843501091003418, 0.008750438690185547, 0.009065866470336914, 0.009381294250488281, 0.009696722030639648, 0.010012149810791016, 0.010327577590942383, 0.01064300537109375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 973.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 25.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 19.0, 1.0, 0.0, 10.0, 1.0, 11.0, 0.0, 2.0, 38.0, 55.0, 0.0, 331.0, 2405.0, 11960.0, 0.0, 1018940.0, 11984.0, 2299.0, 0.0, 360.0, 61.0, 38.0, 0.0, 7.0, 4.0, 4.0, 0.0, 5.0, 5.0, 15.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0], "bins": [-1.430511474609375e-06, -1.385807991027832e-06, -1.341104507446289e-06, -1.296401023864746e-06, -1.2516975402832031e-06, -1.2069940567016602e-06, -1.1622905731201172e-06, -1.1175870895385742e-06, -1.0728836059570312e-06, -1.0281801223754883e-06, -9.834766387939453e-07, -9.387731552124023e-07, -8.940696716308594e-07, -8.493661880493164e-07, -8.046627044677734e-07, -7.599592208862305e-07, -7.152557373046875e-07, -6.705522537231445e-07, -6.258487701416016e-07, -5.811452865600586e-07, -5.364418029785156e-07, -4.917383193969727e-07, -4.470348358154297e-07, -4.023313522338867e-07, -3.5762786865234375e-07, -3.129243850708008e-07, -2.682209014892578e-07, -2.2351741790771484e-07, -1.7881393432617188e-07, -1.341104507446289e-07, -8.940696716308594e-08, -4.470348358154297e-08, 0.0, 4.470348358154297e-08, 8.940696716308594e-08, 1.341104507446289e-07, 1.7881393432617188e-07, 2.2351741790771484e-07, 2.682209014892578e-07, 3.129243850708008e-07, 3.5762786865234375e-07, 4.023313522338867e-07, 4.470348358154297e-07, 4.917383193969727e-07, 5.364418029785156e-07, 5.811452865600586e-07, 6.258487701416016e-07, 6.705522537231445e-07, 7.152557373046875e-07, 7.599592208862305e-07, 8.046627044677734e-07, 8.493661880493164e-07, 8.940696716308594e-07, 9.387731552124023e-07, 9.834766387939453e-07, 1.0281801223754883e-06, 1.0728836059570312e-06, 1.1175870895385742e-06, 1.1622905731201172e-06, 1.2069940567016602e-06, 1.2516975402832031e-06, 1.296401023864746e-06, 1.341104507446289e-06, 1.385807991027832e-06, 1.430511474609375e-06]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 3.0, 2.0, 10.0, 8.0, 7.0, 11.0, 12.0, 16.0, 18.0, 19.0, 10.0, 31.0, 30.0, 24.0, 27.0, 44.0, 39.0, 48.0, 38.0, 21.0, 42.0, 42.0, 54.0, 49.0, 44.0, 37.0, 44.0, 35.0, 31.0, 42.0, 30.0, 24.0, 20.0, 15.0, 20.0, 13.0, 10.0, 6.0, 6.0, 7.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.150390625, -2.081634521484375, -2.01287841796875, -1.944122314453125, -1.8753662109375, -1.806610107421875, -1.73785400390625, -1.669097900390625, -1.600341796875, -1.531585693359375, -1.46282958984375, -1.394073486328125, -1.3253173828125, -1.256561279296875, -1.18780517578125, -1.119049072265625, -1.05029296875, -0.981536865234375, -0.91278076171875, -0.844024658203125, -0.7752685546875, -0.706512451171875, -0.63775634765625, -0.569000244140625, -0.500244140625, -0.431488037109375, -0.36273193359375, -0.293975830078125, -0.2252197265625, -0.156463623046875, -0.08770751953125, -0.018951416015625, 0.0498046875, 0.118560791015625, 0.18731689453125, 0.256072998046875, 0.3248291015625, 0.393585205078125, 0.46234130859375, 0.531097412109375, 0.599853515625, 0.668609619140625, 0.73736572265625, 0.806121826171875, 0.8748779296875, 0.943634033203125, 1.01239013671875, 1.081146240234375, 1.14990234375, 1.218658447265625, 1.28741455078125, 1.356170654296875, 1.4249267578125, 1.493682861328125, 1.56243896484375, 1.631195068359375, 1.699951171875, 1.768707275390625, 1.83746337890625, 1.906219482421875, 1.9749755859375, 2.043731689453125, 2.11248779296875, 2.181243896484375, 2.25]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 1.0, 7.0, 5.0, 2.0, 8.0, 11.0, 19.0, 22.0, 28.0, 36.0, 52.0, 77.0, 137.0, 198.0, 309.0, 460.0, 776.0, 1189.0, 1900.0, 2964.0, 4951.0, 8050.0, 13456.0, 22749.0, 40406.0, 93820.0, 431212.0, 270642.0, 70898.0, 34187.0, 19676.0, 11696.0, 7033.0, 4289.0, 2631.0, 1732.0, 1056.0, 627.0, 396.0, 288.0, 173.0, 123.0, 87.0, 52.0, 32.0, 27.0, 21.0, 12.0, 11.0, 8.0, 6.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.068359375, -2.0013427734375, -1.934326171875, -1.8673095703125, -1.80029296875, -1.7332763671875, -1.666259765625, -1.5992431640625, -1.5322265625, -1.4652099609375, -1.398193359375, -1.3311767578125, -1.26416015625, -1.1971435546875, -1.130126953125, -1.0631103515625, -0.99609375, -0.9290771484375, -0.862060546875, -0.7950439453125, -0.72802734375, -0.6610107421875, -0.593994140625, -0.5269775390625, -0.4599609375, -0.3929443359375, -0.325927734375, -0.2589111328125, -0.19189453125, -0.1248779296875, -0.057861328125, 0.0091552734375, 0.076171875, 0.1431884765625, 0.210205078125, 0.2772216796875, 0.34423828125, 0.4112548828125, 0.478271484375, 0.5452880859375, 0.6123046875, 0.6793212890625, 0.746337890625, 0.8133544921875, 0.88037109375, 0.9473876953125, 1.014404296875, 1.0814208984375, 1.1484375, 1.2154541015625, 1.282470703125, 1.3494873046875, 1.41650390625, 1.4835205078125, 1.550537109375, 1.6175537109375, 1.6845703125, 1.7515869140625, 1.818603515625, 1.8856201171875, 1.95263671875, 2.0196533203125, 2.086669921875, 2.1536865234375, 2.220703125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 4.0, 5.0, 6.0, 7.0, 14.0, 13.0, 21.0, 19.0, 22.0, 24.0, 30.0, 32.0, 38.0, 39.0, 61.0, 45.0, 77.0, 116.0, 334.0, 1529.0, 141.0, 80.0, 50.0, 43.0, 41.0, 37.0, 36.0, 26.0, 18.0, 21.0, 25.0, 18.0, 13.0, 12.0, 7.0, 8.0, 8.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.7578125, -7.5159912109375, -7.274169921875, -7.0323486328125, -6.79052734375, -6.5487060546875, -6.306884765625, -6.0650634765625, -5.8232421875, -5.5814208984375, -5.339599609375, -5.0977783203125, -4.85595703125, -4.6141357421875, -4.372314453125, -4.1304931640625, -3.888671875, -3.6468505859375, -3.405029296875, -3.1632080078125, -2.92138671875, -2.6795654296875, -2.437744140625, -2.1959228515625, -1.9541015625, -1.7122802734375, -1.470458984375, -1.2286376953125, -0.98681640625, -0.7449951171875, -0.503173828125, -0.2613525390625, -0.01953125, 0.2222900390625, 0.464111328125, 0.7059326171875, 0.94775390625, 1.1895751953125, 1.431396484375, 1.6732177734375, 1.9150390625, 2.1568603515625, 2.398681640625, 2.6405029296875, 2.88232421875, 3.1241455078125, 3.365966796875, 3.6077880859375, 3.849609375, 4.0914306640625, 4.333251953125, 4.5750732421875, 4.81689453125, 5.0587158203125, 5.300537109375, 5.5423583984375, 5.7841796875, 6.0260009765625, 6.267822265625, 6.5096435546875, 6.75146484375, 6.9932861328125, 7.235107421875, 7.4769287109375, 7.71875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 4.0, 6.0, 8.0, 6.0, 7.0, 5.0, 14.0, 16.0, 19.0, 27.0, 26.0, 38.0, 52.0, 59.0, 91.0, 150.0, 204.0, 321.0, 1000.0, 3881.0, 32593.0, 2440153.0, 641860.0, 20605.0, 2784.0, 776.0, 345.0, 186.0, 124.0, 82.0, 64.0, 53.0, 39.0, 11.0, 27.0, 23.0, 12.0, 11.0, 4.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.96875, -11.60498046875, -11.2412109375, -10.87744140625, -10.513671875, -10.14990234375, -9.7861328125, -9.42236328125, -9.05859375, -8.69482421875, -8.3310546875, -7.96728515625, -7.603515625, -7.23974609375, -6.8759765625, -6.51220703125, -6.1484375, -5.78466796875, -5.4208984375, -5.05712890625, -4.693359375, -4.32958984375, -3.9658203125, -3.60205078125, -3.23828125, -2.87451171875, -2.5107421875, -2.14697265625, -1.783203125, -1.41943359375, -1.0556640625, -0.69189453125, -0.328125, 0.03564453125, 0.3994140625, 0.76318359375, 1.126953125, 1.49072265625, 1.8544921875, 2.21826171875, 2.58203125, 2.94580078125, 3.3095703125, 3.67333984375, 4.037109375, 4.40087890625, 4.7646484375, 5.12841796875, 5.4921875, 5.85595703125, 6.2197265625, 6.58349609375, 6.947265625, 7.31103515625, 7.6748046875, 8.03857421875, 8.40234375, 8.76611328125, 9.1298828125, 9.49365234375, 9.857421875, 10.22119140625, 10.5849609375, 10.94873046875, 11.3125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 248.0, 686.0, 76.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.660686492919922, -23.813861846923828, -20.967037200927734, -18.12021255493164, -15.27338695526123, -12.426562309265137, -9.579736709594727, -6.732912063598633, -3.886087417602539, -1.0392625331878662, 1.8075623512268066, 4.654387474060059, 7.501212120056152, 10.348036766052246, 13.194862365722656, 16.04168701171875, 18.888511657714844, 21.735336303710938, 24.58216094970703, 27.428985595703125, 30.27581024169922, 33.12263488769531, 35.969459533691406, 38.8162841796875, 41.663108825683594, 44.50993347167969, 47.35675811767578, 50.203582763671875, 53.05040740966797, 55.89723205566406, 58.744056701660156, 61.59088134765625, 64.43770599365234, 67.28453063964844, 70.13135528564453, 72.97817993164062, 75.82500457763672, 78.67182922363281, 81.5186538696289, 84.365478515625, 87.2123031616211, 90.05912780761719, 92.90595245361328, 95.75277709960938, 98.59960174560547, 101.44642639160156, 104.29325103759766, 107.14007568359375, 109.98690795898438, 112.83373260498047, 115.68055725097656, 118.52738189697266, 121.37420654296875, 124.22103118896484, 127.06785583496094, 129.91468811035156, 132.76150512695312, 135.60833740234375, 138.4551544189453, 141.30198669433594, 144.1488037109375, 146.99563598632812, 149.8424530029297, 152.6892852783203, 155.53610229492188]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 5.0, 7.0, 11.0, 7.0, 7.0, 22.0, 19.0, 21.0, 23.0, 25.0, 26.0, 22.0, 29.0, 43.0, 40.0, 37.0, 36.0, 39.0, 36.0, 44.0, 48.0, 38.0, 31.0, 43.0, 37.0, 35.0, 39.0, 30.0, 28.0, 20.0, 24.0, 20.0, 20.0, 13.0, 14.0, 12.0, 9.0, 10.0, 11.0, 7.0, 4.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.083560943603516, -23.362991333007812, -22.64242172241211, -21.921852111816406, -21.201282501220703, -20.480712890625, -19.760143280029297, -19.03957176208496, -18.319002151489258, -17.598432540893555, -16.87786293029785, -16.15729331970215, -15.436722755432129, -14.716153144836426, -13.995583534240723, -13.275012969970703, -12.554444313049316, -11.833874702453613, -11.11330509185791, -10.39273452758789, -9.672164916992188, -8.951595306396484, -8.231025695800781, -7.51045560836792, -6.789885997772217, -6.069316387176514, -5.348746299743652, -4.628176689147949, -3.907606840133667, -3.1870369911193848, -2.4664673805236816, -1.7458972930908203, -1.0253276824951172, -0.30475789308547974, 0.4158118963241577, 1.1363816261291504, 1.8569514751434326, 2.577521324157715, 3.298090934753418, 4.018661022186279, 4.739230632781982, 5.4598002433776855, 6.180370330810547, 6.90093994140625, 7.621509552001953, 8.342079162597656, 9.06264877319336, 9.783219337463379, 10.503788948059082, 11.224358558654785, 11.944928169250488, 12.665498733520508, 13.386068344116211, 14.106637954711914, 14.827207565307617, 15.54777717590332, 16.268346786499023, 16.988916397094727, 17.70948600769043, 18.430055618286133, 19.150625228881836, 19.871196746826172, 20.591766357421875, 21.312335968017578, 22.03290557861328]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 3.0, 6.0, 4.0, 13.0, 3.0, 8.0, 12.0, 18.0, 17.0, 17.0, 21.0, 25.0, 33.0, 30.0, 33.0, 35.0, 34.0, 45.0, 42.0, 30.0, 37.0, 42.0, 57.0, 47.0, 45.0, 36.0, 41.0, 43.0, 33.0, 32.0, 30.0, 18.0, 25.0, 19.0, 17.0, 11.0, 10.0, 8.0, 2.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.283203125, -2.212066650390625, -2.14093017578125, -2.069793701171875, -1.9986572265625, -1.927520751953125, -1.85638427734375, -1.785247802734375, -1.714111328125, -1.642974853515625, -1.57183837890625, -1.500701904296875, -1.4295654296875, -1.358428955078125, -1.28729248046875, -1.216156005859375, -1.14501953125, -1.073883056640625, -1.00274658203125, -0.931610107421875, -0.8604736328125, -0.789337158203125, -0.71820068359375, -0.647064208984375, -0.575927734375, -0.504791259765625, -0.43365478515625, -0.362518310546875, -0.2913818359375, -0.220245361328125, -0.14910888671875, -0.077972412109375, -0.0068359375, 0.064300537109375, 0.13543701171875, 0.206573486328125, 0.2777099609375, 0.348846435546875, 0.41998291015625, 0.491119384765625, 0.562255859375, 0.633392333984375, 0.70452880859375, 0.775665283203125, 0.8468017578125, 0.917938232421875, 0.98907470703125, 1.060211181640625, 1.13134765625, 1.202484130859375, 1.27362060546875, 1.344757080078125, 1.4158935546875, 1.487030029296875, 1.55816650390625, 1.629302978515625, 1.700439453125, 1.771575927734375, 1.84271240234375, 1.913848876953125, 1.9849853515625, 2.056121826171875, 2.12725830078125, 2.198394775390625, 2.26953125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 6.0, 9.0, 10.0, 20.0, 25.0, 51.0, 58.0, 95.0, 133.0, 223.0, 349.0, 530.0, 916.0, 1589.0, 2732.0, 5107.0, 9536.0, 18982.0, 39965.0, 90610.0, 237036.0, 766115.0, 1652928.0, 900227.0, 277134.0, 101578.0, 44403.0, 20862.0, 10279.0, 5528.0, 3022.0, 1629.0, 952.0, 582.0, 364.0, 230.0, 167.0, 88.0, 74.0, 44.0, 29.0, 22.0, 13.0, 11.0, 9.0, 7.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.470703125, -3.3673095703125, -3.263916015625, -3.1605224609375, -3.05712890625, -2.9537353515625, -2.850341796875, -2.7469482421875, -2.6435546875, -2.5401611328125, -2.436767578125, -2.3333740234375, -2.22998046875, -2.1265869140625, -2.023193359375, -1.9197998046875, -1.81640625, -1.7130126953125, -1.609619140625, -1.5062255859375, -1.40283203125, -1.2994384765625, -1.196044921875, -1.0926513671875, -0.9892578125, -0.8858642578125, -0.782470703125, -0.6790771484375, -0.57568359375, -0.4722900390625, -0.368896484375, -0.2655029296875, -0.162109375, -0.0587158203125, 0.044677734375, 0.1480712890625, 0.25146484375, 0.3548583984375, 0.458251953125, 0.5616455078125, 0.6650390625, 0.7684326171875, 0.871826171875, 0.9752197265625, 1.07861328125, 1.1820068359375, 1.285400390625, 1.3887939453125, 1.4921875, 1.5955810546875, 1.698974609375, 1.8023681640625, 1.90576171875, 2.0091552734375, 2.112548828125, 2.2159423828125, 2.3193359375, 2.4227294921875, 2.526123046875, 2.6295166015625, 2.73291015625, 2.8363037109375, 2.939697265625, 3.0430908203125, 3.146484375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 6.0, 9.0, 12.0, 13.0, 16.0, 13.0, 19.0, 40.0, 44.0, 72.0, 82.0, 95.0, 141.0, 219.0, 283.0, 327.0, 401.0, 439.0, 431.0, 329.0, 256.0, 216.0, 162.0, 112.0, 103.0, 73.0, 49.0, 30.0, 20.0, 16.0, 13.0, 10.0, 5.0, 5.0, 0.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.12890625, -6.9437255859375, -6.758544921875, -6.5733642578125, -6.38818359375, -6.2030029296875, -6.017822265625, -5.8326416015625, -5.6474609375, -5.4622802734375, -5.277099609375, -5.0919189453125, -4.90673828125, -4.7215576171875, -4.536376953125, -4.3511962890625, -4.166015625, -3.9808349609375, -3.795654296875, -3.6104736328125, -3.42529296875, -3.2401123046875, -3.054931640625, -2.8697509765625, -2.6845703125, -2.4993896484375, -2.314208984375, -2.1290283203125, -1.94384765625, -1.7586669921875, -1.573486328125, -1.3883056640625, -1.203125, -1.0179443359375, -0.832763671875, -0.6475830078125, -0.46240234375, -0.2772216796875, -0.092041015625, 0.0931396484375, 0.2783203125, 0.4635009765625, 0.648681640625, 0.8338623046875, 1.01904296875, 1.2042236328125, 1.389404296875, 1.5745849609375, 1.759765625, 1.9449462890625, 2.130126953125, 2.3153076171875, 2.50048828125, 2.6856689453125, 2.870849609375, 3.0560302734375, 3.2412109375, 3.4263916015625, 3.611572265625, 3.7967529296875, 3.98193359375, 4.1671142578125, 4.352294921875, 4.5374755859375, 4.72265625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 8.0, 20.0, 33.0, 33.0, 50.0, 80.0, 124.0, 234.0, 368.0, 691.0, 1566.0, 4511.0, 16015.0, 76422.0, 503492.0, 2668388.0, 780589.0, 110327.0, 21601.0, 5801.0, 1995.0, 814.0, 428.0, 251.0, 139.0, 92.0, 62.0, 44.0, 26.0, 19.0, 14.0, 7.0, 11.0, 4.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3359375, -8.0103759765625, -7.684814453125, -7.3592529296875, -7.03369140625, -6.7081298828125, -6.382568359375, -6.0570068359375, -5.7314453125, -5.4058837890625, -5.080322265625, -4.7547607421875, -4.42919921875, -4.1036376953125, -3.778076171875, -3.4525146484375, -3.126953125, -2.8013916015625, -2.475830078125, -2.1502685546875, -1.82470703125, -1.4991455078125, -1.173583984375, -0.8480224609375, -0.5224609375, -0.1968994140625, 0.128662109375, 0.4542236328125, 0.77978515625, 1.1053466796875, 1.430908203125, 1.7564697265625, 2.08203125, 2.4075927734375, 2.733154296875, 3.0587158203125, 3.38427734375, 3.7098388671875, 4.035400390625, 4.3609619140625, 4.6865234375, 5.0120849609375, 5.337646484375, 5.6632080078125, 5.98876953125, 6.3143310546875, 6.639892578125, 6.9654541015625, 7.291015625, 7.6165771484375, 7.942138671875, 8.2677001953125, 8.59326171875, 8.9188232421875, 9.244384765625, 9.5699462890625, 9.8955078125, 10.2210693359375, 10.546630859375, 10.8721923828125, 11.19775390625, 11.5233154296875, 11.848876953125, 12.1744384765625, 12.5]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 9.0, 24.0, 37.0, 75.0, 111.0, 144.0, 173.0, 141.0, 122.0, 79.0, 58.0, 24.0, 10.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.887874603271484, -43.20592498779297, -41.52397537231445, -39.84202575683594, -38.16007995605469, -36.478126525878906, -34.796180725097656, -33.11423110961914, -31.432281494140625, -29.75033187866211, -28.068382263183594, -26.38643455505371, -24.704484939575195, -23.02253532409668, -21.340587615966797, -19.65863800048828, -17.976688385009766, -16.29473876953125, -14.61279010772705, -12.930841445922852, -11.248891830444336, -9.56694221496582, -7.884993553161621, -6.203044891357422, -4.521095275878906, -2.839146137237549, -1.1571969985961914, 0.524752140045166, 2.2067012786865234, 3.888650894165039, 5.570599555969238, 7.2525482177734375, 8.934494018554688, 10.616443634033203, 12.298392295837402, 13.980340957641602, 15.662290573120117, 17.344240188598633, 19.026187896728516, 20.70813751220703, 22.390087127685547, 24.072036743164062, 25.753986358642578, 27.43593406677246, 29.117883682250977, 30.799833297729492, 32.481781005859375, 34.16373062133789, 35.845680236816406, 37.52762985229492, 39.20957946777344, 40.89152908325195, 42.57347869873047, 44.25542449951172, 45.937374114990234, 47.61932373046875, 49.301273345947266, 50.98322296142578, 52.6651725769043, 54.34712219238281, 56.02906799316406, 57.711021423339844, 59.392967224121094, 61.07491683959961, 62.756866455078125]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 3.0, 9.0, 4.0, 8.0, 7.0, 9.0, 14.0, 11.0, 16.0, 23.0, 22.0, 27.0, 32.0, 30.0, 24.0, 31.0, 46.0, 36.0, 52.0, 35.0, 54.0, 38.0, 45.0, 41.0, 42.0, 33.0, 33.0, 26.0, 33.0, 29.0, 20.0, 21.0, 23.0, 24.0, 23.0, 17.0, 14.0, 10.0, 7.0, 7.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.47724151611328, -19.817333221435547, -19.15742301940918, -18.497514724731445, -17.837604522705078, -17.177696228027344, -16.517786026000977, -15.857877731323242, -15.197968482971191, -14.53805923461914, -13.87814998626709, -13.218240737915039, -12.558332443237305, -11.898422241210938, -11.238513946533203, -10.578604698181152, -9.918695449829102, -9.25878620147705, -8.598876953125, -7.938968181610107, -7.279058933258057, -6.619149684906006, -5.959240913391113, -5.2993316650390625, -4.639422416687012, -3.979513168334961, -3.3196041584014893, -2.6596951484680176, -1.9997859001159668, -1.339876651763916, -0.6799676418304443, -0.020058631896972656, 0.6398506164550781, 1.2997597455978394, 1.9596688747406006, 2.6195778846740723, 3.279487133026123, 3.939396381378174, 4.599305152893066, 5.259214401245117, 5.919123649597168, 6.579032897949219, 7.2389421463012695, 7.898850917816162, 8.558759689331055, 9.218669891357422, 9.878578186035156, 10.538487434387207, 11.198396682739258, 11.858305931091309, 12.51821517944336, 13.17812442779541, 13.838033676147461, 14.497941970825195, 15.157851219177246, 15.817760467529297, 16.47766876220703, 17.137577056884766, 17.797487258911133, 18.457395553588867, 19.117305755615234, 19.77721405029297, 20.437124252319336, 21.09703254699707, 21.756942749023438]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 6.0, 4.0, 7.0, 3.0, 6.0, 4.0, 11.0, 7.0, 16.0, 17.0, 15.0, 13.0, 16.0, 36.0, 30.0, 39.0, 28.0, 28.0, 34.0, 42.0, 39.0, 55.0, 38.0, 40.0, 50.0, 34.0, 45.0, 33.0, 39.0, 37.0, 19.0, 26.0, 32.0, 23.0, 20.0, 32.0, 18.0, 12.0, 11.0, 12.0, 9.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0078125, -1.939056396484375, -1.87030029296875, -1.801544189453125, -1.7327880859375, -1.664031982421875, -1.59527587890625, -1.526519775390625, -1.457763671875, -1.389007568359375, -1.32025146484375, -1.251495361328125, -1.1827392578125, -1.113983154296875, -1.04522705078125, -0.976470947265625, -0.90771484375, -0.838958740234375, -0.77020263671875, -0.701446533203125, -0.6326904296875, -0.563934326171875, -0.49517822265625, -0.426422119140625, -0.357666015625, -0.288909912109375, -0.22015380859375, -0.151397705078125, -0.0826416015625, -0.013885498046875, 0.05487060546875, 0.123626708984375, 0.1923828125, 0.261138916015625, 0.32989501953125, 0.398651123046875, 0.4674072265625, 0.536163330078125, 0.60491943359375, 0.673675537109375, 0.742431640625, 0.811187744140625, 0.87994384765625, 0.948699951171875, 1.0174560546875, 1.086212158203125, 1.15496826171875, 1.223724365234375, 1.29248046875, 1.361236572265625, 1.42999267578125, 1.498748779296875, 1.5675048828125, 1.636260986328125, 1.70501708984375, 1.773773193359375, 1.842529296875, 1.911285400390625, 1.98004150390625, 2.048797607421875, 2.1175537109375, 2.186309814453125, 2.25506591796875, 2.323822021484375, 2.392578125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 3.0, 14.0, 23.0, 26.0, 35.0, 74.0, 102.0, 169.0, 252.0, 375.0, 540.0, 780.0, 1087.0, 1770.0, 2730.0, 4116.0, 6308.0, 10217.0, 16300.0, 26546.0, 44655.0, 78352.0, 164455.0, 350468.0, 152501.0, 74824.0, 42920.0, 25356.0, 15864.0, 9933.0, 6132.0, 3985.0, 2572.0, 1700.0, 1046.0, 736.0, 492.0, 399.0, 243.0, 166.0, 106.0, 61.0, 31.0, 34.0, 19.0, 15.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.013885498046875, -0.01348257064819336, -0.013079643249511719, -0.012676715850830078, -0.012273788452148438, -0.011870861053466797, -0.011467933654785156, -0.011065006256103516, -0.010662078857421875, -0.010259151458740234, -0.009856224060058594, -0.009453296661376953, -0.009050369262695312, -0.008647441864013672, -0.008244514465332031, -0.00784158706665039, -0.00743865966796875, -0.007035732269287109, -0.006632804870605469, -0.006229877471923828, -0.0058269500732421875, -0.005424022674560547, -0.005021095275878906, -0.004618167877197266, -0.004215240478515625, -0.0038123130798339844, -0.0034093856811523438, -0.003006458282470703, -0.0026035308837890625, -0.002200603485107422, -0.0017976760864257812, -0.0013947486877441406, -0.0009918212890625, -0.0005888938903808594, -0.00018596649169921875, 0.00021696090698242188, 0.0006198883056640625, 0.0010228157043457031, 0.0014257431030273438, 0.0018286705017089844, 0.002231597900390625, 0.0026345252990722656, 0.0030374526977539062, 0.003440380096435547, 0.0038433074951171875, 0.004246234893798828, 0.004649162292480469, 0.005052089691162109, 0.00545501708984375, 0.005857944488525391, 0.006260871887207031, 0.006663799285888672, 0.0070667266845703125, 0.007469654083251953, 0.007872581481933594, 0.008275508880615234, 0.008678436279296875, 0.009081363677978516, 0.009484291076660156, 0.009887218475341797, 0.010290145874023438, 0.010693073272705078, 0.011096000671386719, 0.01149892807006836, 0.01190185546875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 5.0, 4.0, 5.0, 10.0, 11.0, 12.0, 15.0, 12.0, 22.0, 20.0, 22.0, 23.0, 29.0, 24.0, 31.0, 37.0, 35.0, 38.0, 30.0, 35.0, 49.0, 1077.0, 42.0, 39.0, 31.0, 32.0, 39.0, 28.0, 26.0, 19.0, 42.0, 37.0, 26.0, 24.0, 15.0, 11.0, 10.0, 13.0, 13.0, 8.0, 9.0, 8.0, 4.0, 2.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.341796875, -1.29779052734375, -1.2537841796875, -1.20977783203125, -1.165771484375, -1.12176513671875, -1.0777587890625, -1.03375244140625, -0.98974609375, -0.94573974609375, -0.9017333984375, -0.85772705078125, -0.813720703125, -0.76971435546875, -0.7257080078125, -0.68170166015625, -0.6376953125, -0.59368896484375, -0.5496826171875, -0.50567626953125, -0.461669921875, -0.41766357421875, -0.3736572265625, -0.32965087890625, -0.28564453125, -0.24163818359375, -0.1976318359375, -0.15362548828125, -0.109619140625, -0.06561279296875, -0.0216064453125, 0.02239990234375, 0.06640625, 0.11041259765625, 0.1544189453125, 0.19842529296875, 0.242431640625, 0.28643798828125, 0.3304443359375, 0.37445068359375, 0.41845703125, 0.46246337890625, 0.5064697265625, 0.55047607421875, 0.594482421875, 0.63848876953125, 0.6824951171875, 0.72650146484375, 0.7705078125, 0.81451416015625, 0.8585205078125, 0.90252685546875, 0.946533203125, 0.99053955078125, 1.0345458984375, 1.07855224609375, 1.12255859375, 1.16656494140625, 1.2105712890625, 1.25457763671875, 1.298583984375, 1.34259033203125, 1.3865966796875, 1.43060302734375, 1.474609375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 6.0, 3.0, 17.0, 26.0, 28.0, 56.0, 75.0, 107.0, 174.0, 282.0, 409.0, 565.0, 1001.0, 1426.0, 2142.0, 3343.0, 5138.0, 7950.0, 12644.0, 19920.0, 31359.0, 50583.0, 85013.0, 170741.0, 1352403.0, 148008.0, 76716.0, 46739.0, 28977.0, 18179.0, 11692.0, 7619.0, 4697.0, 3112.0, 2041.0, 1295.0, 913.0, 555.0, 401.0, 247.0, 179.0, 118.0, 77.0, 49.0, 25.0, 35.0, 22.0, 5.0, 11.0, 4.0, 5.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.00872802734375, -0.008466839790344238, -0.008205652236938477, -0.007944464683532715, -0.007683277130126953, -0.007422089576721191, -0.00716090202331543, -0.006899714469909668, -0.006638526916503906, -0.0063773393630981445, -0.006116151809692383, -0.005854964256286621, -0.005593776702880859, -0.005332589149475098, -0.005071401596069336, -0.004810214042663574, -0.0045490264892578125, -0.004287838935852051, -0.004026651382446289, -0.0037654638290405273, -0.0035042762756347656, -0.003243088722229004, -0.002981901168823242, -0.0027207136154174805, -0.0024595260620117188, -0.002198338508605957, -0.0019371509552001953, -0.0016759634017944336, -0.0014147758483886719, -0.0011535882949829102, -0.0008924007415771484, -0.0006312131881713867, -0.000370025634765625, -0.00010883808135986328, 0.00015234947204589844, 0.00041353702545166016, 0.0006747245788574219, 0.0009359121322631836, 0.0011970996856689453, 0.001458287239074707, 0.0017194747924804688, 0.0019806623458862305, 0.002241849899291992, 0.002503037452697754, 0.0027642250061035156, 0.0030254125595092773, 0.003286600112915039, 0.0035477876663208008, 0.0038089752197265625, 0.004070162773132324, 0.004331350326538086, 0.004592537879943848, 0.004853725433349609, 0.005114912986755371, 0.005376100540161133, 0.0056372880935668945, 0.005898475646972656, 0.006159663200378418, 0.00642085075378418, 0.006682038307189941, 0.006943225860595703, 0.007204413414001465, 0.0074656009674072266, 0.007726788520812988, 0.00798797607421875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 968.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.0], "bins": [-1.1920928955078125e-07, -1.1641532182693481e-07, -1.1362135410308838e-07, -1.1082738637924194e-07, -1.0803341865539551e-07, -1.0523945093154907e-07, -1.0244548320770264e-07, -9.96515154838562e-08, -9.685754776000977e-08, -9.406358003616333e-08, -9.12696123123169e-08, -8.847564458847046e-08, -8.568167686462402e-08, -8.288770914077759e-08, -8.009374141693115e-08, -7.729977369308472e-08, -7.450580596923828e-08, -7.171183824539185e-08, -6.891787052154541e-08, -6.612390279769897e-08, -6.332993507385254e-08, -6.05359673500061e-08, -5.774199962615967e-08, -5.494803190231323e-08, -5.21540641784668e-08, -4.936009645462036e-08, -4.6566128730773926e-08, -4.377216100692749e-08, -4.0978193283081055e-08, -3.818422555923462e-08, -3.5390257835388184e-08, -3.259629011154175e-08, -2.9802322387695312e-08, -2.7008354663848877e-08, -2.421438694000244e-08, -2.1420419216156006e-08, -1.862645149230957e-08, -1.5832483768463135e-08, -1.30385160446167e-08, -1.0244548320770264e-08, -7.450580596923828e-09, -4.6566128730773926e-09, -1.862645149230957e-09, 9.313225746154785e-10, 3.725290298461914e-09, 6.51925802230835e-09, 9.313225746154785e-09, 1.210719347000122e-08, 1.4901161193847656e-08, 1.7695128917694092e-08, 2.0489096641540527e-08, 2.3283064365386963e-08, 2.60770320892334e-08, 2.8870999813079834e-08, 3.166496753692627e-08, 3.4458935260772705e-08, 3.725290298461914e-08, 4.0046870708465576e-08, 4.284083843231201e-08, 4.563480615615845e-08, 4.842877388000488e-08, 5.122274160385132e-08, 5.4016709327697754e-08, 5.681067705154419e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 17.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 7.0, 0.0, 46.0, 52.0, 0.0, 256.0, 2449.0, 0.0, 13420.0, 0.0, 1015763.0, 13756.0, 0.0, 2366.0, 274.0, 0.0, 63.0, 30.0, 0.0, 13.0, 0.0, 7.0, 2.0, 0.0, 0.0, 5.0, 0.0, 11.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0728836059570312e-06, -1.0346993803977966e-06, -9.96515154838562e-07, -9.583309292793274e-07, -9.201467037200928e-07, -8.819624781608582e-07, -8.437782526016235e-07, -8.055940270423889e-07, -7.674098014831543e-07, -7.292255759239197e-07, -6.910413503646851e-07, -6.528571248054504e-07, -6.146728992462158e-07, -5.764886736869812e-07, -5.383044481277466e-07, -5.00120222568512e-07, -4.6193599700927734e-07, -4.237517714500427e-07, -3.855675458908081e-07, -3.473833203315735e-07, -3.0919909477233887e-07, -2.7101486921310425e-07, -2.3283064365386963e-07, -1.94646418094635e-07, -1.564621925354004e-07, -1.1827796697616577e-07, -8.009374141693115e-08, -4.190951585769653e-08, -3.725290298461914e-09, 3.4458935260772705e-08, 7.264316082000732e-08, 1.1082738637924194e-07, 1.4901161193847656e-07, 1.8719583749771118e-07, 2.253800630569458e-07, 2.635642886161804e-07, 3.0174851417541504e-07, 3.3993273973464966e-07, 3.781169652938843e-07, 4.163011908531189e-07, 4.544854164123535e-07, 4.926696419715881e-07, 5.308538675308228e-07, 5.690380930900574e-07, 6.07222318649292e-07, 6.454065442085266e-07, 6.835907697677612e-07, 7.217749953269958e-07, 7.599592208862305e-07, 7.981434464454651e-07, 8.363276720046997e-07, 8.745118975639343e-07, 9.126961231231689e-07, 9.508803486824036e-07, 9.890645742416382e-07, 1.0272487998008728e-06, 1.0654330253601074e-06, 1.103617250919342e-06, 1.1418014764785767e-06, 1.1799857020378113e-06, 1.218169927597046e-06, 1.2563541531562805e-06, 1.2945383787155151e-06, 1.3327226042747498e-06, 1.3709068298339844e-06]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 6.0, 4.0, 7.0, 3.0, 6.0, 4.0, 11.0, 7.0, 16.0, 17.0, 15.0, 13.0, 16.0, 36.0, 30.0, 39.0, 28.0, 28.0, 34.0, 42.0, 39.0, 55.0, 38.0, 40.0, 50.0, 34.0, 45.0, 33.0, 39.0, 37.0, 19.0, 26.0, 32.0, 23.0, 20.0, 32.0, 18.0, 12.0, 11.0, 12.0, 9.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0078125, -1.939056396484375, -1.87030029296875, -1.801544189453125, -1.7327880859375, -1.664031982421875, -1.59527587890625, -1.526519775390625, -1.457763671875, -1.389007568359375, -1.32025146484375, -1.251495361328125, -1.1827392578125, -1.113983154296875, -1.04522705078125, -0.976470947265625, -0.90771484375, -0.838958740234375, -0.77020263671875, -0.701446533203125, -0.6326904296875, -0.563934326171875, -0.49517822265625, -0.426422119140625, -0.357666015625, -0.288909912109375, -0.22015380859375, -0.151397705078125, -0.0826416015625, -0.013885498046875, 0.05487060546875, 0.123626708984375, 0.1923828125, 0.261138916015625, 0.32989501953125, 0.398651123046875, 0.4674072265625, 0.536163330078125, 0.60491943359375, 0.673675537109375, 0.742431640625, 0.811187744140625, 0.87994384765625, 0.948699951171875, 1.0174560546875, 1.086212158203125, 1.15496826171875, 1.223724365234375, 1.29248046875, 1.361236572265625, 1.42999267578125, 1.498748779296875, 1.5675048828125, 1.636260986328125, 1.70501708984375, 1.773773193359375, 1.842529296875, 1.911285400390625, 1.98004150390625, 2.048797607421875, 2.1175537109375, 2.186309814453125, 2.25506591796875, 2.323822021484375, 2.392578125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 7.0, 1.0, 10.0, 13.0, 16.0, 26.0, 39.0, 45.0, 73.0, 75.0, 132.0, 183.0, 257.0, 334.0, 515.0, 732.0, 974.0, 1458.0, 2066.0, 2930.0, 4293.0, 6124.0, 9236.0, 14218.0, 23583.0, 49575.0, 144409.0, 479019.0, 177936.0, 57383.0, 26492.0, 15290.0, 9802.0, 6509.0, 4459.0, 3121.0, 2158.0, 1416.0, 1018.0, 733.0, 553.0, 396.0, 265.0, 213.0, 137.0, 111.0, 81.0, 51.0, 32.0, 15.0, 22.0, 14.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-2.0078125, -1.9461822509765625, -1.884552001953125, -1.8229217529296875, -1.76129150390625, -1.6996612548828125, -1.638031005859375, -1.5764007568359375, -1.5147705078125, -1.4531402587890625, -1.391510009765625, -1.3298797607421875, -1.26824951171875, -1.2066192626953125, -1.144989013671875, -1.0833587646484375, -1.021728515625, -0.9600982666015625, -0.898468017578125, -0.8368377685546875, -0.77520751953125, -0.7135772705078125, -0.651947021484375, -0.5903167724609375, -0.5286865234375, -0.4670562744140625, -0.405426025390625, -0.3437957763671875, -0.28216552734375, -0.2205352783203125, -0.158905029296875, -0.0972747802734375, -0.03564453125, 0.0259857177734375, 0.087615966796875, 0.1492462158203125, 0.21087646484375, 0.2725067138671875, 0.334136962890625, 0.3957672119140625, 0.4573974609375, 0.5190277099609375, 0.580657958984375, 0.6422882080078125, 0.70391845703125, 0.7655487060546875, 0.827178955078125, 0.8888092041015625, 0.950439453125, 1.0120697021484375, 1.073699951171875, 1.1353302001953125, 1.19696044921875, 1.2585906982421875, 1.320220947265625, 1.3818511962890625, 1.4434814453125, 1.5051116943359375, 1.566741943359375, 1.6283721923828125, 1.69000244140625, 1.7516326904296875, 1.813262939453125, 1.8748931884765625, 1.9365234375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 6.0, 6.0, 8.0, 6.0, 13.0, 16.0, 14.0, 16.0, 31.0, 18.0, 36.0, 31.0, 32.0, 44.0, 48.0, 77.0, 75.0, 142.0, 1680.0, 243.0, 93.0, 60.0, 48.0, 47.0, 38.0, 31.0, 39.0, 29.0, 19.0, 21.0, 16.0, 17.0, 14.0, 4.0, 7.0, 7.0, 8.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25, -7.9720458984375, -7.694091796875, -7.4161376953125, -7.13818359375, -6.8602294921875, -6.582275390625, -6.3043212890625, -6.0263671875, -5.7484130859375, -5.470458984375, -5.1925048828125, -4.91455078125, -4.6365966796875, -4.358642578125, -4.0806884765625, -3.802734375, -3.5247802734375, -3.246826171875, -2.9688720703125, -2.69091796875, -2.4129638671875, -2.135009765625, -1.8570556640625, -1.5791015625, -1.3011474609375, -1.023193359375, -0.7452392578125, -0.46728515625, -0.1893310546875, 0.088623046875, 0.3665771484375, 0.64453125, 0.9224853515625, 1.200439453125, 1.4783935546875, 1.75634765625, 2.0343017578125, 2.312255859375, 2.5902099609375, 2.8681640625, 3.1461181640625, 3.424072265625, 3.7020263671875, 3.97998046875, 4.2579345703125, 4.535888671875, 4.8138427734375, 5.091796875, 5.3697509765625, 5.647705078125, 5.9256591796875, 6.20361328125, 6.4815673828125, 6.759521484375, 7.0374755859375, 7.3154296875, 7.5933837890625, 7.871337890625, 8.1492919921875, 8.42724609375, 8.7052001953125, 8.983154296875, 9.2611083984375, 9.5390625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 9.0, 7.0, 16.0, 21.0, 18.0, 27.0, 21.0, 39.0, 60.0, 67.0, 114.0, 162.0, 222.0, 400.0, 1986.0, 29673.0, 3009534.0, 97732.0, 4067.0, 610.0, 258.0, 181.0, 109.0, 88.0, 72.0, 50.0, 27.0, 29.0, 25.0, 16.0, 19.0, 8.0, 3.0, 8.0, 11.0, 2.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.8125, -17.2984619140625, -16.784423828125, -16.2703857421875, -15.75634765625, -15.2423095703125, -14.728271484375, -14.2142333984375, -13.7001953125, -13.1861572265625, -12.672119140625, -12.1580810546875, -11.64404296875, -11.1300048828125, -10.615966796875, -10.1019287109375, -9.587890625, -9.0738525390625, -8.559814453125, -8.0457763671875, -7.53173828125, -7.0177001953125, -6.503662109375, -5.9896240234375, -5.4755859375, -4.9615478515625, -4.447509765625, -3.9334716796875, -3.41943359375, -2.9053955078125, -2.391357421875, -1.8773193359375, -1.36328125, -0.8492431640625, -0.335205078125, 0.1788330078125, 0.69287109375, 1.2069091796875, 1.720947265625, 2.2349853515625, 2.7490234375, 3.2630615234375, 3.777099609375, 4.2911376953125, 4.80517578125, 5.3192138671875, 5.833251953125, 6.3472900390625, 6.861328125, 7.3753662109375, 7.889404296875, 8.4034423828125, 8.91748046875, 9.4315185546875, 9.945556640625, 10.4595947265625, 10.9736328125, 11.4876708984375, 12.001708984375, 12.5157470703125, 13.02978515625, 13.5438232421875, 14.057861328125, 14.5718994140625, 15.0859375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 169.0, 677.0, 163.0], "bins": [-141.75186157226562, -139.48297119140625, -137.21408081054688, -134.94520568847656, -132.6763153076172, -130.4074249267578, -128.13853454589844, -125.8696517944336, -123.60076141357422, -121.33187103271484, -119.06298828125, -116.79409790039062, -114.52521514892578, -112.2563247680664, -109.98744201660156, -107.71855163574219, -105.44966125488281, -103.18077087402344, -100.9118881225586, -98.64299774169922, -96.37411499023438, -94.105224609375, -91.83633422851562, -89.56745147705078, -87.29856872558594, -85.02967834472656, -82.76079559326172, -80.49190521240234, -78.2230224609375, -75.95413208007812, -73.68524169921875, -71.4163589477539, -69.14747619628906, -66.87858581542969, -64.60970306396484, -62.34081268310547, -60.07192611694336, -57.80303955078125, -55.53415298461914, -53.26526641845703, -50.996376037597656, -48.72748947143555, -46.45860290527344, -44.18971252441406, -41.92082595825195, -39.651939392089844, -37.383052825927734, -35.114166259765625, -32.84527587890625, -30.57638931274414, -28.3075008392334, -26.03861427307129, -23.769725799560547, -21.500839233398438, -19.231952667236328, -16.96306610107422, -14.694177627563477, -12.42529010772705, -10.156402587890625, -7.887516021728516, -5.61862850189209, -3.349740982055664, -1.0808544158935547, 1.188033103942871, 3.4569203853607178]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 5.0, 6.0, 7.0, 12.0, 18.0, 12.0, 20.0, 20.0, 18.0, 24.0, 26.0, 36.0, 30.0, 46.0, 46.0, 37.0, 34.0, 57.0, 59.0, 43.0, 35.0, 35.0, 41.0, 41.0, 31.0, 35.0, 25.0, 32.0, 26.0, 23.0, 20.0, 24.0, 17.0, 10.0, 12.0, 13.0, 6.0, 2.0, 4.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.954151153564453, -18.2750301361084, -17.595909118652344, -16.91678810119629, -16.237667083740234, -15.55854606628418, -14.879426002502441, -14.200304985046387, -13.521183967590332, -12.842062950134277, -12.162941932678223, -11.483821868896484, -10.80470085144043, -10.125579833984375, -9.44645881652832, -8.767337799072266, -8.088216781616211, -7.409095764160156, -6.729974746704102, -6.050854206085205, -5.37173318862915, -4.692612171173096, -4.013491630554199, -3.3343706130981445, -2.65524959564209, -1.9761286973953247, -1.2970077991485596, -0.617887020111084, 0.0612339973449707, 0.7403550148010254, 1.4194755554199219, 2.0985965728759766, 2.777719497680664, 3.4568405151367188, 4.135961532592773, 4.81508207321167, 5.494203090667725, 6.173324108123779, 6.852444648742676, 7.5315656661987305, 8.210686683654785, 8.88980770111084, 9.568928718566895, 10.248048782348633, 10.927169799804688, 11.606290817260742, 12.285411834716797, 12.964532852172852, 13.643653869628906, 14.322774887084961, 15.001895904541016, 15.68101692199707, 16.360137939453125, 17.03925895690918, 17.718379974365234, 18.397499084472656, 19.076622009277344, 19.7557430267334, 20.434864044189453, 21.113985061645508, 21.793106079101562, 22.472227096557617, 23.151348114013672, 23.830467224121094, 24.50958824157715]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 2.0, 4.0, 5.0, 5.0, 4.0, 5.0, 6.0, 12.0, 7.0, 13.0, 20.0, 15.0, 22.0, 17.0, 23.0, 32.0, 34.0, 41.0, 27.0, 38.0, 43.0, 36.0, 34.0, 40.0, 52.0, 47.0, 39.0, 36.0, 43.0, 27.0, 32.0, 29.0, 24.0, 23.0, 38.0, 27.0, 16.0, 14.0, 19.0, 12.0, 17.0, 4.0, 4.0, 1.0, 4.0, 6.0, 1.0, 0.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1015625, -2.031890869140625, -1.96221923828125, -1.892547607421875, -1.8228759765625, -1.753204345703125, -1.68353271484375, -1.613861083984375, -1.544189453125, -1.474517822265625, -1.40484619140625, -1.335174560546875, -1.2655029296875, -1.195831298828125, -1.12615966796875, -1.056488037109375, -0.98681640625, -0.917144775390625, -0.84747314453125, -0.777801513671875, -0.7081298828125, -0.638458251953125, -0.56878662109375, -0.499114990234375, -0.429443359375, -0.359771728515625, -0.29010009765625, -0.220428466796875, -0.1507568359375, -0.081085205078125, -0.01141357421875, 0.058258056640625, 0.1279296875, 0.197601318359375, 0.26727294921875, 0.336944580078125, 0.4066162109375, 0.476287841796875, 0.54595947265625, 0.615631103515625, 0.685302734375, 0.754974365234375, 0.82464599609375, 0.894317626953125, 0.9639892578125, 1.033660888671875, 1.10333251953125, 1.173004150390625, 1.24267578125, 1.312347412109375, 1.38201904296875, 1.451690673828125, 1.5213623046875, 1.591033935546875, 1.66070556640625, 1.730377197265625, 1.800048828125, 1.869720458984375, 1.93939208984375, 2.009063720703125, 2.0787353515625, 2.148406982421875, 2.21807861328125, 2.287750244140625, 2.357421875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 4.0, 6.0, 5.0, 4.0, 6.0, 6.0, 10.0, 12.0, 11.0, 13.0, 18.0, 27.0, 26.0, 47.0, 57.0, 79.0, 125.0, 208.0, 376.0, 916.0, 2376.0, 8033.0, 35723.0, 243525.0, 2494000.0, 1262897.0, 116641.0, 20618.0, 5201.0, 1707.0, 686.0, 331.0, 178.0, 104.0, 80.0, 50.0, 39.0, 27.0, 23.0, 28.0, 16.0, 9.0, 3.0, 4.0, 5.0, 6.0, 4.0, 7.0, 2.0, 2.0, 2.0, 0.0, 4.0, 5.0, 0.0, 1.0, 2.0], "bins": [-7.7734375, -7.5291748046875, -7.284912109375, -7.0406494140625, -6.79638671875, -6.5521240234375, -6.307861328125, -6.0635986328125, -5.8193359375, -5.5750732421875, -5.330810546875, -5.0865478515625, -4.84228515625, -4.5980224609375, -4.353759765625, -4.1094970703125, -3.865234375, -3.6209716796875, -3.376708984375, -3.1324462890625, -2.88818359375, -2.6439208984375, -2.399658203125, -2.1553955078125, -1.9111328125, -1.6668701171875, -1.422607421875, -1.1783447265625, -0.93408203125, -0.6898193359375, -0.445556640625, -0.2012939453125, 0.04296875, 0.2872314453125, 0.531494140625, 0.7757568359375, 1.02001953125, 1.2642822265625, 1.508544921875, 1.7528076171875, 1.9970703125, 2.2413330078125, 2.485595703125, 2.7298583984375, 2.97412109375, 3.2183837890625, 3.462646484375, 3.7069091796875, 3.951171875, 4.1954345703125, 4.439697265625, 4.6839599609375, 4.92822265625, 5.1724853515625, 5.416748046875, 5.6610107421875, 5.9052734375, 6.1495361328125, 6.393798828125, 6.6380615234375, 6.88232421875, 7.1265869140625, 7.370849609375, 7.6151123046875, 7.859375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 4.0, 11.0, 18.0, 22.0, 33.0, 33.0, 50.0, 65.0, 90.0, 129.0, 171.0, 193.0, 264.0, 333.0, 449.0, 440.0, 383.0, 310.0, 261.0, 196.0, 157.0, 129.0, 90.0, 67.0, 47.0, 23.0, 28.0, 14.0, 12.0, 14.0, 6.0, 11.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.64453125, -6.46661376953125, -6.2886962890625, -6.11077880859375, -5.932861328125, -5.75494384765625, -5.5770263671875, -5.39910888671875, -5.22119140625, -5.04327392578125, -4.8653564453125, -4.68743896484375, -4.509521484375, -4.33160400390625, -4.1536865234375, -3.97576904296875, -3.7978515625, -3.61993408203125, -3.4420166015625, -3.26409912109375, -3.086181640625, -2.90826416015625, -2.7303466796875, -2.55242919921875, -2.37451171875, -2.19659423828125, -2.0186767578125, -1.84075927734375, -1.662841796875, -1.48492431640625, -1.3070068359375, -1.12908935546875, -0.951171875, -0.77325439453125, -0.5953369140625, -0.41741943359375, -0.239501953125, -0.06158447265625, 0.1163330078125, 0.29425048828125, 0.47216796875, 0.65008544921875, 0.8280029296875, 1.00592041015625, 1.183837890625, 1.36175537109375, 1.5396728515625, 1.71759033203125, 1.8955078125, 2.07342529296875, 2.2513427734375, 2.42926025390625, 2.607177734375, 2.78509521484375, 2.9630126953125, 3.14093017578125, 3.31884765625, 3.49676513671875, 3.6746826171875, 3.85260009765625, 4.030517578125, 4.20843505859375, 4.3863525390625, 4.56427001953125, 4.7421875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 1.0, 4.0, 6.0, 8.0, 20.0, 23.0, 35.0, 44.0, 57.0, 77.0, 111.0, 193.0, 282.0, 535.0, 1139.0, 4270.0, 31896.0, 426599.0, 3224666.0, 463204.0, 33963.0, 4647.0, 1139.0, 495.0, 267.0, 185.0, 114.0, 88.0, 58.0, 39.0, 35.0, 23.0, 14.0, 7.0, 9.0, 9.0, 4.0, 2.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6328125, -11.1768798828125, -10.720947265625, -10.2650146484375, -9.80908203125, -9.3531494140625, -8.897216796875, -8.4412841796875, -7.9853515625, -7.5294189453125, -7.073486328125, -6.6175537109375, -6.16162109375, -5.7056884765625, -5.249755859375, -4.7938232421875, -4.337890625, -3.8819580078125, -3.426025390625, -2.9700927734375, -2.51416015625, -2.0582275390625, -1.602294921875, -1.1463623046875, -0.6904296875, -0.2344970703125, 0.221435546875, 0.6773681640625, 1.13330078125, 1.5892333984375, 2.045166015625, 2.5010986328125, 2.95703125, 3.4129638671875, 3.868896484375, 4.3248291015625, 4.78076171875, 5.2366943359375, 5.692626953125, 6.1485595703125, 6.6044921875, 7.0604248046875, 7.516357421875, 7.9722900390625, 8.42822265625, 8.8841552734375, 9.340087890625, 9.7960205078125, 10.251953125, 10.7078857421875, 11.163818359375, 11.6197509765625, 12.07568359375, 12.5316162109375, 12.987548828125, 13.4434814453125, 13.8994140625, 14.3553466796875, 14.811279296875, 15.2672119140625, 15.72314453125, 16.1790771484375, 16.635009765625, 17.0909423828125, 17.546875]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [4.0, 4.0, 15.0, 31.0, 57.0, 68.0, 132.0, 166.0, 149.0, 144.0, 112.0, 80.0, 34.0, 15.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.939248085021973, -12.229952812194824, -10.520657539367676, -8.811361312866211, -7.102066516876221, -5.392770767211914, -3.6834754943847656, -1.9741802215576172, -0.26488494873046875, 1.4444104433059692, 3.1537058353424072, 4.863001346588135, 6.572296619415283, 8.28159236907959, 9.990887641906738, 11.700182914733887, 13.409478187561035, 15.118773460388184, 16.82806968688965, 18.537364959716797, 20.246660232543945, 21.955955505371094, 23.665250778198242, 25.37454605102539, 27.08384132385254, 28.793136596679688, 30.502431869506836, 32.211727142333984, 33.921024322509766, 35.63031768798828, 37.33961486816406, 39.04890823364258, 40.75820541381836, 42.46750259399414, 44.176795959472656, 45.88609313964844, 47.59538650512695, 49.304683685302734, 51.01397705078125, 52.72327423095703, 54.43256759643555, 56.14186477661133, 57.851158142089844, 59.560455322265625, 61.26974868774414, 62.97904586791992, 64.68833923339844, 66.39763641357422, 68.10693359375, 69.81623077392578, 71.52552795410156, 73.23481750488281, 74.9441146850586, 76.65341186523438, 78.36270904541016, 80.0719985961914, 81.78129577636719, 83.49059295654297, 85.19989013671875, 86.9091796875, 88.61847686767578, 90.32777404785156, 92.03707122802734, 93.7463607788086, 95.45565795898438]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 4.0, 4.0, 6.0, 3.0, 11.0, 9.0, 9.0, 16.0, 15.0, 20.0, 14.0, 23.0, 22.0, 22.0, 32.0, 25.0, 30.0, 43.0, 35.0, 42.0, 41.0, 52.0, 39.0, 41.0, 35.0, 39.0, 40.0, 43.0, 43.0, 37.0, 33.0, 24.0, 32.0, 18.0, 20.0, 12.0, 12.0, 9.0, 7.0, 13.0, 6.0, 9.0, 5.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.55908966064453, -16.9721622467041, -16.38523292541504, -15.79830551147461, -15.211377143859863, -14.624448776245117, -14.037521362304688, -13.450592994689941, -12.863664627075195, -12.27673625946045, -11.689807891845703, -11.102880477905273, -10.515952110290527, -9.929023742675781, -9.342096328735352, -8.755167961120605, -8.16823959350586, -7.581311225891113, -6.994383335113525, -6.4074554443359375, -5.820527076721191, -5.233598709106445, -4.646670818328857, -4.0597429275512695, -3.4728145599365234, -2.8858864307403564, -2.2989583015441895, -1.7120301723480225, -1.1251020431518555, -0.5381739139556885, 0.048754215240478516, 0.6356821060180664, 1.2226104736328125, 1.8095386028289795, 2.3964667320251465, 2.9833948612213135, 3.5703229904174805, 4.157251358032227, 4.7441792488098145, 5.331107139587402, 5.918035507202148, 6.5049638748168945, 7.091891765594482, 7.67881965637207, 8.265748023986816, 8.852676391601562, 9.439603805541992, 10.026532173156738, 10.613460540771484, 11.20038890838623, 11.787317276000977, 12.374244689941406, 12.961173057556152, 13.548101425170898, 14.135028839111328, 14.721957206726074, 15.30888557434082, 15.895813941955566, 16.482742309570312, 17.069669723510742, 17.656597137451172, 18.243526458740234, 18.830453872680664, 19.417381286621094, 20.004310607910156]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 7.0, 3.0, 6.0, 8.0, 5.0, 13.0, 16.0, 12.0, 13.0, 18.0, 26.0, 17.0, 24.0, 37.0, 36.0, 28.0, 36.0, 42.0, 46.0, 44.0, 33.0, 46.0, 36.0, 30.0, 54.0, 34.0, 26.0, 29.0, 27.0, 27.0, 31.0, 30.0, 31.0, 27.0, 19.0, 17.0, 14.0, 10.0, 5.0, 9.0, 7.0, 2.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.12890625, -2.0594482421875, -1.989990234375, -1.9205322265625, -1.85107421875, -1.7816162109375, -1.712158203125, -1.6427001953125, -1.5732421875, -1.5037841796875, -1.434326171875, -1.3648681640625, -1.29541015625, -1.2259521484375, -1.156494140625, -1.0870361328125, -1.017578125, -0.9481201171875, -0.878662109375, -0.8092041015625, -0.73974609375, -0.6702880859375, -0.600830078125, -0.5313720703125, -0.4619140625, -0.3924560546875, -0.322998046875, -0.2535400390625, -0.18408203125, -0.1146240234375, -0.045166015625, 0.0242919921875, 0.09375, 0.1632080078125, 0.232666015625, 0.3021240234375, 0.37158203125, 0.4410400390625, 0.510498046875, 0.5799560546875, 0.6494140625, 0.7188720703125, 0.788330078125, 0.8577880859375, 0.92724609375, 0.9967041015625, 1.066162109375, 1.1356201171875, 1.205078125, 1.2745361328125, 1.343994140625, 1.4134521484375, 1.48291015625, 1.5523681640625, 1.621826171875, 1.6912841796875, 1.7607421875, 1.8302001953125, 1.899658203125, 1.9691162109375, 2.03857421875, 2.1080322265625, 2.177490234375, 2.2469482421875, 2.31640625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 8.0, 7.0, 10.0, 15.0, 27.0, 42.0, 51.0, 74.0, 124.0, 181.0, 227.0, 331.0, 482.0, 765.0, 1035.0, 1550.0, 2337.0, 3495.0, 5298.0, 8192.0, 12959.0, 20445.0, 33734.0, 55774.0, 98218.0, 214681.0, 287990.0, 124621.0, 67647.0, 39952.0, 24766.0, 15314.0, 9692.0, 6105.0, 4094.0, 2632.0, 1801.0, 1182.0, 813.0, 569.0, 398.0, 306.0, 182.0, 133.0, 100.0, 61.0, 44.0, 32.0, 19.0, 15.0, 8.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0], "bins": [-0.01373291015625, -0.013319015502929688, -0.012905120849609375, -0.012491226196289062, -0.01207733154296875, -0.011663436889648438, -0.011249542236328125, -0.010835647583007812, -0.0104217529296875, -0.010007858276367188, -0.009593963623046875, -0.009180068969726562, -0.00876617431640625, -0.008352279663085938, -0.007938385009765625, -0.0075244903564453125, -0.007110595703125, -0.0066967010498046875, -0.006282806396484375, -0.0058689117431640625, -0.00545501708984375, -0.0050411224365234375, -0.004627227783203125, -0.0042133331298828125, -0.0037994384765625, -0.0033855438232421875, -0.002971649169921875, -0.0025577545166015625, -0.00214385986328125, -0.0017299652099609375, -0.001316070556640625, -0.0009021759033203125, -0.00048828125, -7.43865966796875e-05, 0.000339508056640625, 0.0007534027099609375, 0.00116729736328125, 0.0015811920166015625, 0.001995086669921875, 0.0024089813232421875, 0.0028228759765625, 0.0032367706298828125, 0.003650665283203125, 0.0040645599365234375, 0.00447845458984375, 0.0048923492431640625, 0.005306243896484375, 0.0057201385498046875, 0.006134033203125, 0.0065479278564453125, 0.006961822509765625, 0.0073757171630859375, 0.00778961181640625, 0.008203506469726562, 0.008617401123046875, 0.009031295776367188, 0.0094451904296875, 0.009859085083007812, 0.010272979736328125, 0.010686874389648438, 0.01110076904296875, 0.011514663696289062, 0.011928558349609375, 0.012342453002929688, 0.01275634765625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 8.0, 3.0, 9.0, 11.0, 15.0, 14.0, 17.0, 16.0, 25.0, 15.0, 28.0, 34.0, 29.0, 40.0, 35.0, 32.0, 51.0, 45.0, 32.0, 1084.0, 34.0, 56.0, 39.0, 34.0, 41.0, 41.0, 22.0, 32.0, 29.0, 24.0, 22.0, 20.0, 17.0, 18.0, 9.0, 6.0, 12.0, 10.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.7880859375, -1.734893798828125, -1.68170166015625, -1.628509521484375, -1.5753173828125, -1.522125244140625, -1.46893310546875, -1.415740966796875, -1.362548828125, -1.309356689453125, -1.25616455078125, -1.202972412109375, -1.1497802734375, -1.096588134765625, -1.04339599609375, -0.990203857421875, -0.93701171875, -0.883819580078125, -0.83062744140625, -0.777435302734375, -0.7242431640625, -0.671051025390625, -0.61785888671875, -0.564666748046875, -0.511474609375, -0.458282470703125, -0.40509033203125, -0.351898193359375, -0.2987060546875, -0.245513916015625, -0.19232177734375, -0.139129638671875, -0.0859375, -0.032745361328125, 0.02044677734375, 0.073638916015625, 0.1268310546875, 0.180023193359375, 0.23321533203125, 0.286407470703125, 0.339599609375, 0.392791748046875, 0.44598388671875, 0.499176025390625, 0.5523681640625, 0.605560302734375, 0.65875244140625, 0.711944580078125, 0.76513671875, 0.818328857421875, 0.87152099609375, 0.924713134765625, 0.9779052734375, 1.031097412109375, 1.08428955078125, 1.137481689453125, 1.190673828125, 1.243865966796875, 1.29705810546875, 1.350250244140625, 1.4034423828125, 1.456634521484375, 1.50982666015625, 1.563018798828125, 1.6162109375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 7.0, 4.0, 21.0, 26.0, 28.0, 34.0, 65.0, 113.0, 142.0, 229.0, 376.0, 487.0, 808.0, 1187.0, 1937.0, 2783.0, 4517.0, 7065.0, 11336.0, 18259.0, 30208.0, 50222.0, 89777.0, 196904.0, 1366546.0, 137272.0, 70230.0, 40862.0, 24502.0, 15113.0, 9392.0, 5832.0, 3859.0, 2439.0, 1500.0, 1057.0, 659.0, 408.0, 290.0, 210.0, 129.0, 94.0, 68.0, 45.0, 26.0, 25.0, 17.0, 9.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0096588134765625, -0.009340047836303711, -0.009021282196044922, -0.008702516555786133, -0.008383750915527344, -0.008064985275268555, -0.007746219635009766, -0.0074274539947509766, -0.0071086883544921875, -0.0067899227142333984, -0.006471157073974609, -0.00615239143371582, -0.005833625793457031, -0.005514860153198242, -0.005196094512939453, -0.004877328872680664, -0.004558563232421875, -0.004239797592163086, -0.003921031951904297, -0.003602266311645508, -0.0032835006713867188, -0.0029647350311279297, -0.0026459693908691406, -0.0023272037506103516, -0.0020084381103515625, -0.0016896724700927734, -0.0013709068298339844, -0.0010521411895751953, -0.0007333755493164062, -0.0004146099090576172, -9.584426879882812e-05, 0.00022292137145996094, 0.00054168701171875, 0.0008604526519775391, 0.0011792182922363281, 0.0014979839324951172, 0.0018167495727539062, 0.0021355152130126953, 0.0024542808532714844, 0.0027730464935302734, 0.0030918121337890625, 0.0034105777740478516, 0.0037293434143066406, 0.00404810905456543, 0.004366874694824219, 0.004685640335083008, 0.005004405975341797, 0.005323171615600586, 0.005641937255859375, 0.005960702896118164, 0.006279468536376953, 0.006598234176635742, 0.006916999816894531, 0.00723576545715332, 0.007554531097412109, 0.007873296737670898, 0.008192062377929688, 0.008510828018188477, 0.008829593658447266, 0.009148359298706055, 0.009467124938964844, 0.009785890579223633, 0.010104656219482422, 0.010423421859741211, 0.0107421875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [30.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 956.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 31.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 37.0, 31.0, 0.0, 40.0, 0.0, 267.0, 2896.0, 0.0, 16532.0, 0.0, 1008809.0, 16601.0, 0.0, 2915.0, 0.0, 238.0, 53.0, 0.0, 43.0, 0.0, 26.0, 3.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 20.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.1324882507324219e-06, -1.0961666703224182e-06, -1.0598450899124146e-06, -1.0235235095024109e-06, -9.872019290924072e-07, -9.508803486824036e-07, -9.145587682723999e-07, -8.782371878623962e-07, -8.419156074523926e-07, -8.055940270423889e-07, -7.692724466323853e-07, -7.329508662223816e-07, -6.966292858123779e-07, -6.603077054023743e-07, -6.239861249923706e-07, -5.876645445823669e-07, -5.513429641723633e-07, -5.150213837623596e-07, -4.78699803352356e-07, -4.423782229423523e-07, -4.0605664253234863e-07, -3.6973506212234497e-07, -3.334134817123413e-07, -2.9709190130233765e-07, -2.60770320892334e-07, -2.2444874048233032e-07, -1.8812716007232666e-07, -1.51805579662323e-07, -1.1548399925231934e-07, -7.916241884231567e-08, -4.284083843231201e-08, -6.51925802230835e-09, 2.9802322387695312e-08, 6.612390279769897e-08, 1.0244548320770264e-07, 1.387670636177063e-07, 1.7508864402770996e-07, 2.1141022443771362e-07, 2.477318048477173e-07, 2.8405338525772095e-07, 3.203749656677246e-07, 3.5669654607772827e-07, 3.9301812648773193e-07, 4.293397068977356e-07, 4.6566128730773926e-07, 5.019828677177429e-07, 5.383044481277466e-07, 5.746260285377502e-07, 6.109476089477539e-07, 6.472691893577576e-07, 6.835907697677612e-07, 7.199123501777649e-07, 7.562339305877686e-07, 7.925555109977722e-07, 8.288770914077759e-07, 8.651986718177795e-07, 9.015202522277832e-07, 9.378418326377869e-07, 9.741634130477905e-07, 1.0104849934577942e-06, 1.0468065738677979e-06, 1.0831281542778015e-06, 1.1194497346878052e-06, 1.1557713150978088e-06, 1.1920928955078125e-06]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 7.0, 3.0, 6.0, 8.0, 5.0, 13.0, 16.0, 12.0, 13.0, 18.0, 26.0, 17.0, 24.0, 37.0, 36.0, 28.0, 36.0, 42.0, 46.0, 44.0, 33.0, 46.0, 36.0, 30.0, 54.0, 34.0, 26.0, 29.0, 27.0, 27.0, 31.0, 30.0, 31.0, 27.0, 19.0, 17.0, 14.0, 10.0, 5.0, 9.0, 7.0, 2.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.12890625, -2.0594482421875, -1.989990234375, -1.9205322265625, -1.85107421875, -1.7816162109375, -1.712158203125, -1.6427001953125, -1.5732421875, -1.5037841796875, -1.434326171875, -1.3648681640625, -1.29541015625, -1.2259521484375, -1.156494140625, -1.0870361328125, -1.017578125, -0.9481201171875, -0.878662109375, -0.8092041015625, -0.73974609375, -0.6702880859375, -0.600830078125, -0.5313720703125, -0.4619140625, -0.3924560546875, -0.322998046875, -0.2535400390625, -0.18408203125, -0.1146240234375, -0.045166015625, 0.0242919921875, 0.09375, 0.1632080078125, 0.232666015625, 0.3021240234375, 0.37158203125, 0.4410400390625, 0.510498046875, 0.5799560546875, 0.6494140625, 0.7188720703125, 0.788330078125, 0.8577880859375, 0.92724609375, 0.9967041015625, 1.066162109375, 1.1356201171875, 1.205078125, 1.2745361328125, 1.343994140625, 1.4134521484375, 1.48291015625, 1.5523681640625, 1.621826171875, 1.6912841796875, 1.7607421875, 1.8302001953125, 1.899658203125, 1.9691162109375, 2.03857421875, 2.1080322265625, 2.177490234375, 2.2469482421875, 2.31640625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 18.0, 20.0, 12.0, 27.0, 31.0, 55.0, 87.0, 130.0, 240.0, 303.0, 494.0, 786.0, 1184.0, 1921.0, 2934.0, 4611.0, 7436.0, 11998.0, 18922.0, 30815.0, 52054.0, 143133.0, 483663.0, 150971.0, 53311.0, 30948.0, 19378.0, 12305.0, 7528.0, 4851.0, 3028.0, 1895.0, 1247.0, 817.0, 494.0, 298.0, 200.0, 149.0, 90.0, 54.0, 40.0, 31.0, 12.0, 8.0, 8.0, 5.0, 9.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.28515625, -2.21697998046875, -2.1488037109375, -2.08062744140625, -2.012451171875, -1.94427490234375, -1.8760986328125, -1.80792236328125, -1.73974609375, -1.67156982421875, -1.6033935546875, -1.53521728515625, -1.467041015625, -1.39886474609375, -1.3306884765625, -1.26251220703125, -1.1943359375, -1.12615966796875, -1.0579833984375, -0.98980712890625, -0.921630859375, -0.85345458984375, -0.7852783203125, -0.71710205078125, -0.64892578125, -0.58074951171875, -0.5125732421875, -0.44439697265625, -0.376220703125, -0.30804443359375, -0.2398681640625, -0.17169189453125, -0.103515625, -0.03533935546875, 0.0328369140625, 0.10101318359375, 0.169189453125, 0.23736572265625, 0.3055419921875, 0.37371826171875, 0.44189453125, 0.51007080078125, 0.5782470703125, 0.64642333984375, 0.714599609375, 0.78277587890625, 0.8509521484375, 0.91912841796875, 0.9873046875, 1.05548095703125, 1.1236572265625, 1.19183349609375, 1.260009765625, 1.32818603515625, 1.3963623046875, 1.46453857421875, 1.53271484375, 1.60089111328125, 1.6690673828125, 1.73724365234375, 1.805419921875, 1.87359619140625, 1.9417724609375, 2.00994873046875, 2.078125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 9.0, 6.0, 8.0, 8.0, 10.0, 10.0, 12.0, 20.0, 10.0, 15.0, 21.0, 35.0, 25.0, 39.0, 37.0, 32.0, 49.0, 77.0, 136.0, 1590.0, 310.0, 105.0, 58.0, 51.0, 42.0, 46.0, 32.0, 31.0, 32.0, 33.0, 20.0, 22.0, 27.0, 19.0, 8.0, 12.0, 11.0, 11.0, 8.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0], "bins": [-8.265625, -8.0140380859375, -7.762451171875, -7.5108642578125, -7.25927734375, -7.0076904296875, -6.756103515625, -6.5045166015625, -6.2529296875, -6.0013427734375, -5.749755859375, -5.4981689453125, -5.24658203125, -4.9949951171875, -4.743408203125, -4.4918212890625, -4.240234375, -3.9886474609375, -3.737060546875, -3.4854736328125, -3.23388671875, -2.9822998046875, -2.730712890625, -2.4791259765625, -2.2275390625, -1.9759521484375, -1.724365234375, -1.4727783203125, -1.22119140625, -0.9696044921875, -0.718017578125, -0.4664306640625, -0.21484375, 0.0367431640625, 0.288330078125, 0.5399169921875, 0.79150390625, 1.0430908203125, 1.294677734375, 1.5462646484375, 1.7978515625, 2.0494384765625, 2.301025390625, 2.5526123046875, 2.80419921875, 3.0557861328125, 3.307373046875, 3.5589599609375, 3.810546875, 4.0621337890625, 4.313720703125, 4.5653076171875, 4.81689453125, 5.0684814453125, 5.320068359375, 5.5716552734375, 5.8232421875, 6.0748291015625, 6.326416015625, 6.5780029296875, 6.82958984375, 7.0811767578125, 7.332763671875, 7.5843505859375, 7.8359375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 5.0, 7.0, 15.0, 14.0, 12.0, 20.0, 20.0, 24.0, 31.0, 46.0, 52.0, 90.0, 84.0, 118.0, 149.0, 212.0, 375.0, 1123.0, 7061.0, 98740.0, 2927814.0, 100267.0, 7219.0, 1049.0, 367.0, 197.0, 144.0, 110.0, 78.0, 66.0, 35.0, 28.0, 20.0, 22.0, 11.0, 18.0, 14.0, 8.0, 6.0, 7.0, 8.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.3359375, -12.91259765625, -12.4892578125, -12.06591796875, -11.642578125, -11.21923828125, -10.7958984375, -10.37255859375, -9.94921875, -9.52587890625, -9.1025390625, -8.67919921875, -8.255859375, -7.83251953125, -7.4091796875, -6.98583984375, -6.5625, -6.13916015625, -5.7158203125, -5.29248046875, -4.869140625, -4.44580078125, -4.0224609375, -3.59912109375, -3.17578125, -2.75244140625, -2.3291015625, -1.90576171875, -1.482421875, -1.05908203125, -0.6357421875, -0.21240234375, 0.2109375, 0.63427734375, 1.0576171875, 1.48095703125, 1.904296875, 2.32763671875, 2.7509765625, 3.17431640625, 3.59765625, 4.02099609375, 4.4443359375, 4.86767578125, 5.291015625, 5.71435546875, 6.1376953125, 6.56103515625, 6.984375, 7.40771484375, 7.8310546875, 8.25439453125, 8.677734375, 9.10107421875, 9.5244140625, 9.94775390625, 10.37109375, 10.79443359375, 11.2177734375, 11.64111328125, 12.064453125, 12.48779296875, 12.9111328125, 13.33447265625, 13.7578125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 9.0, 298.0, 656.0, 53.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.055992126464844, -13.795495986938477, -10.53499984741211, -7.274503707885742, -4.014007568359375, -0.7535114288330078, 2.5069847106933594, 5.767480850219727, 9.027976989746094, 12.288473129272461, 15.548969268798828, 18.809465408325195, 22.069961547851562, 25.33045768737793, 28.590953826904297, 31.851449966430664, 35.11194610595703, 38.37244415283203, 41.632938385009766, 44.8934326171875, 48.1539306640625, 51.4144287109375, 54.674922943115234, 57.93541717529297, 61.19591522216797, 64.45641326904297, 67.71690368652344, 70.97740173339844, 74.23789978027344, 77.49839782714844, 80.75889587402344, 84.0193862915039, 87.27987670898438, 90.54037475585938, 93.80087280273438, 97.06136322021484, 100.32186126708984, 103.58235931396484, 106.84284973144531, 110.10334777832031, 113.36384582519531, 116.62434387207031, 119.88484191894531, 123.14533233642578, 126.40583038330078, 129.66632080078125, 132.92681884765625, 136.18731689453125, 139.44781494140625, 142.70831298828125, 145.96881103515625, 149.22930908203125, 152.48980712890625, 155.7502899169922, 159.0107879638672, 162.2712860107422, 165.5317840576172, 168.7922821044922, 172.0527801513672, 175.3132781982422, 178.57376098632812, 181.83425903320312, 185.09475708007812, 188.35525512695312, 191.61575317382812]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 3.0, 7.0, 10.0, 5.0, 14.0, 13.0, 12.0, 6.0, 20.0, 16.0, 18.0, 22.0, 25.0, 31.0, 32.0, 38.0, 26.0, 36.0, 39.0, 34.0, 36.0, 37.0, 33.0, 43.0, 27.0, 54.0, 46.0, 26.0, 29.0, 32.0, 23.0, 29.0, 25.0, 24.0, 18.0, 13.0, 17.0, 14.0, 9.0, 10.0, 8.0, 12.0, 9.0, 2.0, 8.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-20.439821243286133, -19.773361206054688, -19.106901168823242, -18.440441131591797, -17.77398109436035, -17.107521057128906, -16.441062927246094, -15.774602890014648, -15.108142852783203, -14.441682815551758, -13.775222778320312, -13.108762741088867, -12.442303657531738, -11.775843620300293, -11.109383583068848, -10.442924499511719, -9.776463508605957, -9.110003471374512, -8.443543434143066, -7.777083873748779, -7.110624313354492, -6.444164276123047, -5.777704238891602, -5.1112446784973145, -4.444784641265869, -3.778324842453003, -3.1118650436401367, -2.4454050064086914, -1.7789452075958252, -1.112485408782959, -0.44602537155151367, 0.22043418884277344, 0.8868942260742188, 1.553354024887085, 2.219813823699951, 2.8862738609313965, 3.5527336597442627, 4.219193458557129, 4.885653495788574, 5.552113056182861, 6.218573093414307, 6.885033130645752, 7.551492691040039, 8.217952728271484, 8.88441276550293, 9.550872802734375, 10.21733283996582, 10.88379192352295, 11.550251960754395, 12.21671199798584, 12.883172035217285, 13.549631118774414, 14.21609115600586, 14.882551193237305, 15.54901123046875, 16.215471267700195, 16.88193130493164, 17.548391342163086, 18.21485137939453, 18.881311416625977, 19.547771453857422, 20.214229583740234, 20.880691528320312, 21.547149658203125, 22.21360969543457]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 9.0, 1.0, 2.0, 8.0, 7.0, 12.0, 12.0, 9.0, 14.0, 14.0, 20.0, 14.0, 21.0, 31.0, 40.0, 25.0, 44.0, 46.0, 35.0, 38.0, 45.0, 35.0, 39.0, 52.0, 46.0, 34.0, 29.0, 30.0, 27.0, 40.0, 22.0, 24.0, 35.0, 31.0, 25.0, 20.0, 11.0, 10.0, 8.0, 7.0, 5.0, 7.0, 2.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2421875, -2.168426513671875, -2.09466552734375, -2.020904541015625, -1.9471435546875, -1.873382568359375, -1.79962158203125, -1.725860595703125, -1.652099609375, -1.578338623046875, -1.50457763671875, -1.430816650390625, -1.3570556640625, -1.283294677734375, -1.20953369140625, -1.135772705078125, -1.06201171875, -0.988250732421875, -0.91448974609375, -0.840728759765625, -0.7669677734375, -0.693206787109375, -0.61944580078125, -0.545684814453125, -0.471923828125, -0.398162841796875, -0.32440185546875, -0.250640869140625, -0.1768798828125, -0.103118896484375, -0.02935791015625, 0.044403076171875, 0.1181640625, 0.191925048828125, 0.26568603515625, 0.339447021484375, 0.4132080078125, 0.486968994140625, 0.56072998046875, 0.634490966796875, 0.708251953125, 0.782012939453125, 0.85577392578125, 0.929534912109375, 1.0032958984375, 1.077056884765625, 1.15081787109375, 1.224578857421875, 1.29833984375, 1.372100830078125, 1.44586181640625, 1.519622802734375, 1.5933837890625, 1.667144775390625, 1.74090576171875, 1.814666748046875, 1.888427734375, 1.962188720703125, 2.03594970703125, 2.109710693359375, 2.1834716796875, 2.257232666015625, 2.33099365234375, 2.404754638671875, 2.478515625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 13.0, 7.0, 10.0, 14.0, 27.0, 27.0, 28.0, 48.0, 76.0, 102.0, 145.0, 170.0, 293.0, 436.0, 640.0, 1041.0, 1895.0, 3543.0, 7088.0, 14999.0, 35893.0, 95645.0, 300903.0, 1018189.0, 1662454.0, 719415.0, 207287.0, 69938.0, 28182.0, 12243.0, 5864.0, 3076.0, 1707.0, 936.0, 622.0, 391.0, 246.0, 162.0, 136.0, 105.0, 79.0, 61.0, 33.0, 23.0, 29.0, 15.0, 15.0, 12.0, 6.0, 4.0, 2.0, 3.0, 5.0, 2.0, 0.0, 3.0], "bins": [-3.689453125, -3.575408935546875, -3.46136474609375, -3.347320556640625, -3.2332763671875, -3.119232177734375, -3.00518798828125, -2.891143798828125, -2.777099609375, -2.663055419921875, -2.54901123046875, -2.434967041015625, -2.3209228515625, -2.206878662109375, -2.09283447265625, -1.978790283203125, -1.86474609375, -1.750701904296875, -1.63665771484375, -1.522613525390625, -1.4085693359375, -1.294525146484375, -1.18048095703125, -1.066436767578125, -0.952392578125, -0.838348388671875, -0.72430419921875, -0.610260009765625, -0.4962158203125, -0.382171630859375, -0.26812744140625, -0.154083251953125, -0.0400390625, 0.074005126953125, 0.18804931640625, 0.302093505859375, 0.4161376953125, 0.530181884765625, 0.64422607421875, 0.758270263671875, 0.872314453125, 0.986358642578125, 1.10040283203125, 1.214447021484375, 1.3284912109375, 1.442535400390625, 1.55657958984375, 1.670623779296875, 1.78466796875, 1.898712158203125, 2.01275634765625, 2.126800537109375, 2.2408447265625, 2.354888916015625, 2.46893310546875, 2.582977294921875, 2.697021484375, 2.811065673828125, 2.92510986328125, 3.039154052734375, 3.1531982421875, 3.267242431640625, 3.38128662109375, 3.495330810546875, 3.609375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 4.0, 4.0, 10.0, 11.0, 16.0, 29.0, 34.0, 55.0, 68.0, 117.0, 138.0, 211.0, 245.0, 329.0, 402.0, 484.0, 454.0, 390.0, 278.0, 191.0, 159.0, 122.0, 93.0, 66.0, 48.0, 38.0, 19.0, 16.0, 14.0, 17.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.85546875, -7.66253662109375, -7.4696044921875, -7.27667236328125, -7.083740234375, -6.89080810546875, -6.6978759765625, -6.50494384765625, -6.31201171875, -6.11907958984375, -5.9261474609375, -5.73321533203125, -5.540283203125, -5.34735107421875, -5.1544189453125, -4.96148681640625, -4.7685546875, -4.57562255859375, -4.3826904296875, -4.18975830078125, -3.996826171875, -3.80389404296875, -3.6109619140625, -3.41802978515625, -3.22509765625, -3.03216552734375, -2.8392333984375, -2.64630126953125, -2.453369140625, -2.26043701171875, -2.0675048828125, -1.87457275390625, -1.681640625, -1.48870849609375, -1.2957763671875, -1.10284423828125, -0.909912109375, -0.71697998046875, -0.5240478515625, -0.33111572265625, -0.13818359375, 0.05474853515625, 0.2476806640625, 0.44061279296875, 0.633544921875, 0.82647705078125, 1.0194091796875, 1.21234130859375, 1.4052734375, 1.59820556640625, 1.7911376953125, 1.98406982421875, 2.177001953125, 2.36993408203125, 2.5628662109375, 2.75579833984375, 2.94873046875, 3.14166259765625, 3.3345947265625, 3.52752685546875, 3.720458984375, 3.91339111328125, 4.1063232421875, 4.29925537109375, 4.4921875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 5.0, 7.0, 16.0, 21.0, 24.0, 41.0, 48.0, 69.0, 101.0, 137.0, 205.0, 307.0, 596.0, 1388.0, 4978.0, 27048.0, 217859.0, 2204622.0, 1561977.0, 149146.0, 19373.0, 3782.0, 1142.0, 491.0, 282.0, 162.0, 133.0, 76.0, 53.0, 49.0, 46.0, 22.0, 20.0, 19.0, 17.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.4453125, -8.0921630859375, -7.739013671875, -7.3858642578125, -7.03271484375, -6.6795654296875, -6.326416015625, -5.9732666015625, -5.6201171875, -5.2669677734375, -4.913818359375, -4.5606689453125, -4.20751953125, -3.8543701171875, -3.501220703125, -3.1480712890625, -2.794921875, -2.4417724609375, -2.088623046875, -1.7354736328125, -1.38232421875, -1.0291748046875, -0.676025390625, -0.3228759765625, 0.0302734375, 0.3834228515625, 0.736572265625, 1.0897216796875, 1.44287109375, 1.7960205078125, 2.149169921875, 2.5023193359375, 2.85546875, 3.2086181640625, 3.561767578125, 3.9149169921875, 4.26806640625, 4.6212158203125, 4.974365234375, 5.3275146484375, 5.6806640625, 6.0338134765625, 6.386962890625, 6.7401123046875, 7.09326171875, 7.4464111328125, 7.799560546875, 8.1527099609375, 8.505859375, 8.8590087890625, 9.212158203125, 9.5653076171875, 9.91845703125, 10.2716064453125, 10.624755859375, 10.9779052734375, 11.3310546875, 11.6842041015625, 12.037353515625, 12.3905029296875, 12.74365234375, 13.0968017578125, 13.449951171875, 13.8031005859375, 14.15625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 8.0, 15.0, 22.0, 29.0, 45.0, 65.0, 91.0, 116.0, 115.0, 117.0, 110.0, 84.0, 59.0, 47.0, 23.0, 23.0, 14.0, 12.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.782926559448242, -17.738866806030273, -16.694808959960938, -15.650749206542969, -14.606689453125, -13.562630653381348, -12.518571853637695, -11.474512100219727, -10.430453300476074, -9.386394500732422, -8.342334747314453, -7.298275947570801, -6.25421667098999, -5.21015739440918, -4.166098594665527, -3.122039318084717, -2.0779800415039062, -1.0339208841323853, 0.010138273239135742, 1.0541973114013672, 2.0982565879821777, 3.1423158645629883, 4.186374664306641, 5.230433940887451, 6.274493217468262, 7.318552494049072, 8.362611770629883, 9.406670570373535, 10.450729370117188, 11.494789123535156, 12.538847923278809, 13.582906723022461, 14.626968383789062, 15.671027183532715, 16.715085983276367, 17.759145736694336, 18.803205490112305, 19.84726333618164, 20.89132308959961, 21.935382843017578, 22.979442596435547, 24.023502349853516, 25.06756019592285, 26.11161994934082, 27.15567970275879, 28.199737548828125, 29.243797302246094, 30.287857055664062, 31.3319149017334, 32.375972747802734, 33.4200325012207, 34.46409225463867, 35.50815200805664, 36.55221176147461, 37.59626770019531, 38.64032745361328, 39.68438720703125, 40.72844696044922, 41.77250671386719, 42.816566467285156, 43.86062240600586, 44.90468215942383, 45.9487419128418, 46.992801666259766, 48.036861419677734]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 2.0, 5.0, 13.0, 9.0, 12.0, 11.0, 18.0, 24.0, 16.0, 27.0, 36.0, 31.0, 24.0, 31.0, 39.0, 46.0, 30.0, 38.0, 43.0, 33.0, 45.0, 37.0, 44.0, 46.0, 48.0, 32.0, 26.0, 21.0, 32.0, 36.0, 25.0, 22.0, 16.0, 15.0, 21.0, 6.0, 12.0, 9.0, 2.0, 7.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.000259399414062, -17.39913558959961, -16.798011779785156, -16.196887969970703, -15.595763206481934, -14.99463939666748, -14.393514633178711, -13.792390823364258, -13.191267013549805, -12.590143203735352, -11.989019393920898, -11.387894630432129, -10.786770820617676, -10.185647010803223, -9.584522247314453, -8.9833984375, -8.382274627685547, -7.781150817871094, -7.180026531219482, -6.578902244567871, -5.977778434753418, -5.376654624938965, -4.7755303382873535, -4.174406051635742, -3.573282241821289, -2.972158193588257, -2.3710341453552246, -1.7699100971221924, -1.1687860488891602, -0.5676620006561279, 0.0334620475769043, 0.6345863342285156, 1.2357101440429688, 1.836834192276001, 2.437958240509033, 3.0390822887420654, 3.6402063369750977, 4.241330146789551, 4.842454433441162, 5.443578720092773, 6.044702529907227, 6.64582633972168, 7.246950626373291, 7.848074913024902, 8.449198722839355, 9.050322532653809, 9.651447296142578, 10.252571105957031, 10.853694915771484, 11.454818725585938, 12.05594253540039, 12.65706729888916, 13.258191108703613, 13.859314918518066, 14.460439682006836, 15.061563491821289, 15.662687301635742, 16.263811111450195, 16.86493492126465, 17.4660587310791, 18.067184448242188, 18.66830825805664, 19.269432067871094, 19.870555877685547, 20.4716796875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 8.0, 5.0, 4.0, 7.0, 10.0, 13.0, 13.0, 18.0, 15.0, 17.0, 25.0, 22.0, 34.0, 30.0, 31.0, 32.0, 41.0, 35.0, 41.0, 56.0, 40.0, 34.0, 33.0, 41.0, 32.0, 32.0, 40.0, 54.0, 34.0, 22.0, 30.0, 25.0, 21.0, 16.0, 14.0, 10.0, 12.0, 14.0, 7.0, 3.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.203125, -2.129730224609375, -2.05633544921875, -1.982940673828125, -1.9095458984375, -1.836151123046875, -1.76275634765625, -1.689361572265625, -1.615966796875, -1.542572021484375, -1.46917724609375, -1.395782470703125, -1.3223876953125, -1.248992919921875, -1.17559814453125, -1.102203369140625, -1.02880859375, -0.955413818359375, -0.88201904296875, -0.808624267578125, -0.7352294921875, -0.661834716796875, -0.58843994140625, -0.515045166015625, -0.441650390625, -0.368255615234375, -0.29486083984375, -0.221466064453125, -0.1480712890625, -0.074676513671875, -0.00128173828125, 0.072113037109375, 0.1455078125, 0.218902587890625, 0.29229736328125, 0.365692138671875, 0.4390869140625, 0.512481689453125, 0.58587646484375, 0.659271240234375, 0.732666015625, 0.806060791015625, 0.87945556640625, 0.952850341796875, 1.0262451171875, 1.099639892578125, 1.17303466796875, 1.246429443359375, 1.31982421875, 1.393218994140625, 1.46661376953125, 1.540008544921875, 1.6134033203125, 1.686798095703125, 1.76019287109375, 1.833587646484375, 1.906982421875, 1.980377197265625, 2.05377197265625, 2.127166748046875, 2.2005615234375, 2.273956298828125, 2.34735107421875, 2.420745849609375, 2.494140625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 7.0, 8.0, 10.0, 21.0, 29.0, 32.0, 47.0, 72.0, 99.0, 145.0, 201.0, 292.0, 449.0, 642.0, 864.0, 1263.0, 1921.0, 2811.0, 4269.0, 6446.0, 9772.0, 15363.0, 25099.0, 41179.0, 71033.0, 133263.0, 299428.0, 200992.0, 93079.0, 52826.0, 31603.0, 19371.0, 12199.0, 7903.0, 5144.0, 3338.0, 2278.0, 1577.0, 1050.0, 748.0, 517.0, 351.0, 245.0, 158.0, 132.0, 86.0, 59.0, 35.0, 34.0, 33.0, 17.0, 6.0, 7.0, 5.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.01372528076171875, -0.013306021690368652, -0.012886762619018555, -0.012467503547668457, -0.01204824447631836, -0.011628985404968262, -0.011209726333618164, -0.010790467262268066, -0.010371208190917969, -0.009951949119567871, -0.009532690048217773, -0.009113430976867676, -0.008694171905517578, -0.00827491283416748, -0.007855653762817383, -0.007436394691467285, -0.0070171356201171875, -0.00659787654876709, -0.006178617477416992, -0.0057593584060668945, -0.005340099334716797, -0.004920840263366699, -0.0045015811920166016, -0.004082322120666504, -0.0036630630493164062, -0.0032438039779663086, -0.002824544906616211, -0.0024052858352661133, -0.0019860267639160156, -0.001566767692565918, -0.0011475086212158203, -0.0007282495498657227, -0.000308990478515625, 0.00011026859283447266, 0.0005295276641845703, 0.000948786735534668, 0.0013680458068847656, 0.0017873048782348633, 0.002206563949584961, 0.0026258230209350586, 0.0030450820922851562, 0.003464341163635254, 0.0038836002349853516, 0.004302859306335449, 0.004722118377685547, 0.0051413774490356445, 0.005560636520385742, 0.00597989559173584, 0.0063991546630859375, 0.006818413734436035, 0.007237672805786133, 0.0076569318771362305, 0.008076190948486328, 0.008495450019836426, 0.008914709091186523, 0.009333968162536621, 0.009753227233886719, 0.010172486305236816, 0.010591745376586914, 0.011011004447937012, 0.01143026351928711, 0.011849522590637207, 0.012268781661987305, 0.012688040733337402, 0.0131072998046875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 7.0, 7.0, 8.0, 14.0, 6.0, 13.0, 24.0, 19.0, 28.0, 26.0, 37.0, 46.0, 29.0, 52.0, 43.0, 48.0, 43.0, 40.0, 1067.0, 57.0, 62.0, 49.0, 29.0, 48.0, 36.0, 42.0, 25.0, 24.0, 26.0, 23.0, 9.0, 9.0, 5.0, 7.0, 6.0, 5.0, 2.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.349609375, -2.2863922119140625, -2.223175048828125, -2.1599578857421875, -2.09674072265625, -2.0335235595703125, -1.970306396484375, -1.9070892333984375, -1.8438720703125, -1.7806549072265625, -1.717437744140625, -1.6542205810546875, -1.59100341796875, -1.5277862548828125, -1.464569091796875, -1.4013519287109375, -1.338134765625, -1.2749176025390625, -1.211700439453125, -1.1484832763671875, -1.08526611328125, -1.0220489501953125, -0.958831787109375, -0.8956146240234375, -0.8323974609375, -0.7691802978515625, -0.705963134765625, -0.6427459716796875, -0.57952880859375, -0.5163116455078125, -0.453094482421875, -0.3898773193359375, -0.32666015625, -0.2634429931640625, -0.200225830078125, -0.1370086669921875, -0.07379150390625, -0.0105743408203125, 0.052642822265625, 0.1158599853515625, 0.1790771484375, 0.2422943115234375, 0.305511474609375, 0.3687286376953125, 0.43194580078125, 0.4951629638671875, 0.558380126953125, 0.6215972900390625, 0.684814453125, 0.7480316162109375, 0.811248779296875, 0.8744659423828125, 0.93768310546875, 1.0009002685546875, 1.064117431640625, 1.1273345947265625, 1.1905517578125, 1.2537689208984375, 1.316986083984375, 1.3802032470703125, 1.44342041015625, 1.5066375732421875, 1.569854736328125, 1.6330718994140625, 1.6962890625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 12.0, 5.0, 8.0, 21.0, 31.0, 48.0, 78.0, 114.0, 190.0, 288.0, 501.0, 925.0, 1386.0, 2288.0, 4101.0, 7141.0, 13017.0, 24359.0, 46570.0, 94666.0, 236920.0, 1399201.0, 132488.0, 62600.0, 31684.0, 16980.0, 8980.0, 5310.0, 2879.0, 1698.0, 1015.0, 603.0, 398.0, 227.0, 121.0, 106.0, 75.0, 31.0, 18.0, 15.0, 10.0, 10.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01261138916015625, -0.012193918228149414, -0.011776447296142578, -0.011358976364135742, -0.010941505432128906, -0.01052403450012207, -0.010106563568115234, -0.009689092636108398, -0.009271621704101562, -0.008854150772094727, -0.00843667984008789, -0.008019208908081055, -0.007601737976074219, -0.007184267044067383, -0.006766796112060547, -0.006349325180053711, -0.005931854248046875, -0.005514383316040039, -0.005096912384033203, -0.004679441452026367, -0.004261970520019531, -0.0038444995880126953, -0.0034270286560058594, -0.0030095577239990234, -0.0025920867919921875, -0.0021746158599853516, -0.0017571449279785156, -0.0013396739959716797, -0.0009222030639648438, -0.0005047321319580078, -8.726119995117188e-05, 0.00033020973205566406, 0.0007476806640625, 0.001165151596069336, 0.0015826225280761719, 0.002000093460083008, 0.0024175643920898438, 0.0028350353240966797, 0.0032525062561035156, 0.0036699771881103516, 0.0040874481201171875, 0.0045049190521240234, 0.004922389984130859, 0.005339860916137695, 0.005757331848144531, 0.006174802780151367, 0.006592273712158203, 0.007009744644165039, 0.007427215576171875, 0.007844686508178711, 0.008262157440185547, 0.008679628372192383, 0.009097099304199219, 0.009514570236206055, 0.00993204116821289, 0.010349512100219727, 0.010766983032226562, 0.011184453964233398, 0.011601924896240234, 0.01201939582824707, 0.012436866760253906, 0.012854337692260742, 0.013271808624267578, 0.013689279556274414, 0.01410675048828125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 966.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 20.0, 37.0, 41.0, 216.0, 2361.0, 14002.0, 1015336.0, 13776.0, 2358.0, 244.0, 49.0, 25.0, 31.0, 4.0, 6.0, 0.0, 0.0, 0.0, 6.0, 19.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9073486328125e-06, -1.8477439880371094e-06, -1.7881393432617188e-06, -1.7285346984863281e-06, -1.6689300537109375e-06, -1.6093254089355469e-06, -1.5497207641601562e-06, -1.4901161193847656e-06, -1.430511474609375e-06, -1.3709068298339844e-06, -1.3113021850585938e-06, -1.2516975402832031e-06, -1.1920928955078125e-06, -1.1324882507324219e-06, -1.0728836059570312e-06, -1.0132789611816406e-06, -9.5367431640625e-07, -8.940696716308594e-07, -8.344650268554688e-07, -7.748603820800781e-07, -7.152557373046875e-07, -6.556510925292969e-07, -5.960464477539062e-07, -5.364418029785156e-07, -4.76837158203125e-07, -4.172325134277344e-07, -3.5762786865234375e-07, -2.980232238769531e-07, -2.384185791015625e-07, -1.7881393432617188e-07, -1.1920928955078125e-07, -5.960464477539063e-08, 0.0, 5.960464477539063e-08, 1.1920928955078125e-07, 1.7881393432617188e-07, 2.384185791015625e-07, 2.980232238769531e-07, 3.5762786865234375e-07, 4.172325134277344e-07, 4.76837158203125e-07, 5.364418029785156e-07, 5.960464477539062e-07, 6.556510925292969e-07, 7.152557373046875e-07, 7.748603820800781e-07, 8.344650268554688e-07, 8.940696716308594e-07, 9.5367431640625e-07, 1.0132789611816406e-06, 1.0728836059570312e-06, 1.1324882507324219e-06, 1.1920928955078125e-06, 1.2516975402832031e-06, 1.3113021850585938e-06, 1.3709068298339844e-06, 1.430511474609375e-06, 1.4901161193847656e-06, 1.5497207641601562e-06, 1.6093254089355469e-06, 1.6689300537109375e-06, 1.7285346984863281e-06, 1.7881393432617188e-06, 1.8477439880371094e-06, 1.9073486328125e-06]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 8.0, 5.0, 4.0, 7.0, 10.0, 13.0, 13.0, 18.0, 15.0, 17.0, 25.0, 22.0, 34.0, 30.0, 31.0, 32.0, 41.0, 35.0, 41.0, 56.0, 40.0, 34.0, 33.0, 41.0, 32.0, 32.0, 40.0, 54.0, 34.0, 22.0, 30.0, 25.0, 21.0, 16.0, 14.0, 10.0, 12.0, 14.0, 7.0, 3.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.203125, -2.129730224609375, -2.05633544921875, -1.982940673828125, -1.9095458984375, -1.836151123046875, -1.76275634765625, -1.689361572265625, -1.615966796875, -1.542572021484375, -1.46917724609375, -1.395782470703125, -1.3223876953125, -1.248992919921875, -1.17559814453125, -1.102203369140625, -1.02880859375, -0.955413818359375, -0.88201904296875, -0.808624267578125, -0.7352294921875, -0.661834716796875, -0.58843994140625, -0.515045166015625, -0.441650390625, -0.368255615234375, -0.29486083984375, -0.221466064453125, -0.1480712890625, -0.074676513671875, -0.00128173828125, 0.072113037109375, 0.1455078125, 0.218902587890625, 0.29229736328125, 0.365692138671875, 0.4390869140625, 0.512481689453125, 0.58587646484375, 0.659271240234375, 0.732666015625, 0.806060791015625, 0.87945556640625, 0.952850341796875, 1.0262451171875, 1.099639892578125, 1.17303466796875, 1.246429443359375, 1.31982421875, 1.393218994140625, 1.46661376953125, 1.540008544921875, 1.6134033203125, 1.686798095703125, 1.76019287109375, 1.833587646484375, 1.906982421875, 1.980377197265625, 2.05377197265625, 2.127166748046875, 2.2005615234375, 2.273956298828125, 2.34735107421875, 2.420745849609375, 2.494140625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 0.0, 6.0, 3.0, 4.0, 3.0, 6.0, 15.0, 15.0, 18.0, 25.0, 46.0, 74.0, 84.0, 139.0, 240.0, 352.0, 538.0, 914.0, 1537.0, 2352.0, 3868.0, 6669.0, 11958.0, 22260.0, 41288.0, 84156.0, 216426.0, 375748.0, 143304.0, 63424.0, 32331.0, 17277.0, 9651.0, 5430.0, 3156.0, 1956.0, 1185.0, 696.0, 476.0, 317.0, 206.0, 140.0, 86.0, 53.0, 40.0, 35.0, 14.0, 15.0, 8.0, 9.0, 2.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0625, -1.99444580078125, -1.9263916015625, -1.85833740234375, -1.790283203125, -1.72222900390625, -1.6541748046875, -1.58612060546875, -1.51806640625, -1.45001220703125, -1.3819580078125, -1.31390380859375, -1.245849609375, -1.17779541015625, -1.1097412109375, -1.04168701171875, -0.9736328125, -0.90557861328125, -0.8375244140625, -0.76947021484375, -0.701416015625, -0.63336181640625, -0.5653076171875, -0.49725341796875, -0.42919921875, -0.36114501953125, -0.2930908203125, -0.22503662109375, -0.156982421875, -0.08892822265625, -0.0208740234375, 0.04718017578125, 0.115234375, 0.18328857421875, 0.2513427734375, 0.31939697265625, 0.387451171875, 0.45550537109375, 0.5235595703125, 0.59161376953125, 0.65966796875, 0.72772216796875, 0.7957763671875, 0.86383056640625, 0.931884765625, 0.99993896484375, 1.0679931640625, 1.13604736328125, 1.2041015625, 1.27215576171875, 1.3402099609375, 1.40826416015625, 1.476318359375, 1.54437255859375, 1.6124267578125, 1.68048095703125, 1.74853515625, 1.81658935546875, 1.8846435546875, 1.95269775390625, 2.020751953125, 2.08880615234375, 2.1568603515625, 2.22491455078125, 2.29296875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 5.0, 10.0, 7.0, 8.0, 8.0, 12.0, 13.0, 16.0, 25.0, 29.0, 29.0, 34.0, 41.0, 57.0, 66.0, 66.0, 140.0, 345.0, 1529.0, 159.0, 89.0, 71.0, 37.0, 29.0, 44.0, 36.0, 22.0, 24.0, 17.0, 23.0, 15.0, 11.0, 13.0, 8.0, 1.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2421875, -9.902587890625, -9.56298828125, -9.223388671875, -8.8837890625, -8.544189453125, -8.20458984375, -7.864990234375, -7.525390625, -7.185791015625, -6.84619140625, -6.506591796875, -6.1669921875, -5.827392578125, -5.48779296875, -5.148193359375, -4.80859375, -4.468994140625, -4.12939453125, -3.789794921875, -3.4501953125, -3.110595703125, -2.77099609375, -2.431396484375, -2.091796875, -1.752197265625, -1.41259765625, -1.072998046875, -0.7333984375, -0.393798828125, -0.05419921875, 0.285400390625, 0.625, 0.964599609375, 1.30419921875, 1.643798828125, 1.9833984375, 2.322998046875, 2.66259765625, 3.002197265625, 3.341796875, 3.681396484375, 4.02099609375, 4.360595703125, 4.7001953125, 5.039794921875, 5.37939453125, 5.718994140625, 6.05859375, 6.398193359375, 6.73779296875, 7.077392578125, 7.4169921875, 7.756591796875, 8.09619140625, 8.435791015625, 8.775390625, 9.114990234375, 9.45458984375, 9.794189453125, 10.1337890625, 10.473388671875, 10.81298828125, 11.152587890625, 11.4921875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 0.0, 8.0, 8.0, 20.0, 13.0, 24.0, 31.0, 36.0, 48.0, 64.0, 90.0, 124.0, 160.0, 306.0, 732.0, 2912.0, 34336.0, 2993491.0, 106564.0, 4624.0, 1028.0, 382.0, 216.0, 133.0, 81.0, 63.0, 55.0, 38.0, 31.0, 21.0, 14.0, 9.0, 16.0, 12.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.78125, -22.141845703125, -21.50244140625, -20.863037109375, -20.2236328125, -19.584228515625, -18.94482421875, -18.305419921875, -17.666015625, -17.026611328125, -16.38720703125, -15.747802734375, -15.1083984375, -14.468994140625, -13.82958984375, -13.190185546875, -12.55078125, -11.911376953125, -11.27197265625, -10.632568359375, -9.9931640625, -9.353759765625, -8.71435546875, -8.074951171875, -7.435546875, -6.796142578125, -6.15673828125, -5.517333984375, -4.8779296875, -4.238525390625, -3.59912109375, -2.959716796875, -2.3203125, -1.680908203125, -1.04150390625, -0.402099609375, 0.2373046875, 0.876708984375, 1.51611328125, 2.155517578125, 2.794921875, 3.434326171875, 4.07373046875, 4.713134765625, 5.3525390625, 5.991943359375, 6.63134765625, 7.270751953125, 7.91015625, 8.549560546875, 9.18896484375, 9.828369140625, 10.4677734375, 11.107177734375, 11.74658203125, 12.385986328125, 13.025390625, 13.664794921875, 14.30419921875, 14.943603515625, 15.5830078125, 16.222412109375, 16.86181640625, 17.501220703125, 18.140625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 10.0, 627.0, 377.0, 4.0, 0.0, 2.0], "bins": [-321.0364990234375, -315.677001953125, -310.3175048828125, -304.9580383300781, -299.5985412597656, -294.2390441894531, -288.87957763671875, -283.52008056640625, -278.16058349609375, -272.80108642578125, -267.44158935546875, -262.0821228027344, -256.7226257324219, -251.36312866210938, -246.00364685058594, -240.6441650390625, -235.28466796875, -229.9251708984375, -224.56568908691406, -219.20620727539062, -213.84671020507812, -208.48721313476562, -203.1277313232422, -197.76824951171875, -192.40875244140625, -187.04925537109375, -181.6897735595703, -176.33029174804688, -170.97079467773438, -165.61129760742188, -160.25181579589844, -154.892333984375, -149.53282165527344, -144.17333984375, -138.8138427734375, -133.454345703125, -128.09486389160156, -122.7353744506836, -117.37588500976562, -112.01639556884766, -106.65690612792969, -101.29741668701172, -95.93792724609375, -90.57843780517578, -85.21894836425781, -79.85945892333984, -74.49996948242188, -69.1404800415039, -63.78099060058594, -58.42150115966797, -53.06201171875, -47.70252227783203, -42.34303283691406, -36.983543395996094, -31.624053955078125, -26.264564514160156, -20.905075073242188, -15.545585632324219, -10.18609619140625, -4.826606750488281, 0.5328826904296875, 5.892372131347656, 11.251861572265625, 16.611351013183594, 21.970840454101562]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 9.0, 5.0, 3.0, 4.0, 11.0, 11.0, 11.0, 15.0, 17.0, 20.0, 17.0, 32.0, 24.0, 23.0, 17.0, 30.0, 31.0, 35.0, 44.0, 48.0, 29.0, 52.0, 37.0, 30.0, 34.0, 27.0, 38.0, 29.0, 27.0, 20.0, 35.0, 32.0, 31.0, 21.0, 25.0, 23.0, 16.0, 9.0, 11.0, 17.0, 16.0, 4.0, 9.0, 6.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.73444366455078, -17.103490829467773, -16.4725399017334, -15.84158706665039, -15.210634231567383, -14.579682350158691, -13.94873046875, -13.317777633666992, -12.6868257522583, -12.05587387084961, -11.424921035766602, -10.79396915435791, -10.163017272949219, -9.532064437866211, -8.90111255645752, -8.270160675048828, -7.63920783996582, -7.008255481719971, -6.377303123474121, -5.74635124206543, -5.11539888381958, -4.4844465255737305, -3.85349440574646, -3.2225422859191895, -2.59158992767334, -1.9606376886367798, -1.3296854496002197, -0.6987332105636597, -0.06778097152709961, 0.56317138671875, 1.1941235065460205, 1.825075626373291, 2.4560279846191406, 3.0869803428649902, 3.7179324626922607, 4.348884582519531, 4.979836940765381, 5.6107892990112305, 6.241741180419922, 6.8726935386657715, 7.503645896911621, 8.134597778320312, 8.76555061340332, 9.396502494812012, 10.027454376220703, 10.658407211303711, 11.289359092712402, 11.920310974121094, 12.551263809204102, 13.182215690612793, 13.8131685256958, 14.444120407104492, 15.0750732421875, 15.706025123596191, 16.336977005004883, 16.96792984008789, 17.598880767822266, 18.229833602905273, 18.86078453063965, 19.491737365722656, 20.122690200805664, 20.753643035888672, 21.384593963623047, 22.015546798706055, 22.646499633789062]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 5.0, 8.0, 11.0, 11.0, 15.0, 14.0, 13.0, 24.0, 22.0, 24.0, 33.0, 24.0, 22.0, 40.0, 41.0, 38.0, 41.0, 40.0, 47.0, 45.0, 28.0, 40.0, 27.0, 33.0, 43.0, 37.0, 40.0, 28.0, 34.0, 25.0, 25.0, 14.0, 10.0, 14.0, 13.0, 6.0, 10.0, 7.0, 10.0, 3.0, 5.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-2.326171875, -2.251739501953125, -2.17730712890625, -2.102874755859375, -2.0284423828125, -1.954010009765625, -1.87957763671875, -1.805145263671875, -1.730712890625, -1.656280517578125, -1.58184814453125, -1.507415771484375, -1.4329833984375, -1.358551025390625, -1.28411865234375, -1.209686279296875, -1.13525390625, -1.060821533203125, -0.98638916015625, -0.911956787109375, -0.8375244140625, -0.763092041015625, -0.68865966796875, -0.614227294921875, -0.539794921875, -0.465362548828125, -0.39093017578125, -0.316497802734375, -0.2420654296875, -0.167633056640625, -0.09320068359375, -0.018768310546875, 0.0556640625, 0.130096435546875, 0.20452880859375, 0.278961181640625, 0.3533935546875, 0.427825927734375, 0.50225830078125, 0.576690673828125, 0.651123046875, 0.725555419921875, 0.79998779296875, 0.874420166015625, 0.9488525390625, 1.023284912109375, 1.09771728515625, 1.172149658203125, 1.24658203125, 1.321014404296875, 1.39544677734375, 1.469879150390625, 1.5443115234375, 1.618743896484375, 1.69317626953125, 1.767608642578125, 1.842041015625, 1.916473388671875, 1.99090576171875, 2.065338134765625, 2.1397705078125, 2.214202880859375, 2.28863525390625, 2.363067626953125, 2.4375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 2.0, 7.0, 2.0, 7.0, 4.0, 6.0, 8.0, 11.0, 18.0, 14.0, 15.0, 18.0, 17.0, 29.0, 29.0, 40.0, 72.0, 169.0, 398.0, 1247.0, 4859.0, 27133.0, 239721.0, 2587714.0, 1220465.0, 94314.0, 13456.0, 2941.0, 843.0, 301.0, 121.0, 73.0, 49.0, 28.0, 31.0, 23.0, 11.0, 14.0, 12.0, 9.0, 7.0, 5.0, 8.0, 7.0, 1.0, 9.0, 7.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.34375, -8.0728759765625, -7.802001953125, -7.5311279296875, -7.26025390625, -6.9893798828125, -6.718505859375, -6.4476318359375, -6.1767578125, -5.9058837890625, -5.635009765625, -5.3641357421875, -5.09326171875, -4.8223876953125, -4.551513671875, -4.2806396484375, -4.009765625, -3.7388916015625, -3.468017578125, -3.1971435546875, -2.92626953125, -2.6553955078125, -2.384521484375, -2.1136474609375, -1.8427734375, -1.5718994140625, -1.301025390625, -1.0301513671875, -0.75927734375, -0.4884033203125, -0.217529296875, 0.0533447265625, 0.32421875, 0.5950927734375, 0.865966796875, 1.1368408203125, 1.40771484375, 1.6785888671875, 1.949462890625, 2.2203369140625, 2.4912109375, 2.7620849609375, 3.032958984375, 3.3038330078125, 3.57470703125, 3.8455810546875, 4.116455078125, 4.3873291015625, 4.658203125, 4.9290771484375, 5.199951171875, 5.4708251953125, 5.74169921875, 6.0125732421875, 6.283447265625, 6.5543212890625, 6.8251953125, 7.0960693359375, 7.366943359375, 7.6378173828125, 7.90869140625, 8.1795654296875, 8.450439453125, 8.7213134765625, 8.9921875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 5.0, 9.0, 7.0, 9.0, 14.0, 20.0, 29.0, 34.0, 48.0, 54.0, 76.0, 87.0, 123.0, 140.0, 222.0, 227.0, 297.0, 357.0, 385.0, 388.0, 353.0, 282.0, 198.0, 156.0, 142.0, 96.0, 65.0, 67.0, 44.0, 36.0, 27.0, 23.0, 19.0, 7.0, 9.0, 6.0, 5.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.43359375, -4.27349853515625, -4.1134033203125, -3.95330810546875, -3.793212890625, -3.63311767578125, -3.4730224609375, -3.31292724609375, -3.15283203125, -2.99273681640625, -2.8326416015625, -2.67254638671875, -2.512451171875, -2.35235595703125, -2.1922607421875, -2.03216552734375, -1.8720703125, -1.71197509765625, -1.5518798828125, -1.39178466796875, -1.231689453125, -1.07159423828125, -0.9114990234375, -0.75140380859375, -0.59130859375, -0.43121337890625, -0.2711181640625, -0.11102294921875, 0.049072265625, 0.20916748046875, 0.3692626953125, 0.52935791015625, 0.689453125, 0.84954833984375, 1.0096435546875, 1.16973876953125, 1.329833984375, 1.48992919921875, 1.6500244140625, 1.81011962890625, 1.97021484375, 2.13031005859375, 2.2904052734375, 2.45050048828125, 2.610595703125, 2.77069091796875, 2.9307861328125, 3.09088134765625, 3.2509765625, 3.41107177734375, 3.5711669921875, 3.73126220703125, 3.891357421875, 4.05145263671875, 4.2115478515625, 4.37164306640625, 4.53173828125, 4.69183349609375, 4.8519287109375, 5.01202392578125, 5.172119140625, 5.33221435546875, 5.4923095703125, 5.65240478515625, 5.8125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 11.0, 13.0, 10.0, 14.0, 28.0, 31.0, 43.0, 50.0, 66.0, 79.0, 104.0, 134.0, 186.0, 339.0, 688.0, 2233.0, 12044.0, 92964.0, 964973.0, 2733939.0, 341190.0, 36965.0, 5396.0, 1285.0, 492.0, 283.0, 165.0, 131.0, 85.0, 81.0, 57.0, 55.0, 36.0, 29.0, 20.0, 17.0, 11.0, 12.0, 4.0, 2.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-12.421875, -12.06982421875, -11.7177734375, -11.36572265625, -11.013671875, -10.66162109375, -10.3095703125, -9.95751953125, -9.60546875, -9.25341796875, -8.9013671875, -8.54931640625, -8.197265625, -7.84521484375, -7.4931640625, -7.14111328125, -6.7890625, -6.43701171875, -6.0849609375, -5.73291015625, -5.380859375, -5.02880859375, -4.6767578125, -4.32470703125, -3.97265625, -3.62060546875, -3.2685546875, -2.91650390625, -2.564453125, -2.21240234375, -1.8603515625, -1.50830078125, -1.15625, -0.80419921875, -0.4521484375, -0.10009765625, 0.251953125, 0.60400390625, 0.9560546875, 1.30810546875, 1.66015625, 2.01220703125, 2.3642578125, 2.71630859375, 3.068359375, 3.42041015625, 3.7724609375, 4.12451171875, 4.4765625, 4.82861328125, 5.1806640625, 5.53271484375, 5.884765625, 6.23681640625, 6.5888671875, 6.94091796875, 7.29296875, 7.64501953125, 7.9970703125, 8.34912109375, 8.701171875, 9.05322265625, 9.4052734375, 9.75732421875, 10.109375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 15.0, 23.0, 26.0, 58.0, 74.0, 127.0, 104.0, 130.0, 133.0, 99.0, 79.0, 51.0, 43.0, 15.0, 11.0, 10.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.18479537963867, -31.056053161621094, -29.927310943603516, -28.798568725585938, -27.66982650756836, -26.54108428955078, -25.41234016418457, -24.283597946166992, -23.154855728149414, -22.026113510131836, -20.897371292114258, -19.76862907409668, -18.63988494873047, -17.51114273071289, -16.382400512695312, -15.253658294677734, -14.124916076660156, -12.996173858642578, -11.867431640625, -10.738688468933105, -9.609946250915527, -8.48120403289795, -7.352461338043213, -6.223718643188477, -5.094976425170898, -3.966233968734741, -2.837491512298584, -1.7087490558624268, -0.5800065994262695, 0.5487356185913086, 1.677478313446045, 2.8062210083007812, 3.9349594116210938, 5.063701629638672, 6.192444324493408, 7.3211870193481445, 8.449929237365723, 9.5786714553833, 10.707414627075195, 11.836156845092773, 12.964899063110352, 14.09364128112793, 15.222383499145508, 16.351125717163086, 17.479869842529297, 18.608612060546875, 19.737354278564453, 20.86609649658203, 21.99483871459961, 23.123580932617188, 24.252323150634766, 25.381065368652344, 26.509807586669922, 27.6385498046875, 28.76729393005371, 29.89603614807129, 31.024778366088867, 32.15352249145508, 33.282264709472656, 34.411006927490234, 35.53974914550781, 36.66849136352539, 37.79723358154297, 38.92597579956055, 40.054718017578125]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 1.0, 3.0, 5.0, 3.0, 13.0, 12.0, 14.0, 10.0, 11.0, 19.0, 24.0, 27.0, 25.0, 36.0, 27.0, 40.0, 34.0, 33.0, 41.0, 39.0, 37.0, 30.0, 43.0, 38.0, 38.0, 35.0, 40.0, 43.0, 36.0, 30.0, 27.0, 26.0, 30.0, 16.0, 16.0, 17.0, 16.0, 13.0, 8.0, 14.0, 6.0, 3.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-18.091873168945312, -17.55296516418457, -17.01405906677246, -16.47515106201172, -15.93624496459961, -15.397336959838867, -14.858429908752441, -14.319522857666016, -13.78061580657959, -13.241708755493164, -12.702801704406738, -12.163894653320312, -11.62498664855957, -11.086080551147461, -10.547172546386719, -10.008265495300293, -9.469358444213867, -8.930451393127441, -8.391544342041016, -7.852636814117432, -7.313729763031006, -6.77482271194458, -6.235915184020996, -5.69700813293457, -5.1581010818481445, -4.619194030761719, -4.080286979675293, -3.541379451751709, -3.002472400665283, -2.4635653495788574, -1.9246580600738525, -1.3857507705688477, -0.8468437194824219, -0.30793654918670654, 0.2309706211090088, 0.7698777914047241, 1.3087849617004395, 1.8476920127868652, 2.38659930229187, 2.925506591796875, 3.464413642883301, 4.003320693969727, 4.542227745056152, 5.081135272979736, 5.620042324066162, 6.158949375152588, 6.697856903076172, 7.236763954162598, 7.775671005249023, 8.31457805633545, 8.853485107421875, 9.3923921585083, 9.931299209594727, 10.470207214355469, 11.009114265441895, 11.54802131652832, 12.086928367614746, 12.625835418701172, 13.164742469787598, 13.703649520874023, 14.242557525634766, 14.781463623046875, 15.320371627807617, 15.859278678894043, 16.39818572998047]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 9.0, 3.0, 8.0, 6.0, 7.0, 20.0, 9.0, 13.0, 11.0, 14.0, 22.0, 32.0, 25.0, 29.0, 37.0, 32.0, 44.0, 39.0, 36.0, 35.0, 42.0, 44.0, 47.0, 23.0, 37.0, 51.0, 36.0, 34.0, 32.0, 34.0, 29.0, 27.0, 29.0, 14.0, 17.0, 9.0, 8.0, 11.0, 11.0, 3.0, 7.0, 7.0, 1.0, 6.0, 6.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.259765625, -2.1829833984375, -2.106201171875, -2.0294189453125, -1.95263671875, -1.8758544921875, -1.799072265625, -1.7222900390625, -1.6455078125, -1.5687255859375, -1.491943359375, -1.4151611328125, -1.33837890625, -1.2615966796875, -1.184814453125, -1.1080322265625, -1.03125, -0.9544677734375, -0.877685546875, -0.8009033203125, -0.72412109375, -0.6473388671875, -0.570556640625, -0.4937744140625, -0.4169921875, -0.3402099609375, -0.263427734375, -0.1866455078125, -0.10986328125, -0.0330810546875, 0.043701171875, 0.1204833984375, 0.197265625, 0.2740478515625, 0.350830078125, 0.4276123046875, 0.50439453125, 0.5811767578125, 0.657958984375, 0.7347412109375, 0.8115234375, 0.8883056640625, 0.965087890625, 1.0418701171875, 1.11865234375, 1.1954345703125, 1.272216796875, 1.3489990234375, 1.42578125, 1.5025634765625, 1.579345703125, 1.6561279296875, 1.73291015625, 1.8096923828125, 1.886474609375, 1.9632568359375, 2.0400390625, 2.1168212890625, 2.193603515625, 2.2703857421875, 2.34716796875, 2.4239501953125, 2.500732421875, 2.5775146484375, 2.654296875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 10.0, 17.0, 28.0, 44.0, 70.0, 118.0, 109.0, 249.0, 318.0, 496.0, 622.0, 987.0, 1427.0, 2087.0, 2895.0, 4329.0, 6298.0, 9639.0, 14505.0, 22587.0, 35080.0, 58273.0, 102190.0, 238475.0, 267166.0, 111061.0, 61827.0, 37558.0, 23536.0, 15233.0, 10006.0, 6838.0, 4536.0, 3048.0, 2172.0, 1522.0, 977.0, 735.0, 467.0, 365.0, 209.0, 148.0, 107.0, 75.0, 40.0, 24.0, 20.0, 18.0, 2.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0133819580078125, -0.012951135635375977, -0.012520313262939453, -0.01208949089050293, -0.011658668518066406, -0.011227846145629883, -0.01079702377319336, -0.010366201400756836, -0.009935379028320312, -0.009504556655883789, -0.009073734283447266, -0.008642911911010742, -0.008212089538574219, -0.007781267166137695, -0.007350444793701172, -0.0069196224212646484, -0.006488800048828125, -0.0060579776763916016, -0.005627155303955078, -0.005196332931518555, -0.004765510559082031, -0.004334688186645508, -0.0039038658142089844, -0.003473043441772461, -0.0030422210693359375, -0.002611398696899414, -0.0021805763244628906, -0.0017497539520263672, -0.0013189315795898438, -0.0008881092071533203, -0.0004572868347167969, -2.6464462280273438e-05, 0.00040435791015625, 0.0008351802825927734, 0.0012660026550292969, 0.0016968250274658203, 0.0021276473999023438, 0.002558469772338867, 0.0029892921447753906, 0.003420114517211914, 0.0038509368896484375, 0.004281759262084961, 0.004712581634521484, 0.005143404006958008, 0.005574226379394531, 0.006005048751831055, 0.006435871124267578, 0.0068666934967041016, 0.007297515869140625, 0.0077283382415771484, 0.008159160614013672, 0.008589982986450195, 0.009020805358886719, 0.009451627731323242, 0.009882450103759766, 0.010313272476196289, 0.010744094848632812, 0.011174917221069336, 0.01160573959350586, 0.012036561965942383, 0.012467384338378906, 0.01289820671081543, 0.013329029083251953, 0.013759851455688477, 0.014190673828125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 5.0, 3.0, 1.0, 6.0, 10.0, 19.0, 11.0, 15.0, 22.0, 21.0, 29.0, 23.0, 21.0, 20.0, 43.0, 42.0, 39.0, 30.0, 51.0, 37.0, 1074.0, 48.0, 40.0, 40.0, 32.0, 35.0, 42.0, 33.0, 27.0, 22.0, 33.0, 25.0, 12.0, 18.0, 14.0, 16.0, 8.0, 10.0, 10.0, 7.0, 8.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.6298828125, -1.5752716064453125, -1.520660400390625, -1.4660491943359375, -1.41143798828125, -1.3568267822265625, -1.302215576171875, -1.2476043701171875, -1.1929931640625, -1.1383819580078125, -1.083770751953125, -1.0291595458984375, -0.97454833984375, -0.9199371337890625, -0.865325927734375, -0.8107147216796875, -0.756103515625, -0.7014923095703125, -0.646881103515625, -0.5922698974609375, -0.53765869140625, -0.4830474853515625, -0.428436279296875, -0.3738250732421875, -0.3192138671875, -0.2646026611328125, -0.209991455078125, -0.1553802490234375, -0.10076904296875, -0.0461578369140625, 0.008453369140625, 0.0630645751953125, 0.11767578125, 0.1722869873046875, 0.226898193359375, 0.2815093994140625, 0.33612060546875, 0.3907318115234375, 0.445343017578125, 0.4999542236328125, 0.5545654296875, 0.6091766357421875, 0.663787841796875, 0.7183990478515625, 0.77301025390625, 0.8276214599609375, 0.882232666015625, 0.9368438720703125, 0.991455078125, 1.0460662841796875, 1.100677490234375, 1.1552886962890625, 1.20989990234375, 1.2645111083984375, 1.319122314453125, 1.3737335205078125, 1.4283447265625, 1.4829559326171875, 1.537567138671875, 1.5921783447265625, 1.64678955078125, 1.7014007568359375, 1.756011962890625, 1.8106231689453125, 1.865234375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 6.0, 19.0, 11.0, 23.0, 37.0, 58.0, 95.0, 107.0, 170.0, 234.0, 411.0, 540.0, 815.0, 1137.0, 1874.0, 2752.0, 4167.0, 6462.0, 9792.0, 15690.0, 25251.0, 41462.0, 70228.0, 136787.0, 1358509.0, 196746.0, 89160.0, 51036.0, 30451.0, 18864.0, 11964.0, 7690.0, 4768.0, 3256.0, 2150.0, 1410.0, 951.0, 644.0, 436.0, 315.0, 217.0, 143.0, 90.0, 62.0, 37.0, 40.0, 20.0, 13.0, 13.0, 6.0, 5.0, 1.0, 3.0, 5.0, 3.0], "bins": [-0.01119232177734375, -0.010860204696655273, -0.010528087615966797, -0.01019597053527832, -0.009863853454589844, -0.009531736373901367, -0.00919961929321289, -0.008867502212524414, -0.008535385131835938, -0.008203268051147461, -0.007871150970458984, -0.007539033889770508, -0.007206916809082031, -0.006874799728393555, -0.006542682647705078, -0.0062105655670166016, -0.005878448486328125, -0.0055463314056396484, -0.005214214324951172, -0.004882097244262695, -0.004549980163574219, -0.004217863082885742, -0.0038857460021972656, -0.003553628921508789, -0.0032215118408203125, -0.002889394760131836, -0.0025572776794433594, -0.002225160598754883, -0.0018930435180664062, -0.0015609264373779297, -0.0012288093566894531, -0.0008966922760009766, -0.0005645751953125, -0.00023245811462402344, 9.965896606445312e-05, 0.0004317760467529297, 0.0007638931274414062, 0.0010960102081298828, 0.0014281272888183594, 0.001760244369506836, 0.0020923614501953125, 0.002424478530883789, 0.0027565956115722656, 0.003088712692260742, 0.0034208297729492188, 0.0037529468536376953, 0.004085063934326172, 0.0044171810150146484, 0.004749298095703125, 0.0050814151763916016, 0.005413532257080078, 0.005745649337768555, 0.006077766418457031, 0.006409883499145508, 0.006742000579833984, 0.007074117660522461, 0.0074062347412109375, 0.007738351821899414, 0.00807046890258789, 0.008402585983276367, 0.008734703063964844, 0.00906682014465332, 0.009398937225341797, 0.009731054306030273, 0.01006317138671875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 916.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.0], "bins": [-1.1920928955078125e-07, -1.1641532182693481e-07, -1.1362135410308838e-07, -1.1082738637924194e-07, -1.0803341865539551e-07, -1.0523945093154907e-07, -1.0244548320770264e-07, -9.96515154838562e-08, -9.685754776000977e-08, -9.406358003616333e-08, -9.12696123123169e-08, -8.847564458847046e-08, -8.568167686462402e-08, -8.288770914077759e-08, -8.009374141693115e-08, -7.729977369308472e-08, -7.450580596923828e-08, -7.171183824539185e-08, -6.891787052154541e-08, -6.612390279769897e-08, -6.332993507385254e-08, -6.05359673500061e-08, -5.774199962615967e-08, -5.494803190231323e-08, -5.21540641784668e-08, -4.936009645462036e-08, -4.6566128730773926e-08, -4.377216100692749e-08, -4.0978193283081055e-08, -3.818422555923462e-08, -3.5390257835388184e-08, -3.259629011154175e-08, -2.9802322387695312e-08, -2.7008354663848877e-08, -2.421438694000244e-08, -2.1420419216156006e-08, -1.862645149230957e-08, -1.5832483768463135e-08, -1.30385160446167e-08, -1.0244548320770264e-08, -7.450580596923828e-09, -4.6566128730773926e-09, -1.862645149230957e-09, 9.313225746154785e-10, 3.725290298461914e-09, 6.51925802230835e-09, 9.313225746154785e-09, 1.210719347000122e-08, 1.4901161193847656e-08, 1.7695128917694092e-08, 2.0489096641540527e-08, 2.3283064365386963e-08, 2.60770320892334e-08, 2.8870999813079834e-08, 3.166496753692627e-08, 3.4458935260772705e-08, 3.725290298461914e-08, 4.0046870708465576e-08, 4.284083843231201e-08, 4.563480615615845e-08, 4.842877388000488e-08, 5.122274160385132e-08, 5.4016709327697754e-08, 5.681067705154419e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [19.0, 1.0, 0.0, 6.0, 0.0, 1.0, 0.0, 29.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 28.0, 38.0, 63.0, 76.0, 0.0, 357.0, 3578.0, 25980.0, 988220.0, 26051.0, 3515.0, 342.0, 86.0, 0.0, 54.0, 41.0, 35.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.0, 0.0, 3.0, 0.0, 6.0, 0.0, 1.0, 13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-06, -1.1390075087547302e-06, -1.085922122001648e-06, -1.0328367352485657e-06, -9.797513484954834e-07, -9.266659617424011e-07, -8.735805749893188e-07, -8.204951882362366e-07, -7.674098014831543e-07, -7.14324414730072e-07, -6.612390279769897e-07, -6.081536412239075e-07, -5.550682544708252e-07, -5.019828677177429e-07, -4.4889748096466064e-07, -3.9581209421157837e-07, -3.427267074584961e-07, -2.896413207054138e-07, -2.3655593395233154e-07, -1.8347054719924927e-07, -1.30385160446167e-07, -7.729977369308472e-08, -2.421438694000244e-08, 2.8870999813079834e-08, 8.195638656616211e-08, 1.3504177331924438e-07, 1.8812716007232666e-07, 2.4121254682540894e-07, 2.942979335784912e-07, 3.473833203315735e-07, 4.0046870708465576e-07, 4.5355409383773804e-07, 5.066394805908203e-07, 5.597248673439026e-07, 6.128102540969849e-07, 6.658956408500671e-07, 7.189810276031494e-07, 7.720664143562317e-07, 8.25151801109314e-07, 8.782371878623962e-07, 9.313225746154785e-07, 9.844079613685608e-07, 1.037493348121643e-06, 1.0905787348747253e-06, 1.1436641216278076e-06, 1.1967495083808899e-06, 1.2498348951339722e-06, 1.3029202818870544e-06, 1.3560056686401367e-06, 1.409091055393219e-06, 1.4621764421463013e-06, 1.5152618288993835e-06, 1.5683472156524658e-06, 1.621432602405548e-06, 1.6745179891586304e-06, 1.7276033759117126e-06, 1.780688762664795e-06, 1.8337741494178772e-06, 1.8868595361709595e-06, 1.9399449229240417e-06, 1.993030309677124e-06, 2.0461156964302063e-06, 2.0992010831832886e-06, 2.152286469936371e-06, 2.205371856689453e-06]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1023.0], "bins": [-2.4395898634566038e-08, -2.4014711996755977e-08, -2.3633527135302757e-08, -2.3252340497492696e-08, -2.2871155636039475e-08, -2.2489968998229415e-08, -2.2108782360419355e-08, -2.1727597498966134e-08, -2.1346410861156073e-08, -2.0965224223346013e-08, -2.0584039361892792e-08, -2.020285272408273e-08, -1.982166786262951e-08, -1.944048122481945e-08, -1.905929636336623e-08, -1.867810972555617e-08, -1.829692308774611e-08, -1.7915736449936048e-08, -1.7534551588482827e-08, -1.7153364950672767e-08, -1.6772180089219546e-08, -1.6390993451409486e-08, -1.6009806813599425e-08, -1.5628621952146204e-08, -1.5247437090692983e-08, -1.4866251341061343e-08, -1.4485065591429702e-08, -1.4103878953619642e-08, -1.3722693203988001e-08, -1.334150745435636e-08, -1.296032170472472e-08, -1.257913595509308e-08, -1.2197949317283019e-08, -1.1816763567651378e-08, -1.1435577818019738e-08, -1.1054391180209677e-08, -1.0673205430578037e-08, -1.0292019680946396e-08, -9.910833931314755e-09, -9.529648181683115e-09, -9.148461543873054e-09, -8.767275794241414e-09, -8.386090044609773e-09, -8.004903406799713e-09, -7.623717657168072e-09, -7.242531907536431e-09, -6.861346157904791e-09, -6.48016040827315e-09, -6.0989746586415094e-09, -5.717788909009869e-09, -5.336602715289018e-09, -4.955416965657378e-09, -4.574230771936527e-09, -4.1930450223048865e-09, -3.811859272673246e-09, -3.4306733009970003e-09, -3.0494873293207547e-09, -2.668301357644509e-09, -2.2871153859682636e-09, -1.905929636336623e-09, -1.5247436646603774e-09, -1.1435576929841318e-09, -7.623719433524911e-10, -3.8118597167624557e-10, 0.0]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1023.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 9.313225746154785e-10, 1.862645149230957e-09, 2.7939677238464355e-09, 3.725290298461914e-09, 4.6566128730773926e-09, 5.587935447692871e-09, 6.51925802230835e-09, 7.450580596923828e-09, 8.381903171539307e-09, 9.313225746154785e-09, 1.0244548320770264e-08, 1.1175870895385742e-08, 1.210719347000122e-08, 1.30385160446167e-08, 1.3969838619232178e-08, 1.4901161193847656e-08, 1.5832483768463135e-08, 1.6763806343078613e-08, 1.7695128917694092e-08, 1.862645149230957e-08, 1.955777406692505e-08, 2.0489096641540527e-08, 2.1420419216156006e-08, 2.2351741790771484e-08, 2.3283064365386963e-08, 2.421438694000244e-08, 2.514570951461792e-08, 2.60770320892334e-08, 2.7008354663848877e-08, 2.7939677238464355e-08, 2.8870999813079834e-08, 2.9802322387695312e-08, 3.073364496231079e-08, 3.166496753692627e-08, 3.259629011154175e-08, 3.3527612686157227e-08, 3.4458935260772705e-08, 3.5390257835388184e-08, 3.632158041000366e-08, 3.725290298461914e-08, 3.818422555923462e-08, 3.91155481338501e-08, 4.0046870708465576e-08, 4.0978193283081055e-08, 4.190951585769653e-08, 4.284083843231201e-08, 4.377216100692749e-08, 4.470348358154297e-08, 4.563480615615845e-08, 4.6566128730773926e-08, 4.7497451305389404e-08, 4.842877388000488e-08, 4.936009645462036e-08, 5.029141902923584e-08, 5.122274160385132e-08, 5.21540641784668e-08, 5.3085386753082275e-08, 5.4016709327697754e-08, 5.494803190231323e-08, 5.587935447692871e-08, 5.681067705154419e-08, 5.774199962615967e-08, 5.8673322200775146e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 9.0, 3.0, 8.0, 6.0, 7.0, 20.0, 9.0, 13.0, 11.0, 14.0, 22.0, 32.0, 25.0, 29.0, 37.0, 32.0, 44.0, 39.0, 36.0, 35.0, 42.0, 44.0, 47.0, 23.0, 37.0, 51.0, 36.0, 34.0, 32.0, 34.0, 29.0, 27.0, 29.0, 14.0, 17.0, 9.0, 8.0, 11.0, 11.0, 3.0, 7.0, 7.0, 1.0, 6.0, 6.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.259765625, -2.1829833984375, -2.106201171875, -2.0294189453125, -1.95263671875, -1.8758544921875, -1.799072265625, -1.7222900390625, -1.6455078125, -1.5687255859375, -1.491943359375, -1.4151611328125, -1.33837890625, -1.2615966796875, -1.184814453125, -1.1080322265625, -1.03125, -0.9544677734375, -0.877685546875, -0.8009033203125, -0.72412109375, -0.6473388671875, -0.570556640625, -0.4937744140625, -0.4169921875, -0.3402099609375, -0.263427734375, -0.1866455078125, -0.10986328125, -0.0330810546875, 0.043701171875, 0.1204833984375, 0.197265625, 0.2740478515625, 0.350830078125, 0.4276123046875, 0.50439453125, 0.5811767578125, 0.657958984375, 0.7347412109375, 0.8115234375, 0.8883056640625, 0.965087890625, 1.0418701171875, 1.11865234375, 1.1954345703125, 1.272216796875, 1.3489990234375, 1.42578125, 1.5025634765625, 1.579345703125, 1.6561279296875, 1.73291015625, 1.8096923828125, 1.886474609375, 1.9632568359375, 2.0400390625, 2.1168212890625, 2.193603515625, 2.2703857421875, 2.34716796875, 2.4239501953125, 2.500732421875, 2.5775146484375, 2.654296875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 5.0, 8.0, 14.0, 25.0, 49.0, 63.0, 97.0, 187.0, 361.0, 562.0, 1029.0, 1795.0, 3323.0, 6017.0, 11507.0, 21801.0, 41989.0, 81398.0, 197352.0, 430352.0, 123197.0, 60115.0, 31633.0, 16352.0, 8778.0, 4704.0, 2636.0, 1363.0, 772.0, 457.0, 252.0, 166.0, 83.0, 48.0, 24.0, 21.0, 9.0, 10.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.55078125, -2.457275390625, -2.36376953125, -2.270263671875, -2.1767578125, -2.083251953125, -1.98974609375, -1.896240234375, -1.802734375, -1.709228515625, -1.61572265625, -1.522216796875, -1.4287109375, -1.335205078125, -1.24169921875, -1.148193359375, -1.0546875, -0.961181640625, -0.86767578125, -0.774169921875, -0.6806640625, -0.587158203125, -0.49365234375, -0.400146484375, -0.306640625, -0.213134765625, -0.11962890625, -0.026123046875, 0.0673828125, 0.160888671875, 0.25439453125, 0.347900390625, 0.44140625, 0.534912109375, 0.62841796875, 0.721923828125, 0.8154296875, 0.908935546875, 1.00244140625, 1.095947265625, 1.189453125, 1.282958984375, 1.37646484375, 1.469970703125, 1.5634765625, 1.656982421875, 1.75048828125, 1.843994140625, 1.9375, 2.031005859375, 2.12451171875, 2.218017578125, 2.3115234375, 2.405029296875, 2.49853515625, 2.592041015625, 2.685546875, 2.779052734375, 2.87255859375, 2.966064453125, 3.0595703125, 3.153076171875, 3.24658203125, 3.340087890625, 3.43359375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 4.0, 2.0, 3.0, 4.0, 10.0, 9.0, 8.0, 3.0, 4.0, 8.0, 16.0, 22.0, 17.0, 21.0, 26.0, 32.0, 25.0, 47.0, 45.0, 53.0, 56.0, 74.0, 141.0, 1461.0, 372.0, 123.0, 79.0, 56.0, 46.0, 42.0, 33.0, 29.0, 31.0, 32.0, 32.0, 24.0, 11.0, 12.0, 9.0, 7.0, 4.0, 3.0, 5.0, 2.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.921875, -9.64581298828125, -9.3697509765625, -9.09368896484375, -8.817626953125, -8.54156494140625, -8.2655029296875, -7.98944091796875, -7.71337890625, -7.43731689453125, -7.1612548828125, -6.88519287109375, -6.609130859375, -6.33306884765625, -6.0570068359375, -5.78094482421875, -5.5048828125, -5.22882080078125, -4.9527587890625, -4.67669677734375, -4.400634765625, -4.12457275390625, -3.8485107421875, -3.57244873046875, -3.29638671875, -3.02032470703125, -2.7442626953125, -2.46820068359375, -2.192138671875, -1.91607666015625, -1.6400146484375, -1.36395263671875, -1.087890625, -0.81182861328125, -0.5357666015625, -0.25970458984375, 0.016357421875, 0.29241943359375, 0.5684814453125, 0.84454345703125, 1.12060546875, 1.39666748046875, 1.6727294921875, 1.94879150390625, 2.224853515625, 2.50091552734375, 2.7769775390625, 3.05303955078125, 3.3291015625, 3.60516357421875, 3.8812255859375, 4.15728759765625, 4.433349609375, 4.70941162109375, 4.9854736328125, 5.26153564453125, 5.53759765625, 5.81365966796875, 6.0897216796875, 6.36578369140625, 6.641845703125, 6.91790771484375, 7.1939697265625, 7.47003173828125, 7.74609375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 7.0, 1.0, 4.0, 3.0, 1.0, 4.0, 8.0, 7.0, 6.0, 14.0, 22.0, 21.0, 46.0, 51.0, 61.0, 83.0, 104.0, 139.0, 214.0, 349.0, 1063.0, 11363.0, 735154.0, 2375581.0, 18699.0, 1408.0, 395.0, 228.0, 178.0, 112.0, 86.0, 62.0, 53.0, 38.0, 34.0, 27.0, 18.0, 13.0, 13.0, 5.0, 6.0, 12.0, 5.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.3125, -14.7470703125, -14.181640625, -13.6162109375, -13.05078125, -12.4853515625, -11.919921875, -11.3544921875, -10.7890625, -10.2236328125, -9.658203125, -9.0927734375, -8.52734375, -7.9619140625, -7.396484375, -6.8310546875, -6.265625, -5.7001953125, -5.134765625, -4.5693359375, -4.00390625, -3.4384765625, -2.873046875, -2.3076171875, -1.7421875, -1.1767578125, -0.611328125, -0.0458984375, 0.51953125, 1.0849609375, 1.650390625, 2.2158203125, 2.78125, 3.3466796875, 3.912109375, 4.4775390625, 5.04296875, 5.6083984375, 6.173828125, 6.7392578125, 7.3046875, 7.8701171875, 8.435546875, 9.0009765625, 9.56640625, 10.1318359375, 10.697265625, 11.2626953125, 11.828125, 12.3935546875, 12.958984375, 13.5244140625, 14.08984375, 14.6552734375, 15.220703125, 15.7861328125, 16.3515625, 16.9169921875, 17.482421875, 18.0478515625, 18.61328125, 19.1787109375, 19.744140625, 20.3095703125, 20.875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 113.0, 800.0, 101.0, 4.0], "bins": [-266.6261291503906, -262.2872619628906, -257.9483947753906, -253.60952758789062, -249.27066040039062, -244.93177795410156, -240.59291076660156, -236.25404357910156, -231.91517639160156, -227.57630920410156, -223.23744201660156, -218.89857482910156, -214.5596923828125, -210.2208251953125, -205.8819580078125, -201.5430908203125, -197.2042236328125, -192.8653564453125, -188.5264892578125, -184.1876220703125, -179.8487548828125, -175.50987243652344, -171.17100524902344, -166.83213806152344, -162.49327087402344, -158.15440368652344, -153.81553649902344, -149.47666931152344, -145.13778686523438, -140.79891967773438, -136.46005249023438, -132.12118530273438, -127.78233337402344, -123.44346618652344, -119.10459899902344, -114.7657241821289, -110.4268569946289, -106.0879898071289, -101.74911499023438, -97.41024780273438, -93.07138061523438, -88.73251342773438, -84.39364624023438, -80.05477142333984, -75.71590423583984, -71.37703704833984, -67.03816223144531, -62.69929504394531, -58.36042785644531, -54.02156066894531, -49.68268966674805, -45.34381866455078, -41.00495147705078, -36.66608428955078, -32.327213287353516, -27.988344192504883, -23.64947509765625, -19.310606002807617, -14.971736907958984, -10.632867813110352, -6.293998718261719, -1.955129623413086, 2.383739471435547, 6.72260856628418, 11.061477661132812]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 7.0, 8.0, 7.0, 13.0, 12.0, 10.0, 14.0, 16.0, 18.0, 20.0, 32.0, 22.0, 31.0, 36.0, 32.0, 38.0, 36.0, 43.0, 39.0, 33.0, 32.0, 36.0, 35.0, 34.0, 46.0, 35.0, 37.0, 26.0, 33.0, 25.0, 26.0, 18.0, 19.0, 22.0, 14.0, 18.0, 10.0, 8.0, 13.0, 7.0, 10.0, 2.0, 9.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.844926834106445, -24.092288970947266, -23.339649200439453, -22.58700942993164, -21.83437156677246, -21.08173370361328, -20.32909393310547, -19.576454162597656, -18.823816299438477, -18.071178436279297, -17.318538665771484, -16.565898895263672, -15.813261032104492, -15.060622215270996, -14.3079833984375, -13.555344581604004, -12.802705764770508, -12.050066947937012, -11.297428131103516, -10.54478931427002, -9.792150497436523, -9.039511680603027, -8.286872863769531, -7.534234046936035, -6.781595230102539, -6.028956413269043, -5.276317596435547, -4.523678779602051, -3.7710399627685547, -3.0184011459350586, -2.2657623291015625, -1.5131235122680664, -0.7604827880859375, -0.007843971252441406, 0.7447948455810547, 1.4974336624145508, 2.250072479248047, 3.002711296081543, 3.755350112915039, 4.507988929748535, 5.260627746582031, 6.013266563415527, 6.765905380249023, 7.5185441970825195, 8.271183013916016, 9.023821830749512, 9.776460647583008, 10.529099464416504, 11.28173828125, 12.034377098083496, 12.787015914916992, 13.539654731750488, 14.292293548583984, 15.04493236541748, 15.797571182250977, 16.550209045410156, 17.30284881591797, 18.05548858642578, 18.80812644958496, 19.56076431274414, 20.313404083251953, 21.066043853759766, 21.818681716918945, 22.571319580078125, 23.323959350585938]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 9.0, 4.0, 8.0, 13.0, 11.0, 6.0, 7.0, 14.0, 18.0, 15.0, 17.0, 23.0, 39.0, 30.0, 37.0, 34.0, 31.0, 36.0, 39.0, 39.0, 30.0, 38.0, 45.0, 46.0, 34.0, 40.0, 35.0, 31.0, 30.0, 18.0, 40.0, 27.0, 25.0, 23.0, 24.0, 17.0, 12.0, 6.0, 9.0, 10.0, 7.0, 3.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.361328125, -2.2818603515625, -2.202392578125, -2.1229248046875, -2.04345703125, -1.9639892578125, -1.884521484375, -1.8050537109375, -1.7255859375, -1.6461181640625, -1.566650390625, -1.4871826171875, -1.40771484375, -1.3282470703125, -1.248779296875, -1.1693115234375, -1.08984375, -1.0103759765625, -0.930908203125, -0.8514404296875, -0.77197265625, -0.6925048828125, -0.613037109375, -0.5335693359375, -0.4541015625, -0.3746337890625, -0.295166015625, -0.2156982421875, -0.13623046875, -0.0567626953125, 0.022705078125, 0.1021728515625, 0.181640625, 0.2611083984375, 0.340576171875, 0.4200439453125, 0.49951171875, 0.5789794921875, 0.658447265625, 0.7379150390625, 0.8173828125, 0.8968505859375, 0.976318359375, 1.0557861328125, 1.13525390625, 1.2147216796875, 1.294189453125, 1.3736572265625, 1.453125, 1.5325927734375, 1.612060546875, 1.6915283203125, 1.77099609375, 1.8504638671875, 1.929931640625, 2.0093994140625, 2.0888671875, 2.1683349609375, 2.247802734375, 2.3272705078125, 2.40673828125, 2.4862060546875, 2.565673828125, 2.6451416015625, 2.724609375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 13.0, 7.0, 11.0, 9.0, 12.0, 15.0, 9.0, 25.0, 30.0, 42.0, 46.0, 64.0, 126.0, 222.0, 447.0, 1253.0, 3876.0, 15484.0, 85891.0, 790957.0, 2676925.0, 536980.0, 63938.0, 12416.0, 3241.0, 1099.0, 496.0, 221.0, 129.0, 77.0, 61.0, 29.0, 23.0, 18.0, 16.0, 14.0, 10.0, 5.0, 10.0, 6.0, 2.0, 4.0, 6.0, 2.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.140625, -6.9058837890625, -6.671142578125, -6.4364013671875, -6.20166015625, -5.9669189453125, -5.732177734375, -5.4974365234375, -5.2626953125, -5.0279541015625, -4.793212890625, -4.5584716796875, -4.32373046875, -4.0889892578125, -3.854248046875, -3.6195068359375, -3.384765625, -3.1500244140625, -2.915283203125, -2.6805419921875, -2.44580078125, -2.2110595703125, -1.976318359375, -1.7415771484375, -1.5068359375, -1.2720947265625, -1.037353515625, -0.8026123046875, -0.56787109375, -0.3331298828125, -0.098388671875, 0.1363525390625, 0.37109375, 0.6058349609375, 0.840576171875, 1.0753173828125, 1.31005859375, 1.5447998046875, 1.779541015625, 2.0142822265625, 2.2490234375, 2.4837646484375, 2.718505859375, 2.9532470703125, 3.18798828125, 3.4227294921875, 3.657470703125, 3.8922119140625, 4.126953125, 4.3616943359375, 4.596435546875, 4.8311767578125, 5.06591796875, 5.3006591796875, 5.535400390625, 5.7701416015625, 6.0048828125, 6.2396240234375, 6.474365234375, 6.7091064453125, 6.94384765625, 7.1785888671875, 7.413330078125, 7.6480712890625, 7.8828125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 5.0, 10.0, 13.0, 24.0, 30.0, 28.0, 41.0, 53.0, 67.0, 102.0, 139.0, 192.0, 246.0, 319.0, 372.0, 444.0, 455.0, 360.0, 272.0, 254.0, 172.0, 133.0, 93.0, 78.0, 40.0, 36.0, 24.0, 21.0, 18.0, 11.0, 10.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.67578125, -5.49169921875, -5.3076171875, -5.12353515625, -4.939453125, -4.75537109375, -4.5712890625, -4.38720703125, -4.203125, -4.01904296875, -3.8349609375, -3.65087890625, -3.466796875, -3.28271484375, -3.0986328125, -2.91455078125, -2.73046875, -2.54638671875, -2.3623046875, -2.17822265625, -1.994140625, -1.81005859375, -1.6259765625, -1.44189453125, -1.2578125, -1.07373046875, -0.8896484375, -0.70556640625, -0.521484375, -0.33740234375, -0.1533203125, 0.03076171875, 0.21484375, 0.39892578125, 0.5830078125, 0.76708984375, 0.951171875, 1.13525390625, 1.3193359375, 1.50341796875, 1.6875, 1.87158203125, 2.0556640625, 2.23974609375, 2.423828125, 2.60791015625, 2.7919921875, 2.97607421875, 3.16015625, 3.34423828125, 3.5283203125, 3.71240234375, 3.896484375, 4.08056640625, 4.2646484375, 4.44873046875, 4.6328125, 4.81689453125, 5.0009765625, 5.18505859375, 5.369140625, 5.55322265625, 5.7373046875, 5.92138671875, 6.10546875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 4.0, 14.0, 21.0, 16.0, 31.0, 31.0, 46.0, 83.0, 123.0, 146.0, 230.0, 333.0, 625.0, 3511.0, 106962.0, 3537351.0, 531688.0, 10913.0, 923.0, 375.0, 248.0, 158.0, 126.0, 83.0, 55.0, 45.0, 45.0, 30.0, 26.0, 11.0, 12.0, 8.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.765625, -21.13818359375, -20.5107421875, -19.88330078125, -19.255859375, -18.62841796875, -18.0009765625, -17.37353515625, -16.74609375, -16.11865234375, -15.4912109375, -14.86376953125, -14.236328125, -13.60888671875, -12.9814453125, -12.35400390625, -11.7265625, -11.09912109375, -10.4716796875, -9.84423828125, -9.216796875, -8.58935546875, -7.9619140625, -7.33447265625, -6.70703125, -6.07958984375, -5.4521484375, -4.82470703125, -4.197265625, -3.56982421875, -2.9423828125, -2.31494140625, -1.6875, -1.06005859375, -0.4326171875, 0.19482421875, 0.822265625, 1.44970703125, 2.0771484375, 2.70458984375, 3.33203125, 3.95947265625, 4.5869140625, 5.21435546875, 5.841796875, 6.46923828125, 7.0966796875, 7.72412109375, 8.3515625, 8.97900390625, 9.6064453125, 10.23388671875, 10.861328125, 11.48876953125, 12.1162109375, 12.74365234375, 13.37109375, 13.99853515625, 14.6259765625, 15.25341796875, 15.880859375, 16.50830078125, 17.1357421875, 17.76318359375, 18.390625]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 12.0, 73.0, 234.0, 379.0, 233.0, 75.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.6937713623047, -125.3545913696289, -122.01541137695312, -118.67623138427734, -115.33705139160156, -111.99787139892578, -108.65869140625, -105.31951904296875, -101.98033142089844, -98.64115142822266, -95.30197143554688, -91.9627914428711, -88.62361145019531, -85.28443145751953, -81.94525146484375, -78.6060791015625, -75.26689910888672, -71.92771911621094, -68.58853912353516, -65.24935913085938, -61.910179138183594, -58.57099914550781, -55.2318229675293, -51.892642974853516, -48.553462982177734, -45.21428298950195, -41.87510299682617, -38.535926818847656, -35.196746826171875, -31.85756492614746, -28.518386840820312, -25.17920684814453, -21.84003448486328, -18.5008544921875, -15.161675453186035, -11.82249641418457, -8.483316421508789, -5.144136428833008, -1.8049583435058594, 1.5342216491699219, 4.873401641845703, 8.212581634521484, 11.55176067352295, 14.890939712524414, 18.230119705200195, 21.569299697875977, 24.908477783203125, 28.247657775878906, 31.586837768554688, 34.92601776123047, 38.26519775390625, 41.60437774658203, 44.94355773925781, 48.282737731933594, 51.62191390991211, 54.96109390258789, 58.30027389526367, 61.63945388793945, 64.97863006591797, 68.31781005859375, 71.65699005126953, 74.99617004394531, 78.3353500366211, 81.67453002929688, 85.01371002197266]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 5.0, 8.0, 7.0, 6.0, 8.0, 8.0, 10.0, 19.0, 13.0, 9.0, 12.0, 26.0, 22.0, 29.0, 21.0, 29.0, 23.0, 29.0, 21.0, 30.0, 35.0, 34.0, 45.0, 42.0, 38.0, 33.0, 39.0, 41.0, 47.0, 21.0, 33.0, 30.0, 28.0, 32.0, 21.0, 20.0, 19.0, 12.0, 15.0, 13.0, 9.0, 11.0, 5.0, 7.0, 7.0, 12.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-15.971534729003906, -15.46187686920166, -14.952219009399414, -14.442560195922852, -13.932902336120605, -13.42324447631836, -12.913585662841797, -12.40392780303955, -11.894269943237305, -11.384612083435059, -10.874954223632812, -10.36529541015625, -9.855637550354004, -9.345979690551758, -8.836320877075195, -8.32666301727295, -7.817005157470703, -7.307347297668457, -6.797688961029053, -6.288030624389648, -5.778372764587402, -5.268714904785156, -4.759056568145752, -4.249398231506348, -3.7397403717041016, -3.2300822734832764, -2.720424175262451, -2.210766077041626, -1.7011079788208008, -1.1914498805999756, -0.6817917823791504, -0.1721336841583252, 0.3375244140625, 0.8471825122833252, 1.3568406105041504, 1.8664987087249756, 2.376156806945801, 2.885814905166626, 3.395473003387451, 3.9051311016082764, 4.414789199829102, 4.924447059631348, 5.434105396270752, 5.943763732910156, 6.453421592712402, 6.963079452514648, 7.472737789154053, 7.982396125793457, 8.492053985595703, 9.00171184539795, 9.511369705200195, 10.021028518676758, 10.530686378479004, 11.04034423828125, 11.550003051757812, 12.059660911560059, 12.569318771362305, 13.07897663116455, 13.588634490966797, 14.09829330444336, 14.607951164245605, 15.117609024047852, 15.627267837524414, 16.136924743652344, 16.646583557128906]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 4.0, 8.0, 8.0, 4.0, 12.0, 9.0, 15.0, 13.0, 16.0, 19.0, 24.0, 19.0, 32.0, 30.0, 34.0, 36.0, 45.0, 38.0, 33.0, 43.0, 50.0, 41.0, 43.0, 42.0, 37.0, 36.0, 39.0, 36.0, 30.0, 36.0, 30.0, 26.0, 18.0, 21.0, 15.0, 10.0, 7.0, 10.0, 7.0, 5.0, 4.0, 5.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.51953125, -2.436309814453125, -2.35308837890625, -2.269866943359375, -2.1866455078125, -2.103424072265625, -2.02020263671875, -1.936981201171875, -1.853759765625, -1.770538330078125, -1.68731689453125, -1.604095458984375, -1.5208740234375, -1.437652587890625, -1.35443115234375, -1.271209716796875, -1.18798828125, -1.104766845703125, -1.02154541015625, -0.938323974609375, -0.8551025390625, -0.771881103515625, -0.68865966796875, -0.605438232421875, -0.522216796875, -0.438995361328125, -0.35577392578125, -0.272552490234375, -0.1893310546875, -0.106109619140625, -0.02288818359375, 0.060333251953125, 0.1435546875, 0.226776123046875, 0.30999755859375, 0.393218994140625, 0.4764404296875, 0.559661865234375, 0.64288330078125, 0.726104736328125, 0.809326171875, 0.892547607421875, 0.97576904296875, 1.058990478515625, 1.1422119140625, 1.225433349609375, 1.30865478515625, 1.391876220703125, 1.47509765625, 1.558319091796875, 1.64154052734375, 1.724761962890625, 1.8079833984375, 1.891204833984375, 1.97442626953125, 2.057647705078125, 2.140869140625, 2.224090576171875, 2.30731201171875, 2.390533447265625, 2.4737548828125, 2.556976318359375, 2.64019775390625, 2.723419189453125, 2.806640625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 7.0, 5.0, 9.0, 19.0, 35.0, 29.0, 49.0, 83.0, 106.0, 143.0, 230.0, 335.0, 465.0, 750.0, 1063.0, 1589.0, 2379.0, 3690.0, 5789.0, 9255.0, 14929.0, 24838.0, 42883.0, 79056.0, 168009.0, 350266.0, 159941.0, 76681.0, 41970.0, 24190.0, 14406.0, 8832.0, 5615.0, 3643.0, 2362.0, 1638.0, 1047.0, 711.0, 480.0, 327.0, 243.0, 140.0, 108.0, 75.0, 41.0, 28.0, 25.0, 15.0, 10.0, 6.0, 7.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01617431640625, -0.015676259994506836, -0.015178203582763672, -0.014680147171020508, -0.014182090759277344, -0.01368403434753418, -0.013185977935791016, -0.012687921524047852, -0.012189865112304688, -0.011691808700561523, -0.01119375228881836, -0.010695695877075195, -0.010197639465332031, -0.009699583053588867, -0.009201526641845703, -0.008703470230102539, -0.008205413818359375, -0.007707357406616211, -0.007209300994873047, -0.006711244583129883, -0.006213188171386719, -0.005715131759643555, -0.005217075347900391, -0.0047190189361572266, -0.0042209625244140625, -0.0037229061126708984, -0.0032248497009277344, -0.0027267932891845703, -0.0022287368774414062, -0.0017306804656982422, -0.0012326240539550781, -0.0007345676422119141, -0.00023651123046875, 0.00026154518127441406, 0.0007596015930175781, 0.0012576580047607422, 0.0017557144165039062, 0.0022537708282470703, 0.0027518272399902344, 0.0032498836517333984, 0.0037479400634765625, 0.0042459964752197266, 0.004744052886962891, 0.005242109298706055, 0.005740165710449219, 0.006238222122192383, 0.006736278533935547, 0.007234334945678711, 0.007732391357421875, 0.008230447769165039, 0.008728504180908203, 0.009226560592651367, 0.009724617004394531, 0.010222673416137695, 0.01072072982788086, 0.011218786239624023, 0.011716842651367188, 0.012214899063110352, 0.012712955474853516, 0.01321101188659668, 0.013709068298339844, 0.014207124710083008, 0.014705181121826172, 0.015203237533569336, 0.0157012939453125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 10.0, 11.0, 12.0, 17.0, 9.0, 20.0, 13.0, 34.0, 21.0, 31.0, 20.0, 39.0, 35.0, 28.0, 39.0, 35.0, 38.0, 35.0, 1062.0, 37.0, 48.0, 44.0, 42.0, 33.0, 26.0, 31.0, 42.0, 40.0, 28.0, 26.0, 19.0, 24.0, 12.0, 19.0, 6.0, 9.0, 11.0, 7.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.806640625, -1.7514190673828125, -1.696197509765625, -1.6409759521484375, -1.58575439453125, -1.5305328369140625, -1.475311279296875, -1.4200897216796875, -1.3648681640625, -1.3096466064453125, -1.254425048828125, -1.1992034912109375, -1.14398193359375, -1.0887603759765625, -1.033538818359375, -0.9783172607421875, -0.923095703125, -0.8678741455078125, -0.812652587890625, -0.7574310302734375, -0.70220947265625, -0.6469879150390625, -0.591766357421875, -0.5365447998046875, -0.4813232421875, -0.4261016845703125, -0.370880126953125, -0.3156585693359375, -0.26043701171875, -0.2052154541015625, -0.149993896484375, -0.0947723388671875, -0.03955078125, 0.0156707763671875, 0.070892333984375, 0.1261138916015625, 0.18133544921875, 0.2365570068359375, 0.291778564453125, 0.3470001220703125, 0.4022216796875, 0.4574432373046875, 0.512664794921875, 0.5678863525390625, 0.62310791015625, 0.6783294677734375, 0.733551025390625, 0.7887725830078125, 0.843994140625, 0.8992156982421875, 0.954437255859375, 1.0096588134765625, 1.06488037109375, 1.1201019287109375, 1.175323486328125, 1.2305450439453125, 1.2857666015625, 1.3409881591796875, 1.396209716796875, 1.4514312744140625, 1.50665283203125, 1.5618743896484375, 1.617095947265625, 1.6723175048828125, 1.7275390625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 14.0, 11.0, 24.0, 33.0, 50.0, 71.0, 122.0, 187.0, 265.0, 399.0, 563.0, 982.0, 1543.0, 2188.0, 3621.0, 5786.0, 9224.0, 15008.0, 24491.0, 40315.0, 67074.0, 123018.0, 1316240.0, 227594.0, 104741.0, 59905.0, 35452.0, 22248.0, 13300.0, 8323.0, 5233.0, 3255.0, 2016.0, 1365.0, 868.0, 543.0, 353.0, 229.0, 166.0, 110.0, 62.0, 46.0, 31.0, 18.0, 18.0, 10.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0105743408203125, -0.010242700576782227, -0.009911060333251953, -0.00957942008972168, -0.009247779846191406, -0.008916139602661133, -0.00858449935913086, -0.008252859115600586, -0.007921218872070312, -0.007589578628540039, -0.007257938385009766, -0.006926298141479492, -0.006594657897949219, -0.006263017654418945, -0.005931377410888672, -0.0055997371673583984, -0.005268096923828125, -0.0049364566802978516, -0.004604816436767578, -0.004273176193237305, -0.003941535949707031, -0.003609895706176758, -0.0032782554626464844, -0.002946615219116211, -0.0026149749755859375, -0.002283334732055664, -0.0019516944885253906, -0.0016200542449951172, -0.0012884140014648438, -0.0009567737579345703, -0.0006251335144042969, -0.00029349327087402344, 3.814697265625e-05, 0.00036978721618652344, 0.0007014274597167969, 0.0010330677032470703, 0.0013647079467773438, 0.0016963481903076172, 0.0020279884338378906, 0.002359628677368164, 0.0026912689208984375, 0.003022909164428711, 0.0033545494079589844, 0.003686189651489258, 0.004017829895019531, 0.004349470138549805, 0.004681110382080078, 0.0050127506256103516, 0.005344390869140625, 0.0056760311126708984, 0.006007671356201172, 0.006339311599731445, 0.006670951843261719, 0.007002592086791992, 0.007334232330322266, 0.007665872573852539, 0.007997512817382812, 0.008329153060913086, 0.00866079330444336, 0.008992433547973633, 0.009324073791503906, 0.00965571403503418, 0.009987354278564453, 0.010318994522094727, 0.010650634765625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 920.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-07, -1.1455267667770386e-07, -1.0989606380462646e-07, -1.0523945093154907e-07, -1.0058283805847168e-07, -9.592622518539429e-08, -9.12696123123169e-08, -8.66129994392395e-08, -8.195638656616211e-08, -7.729977369308472e-08, -7.264316082000732e-08, -6.798654794692993e-08, -6.332993507385254e-08, -5.8673322200775146e-08, -5.4016709327697754e-08, -4.936009645462036e-08, -4.470348358154297e-08, -4.0046870708465576e-08, -3.5390257835388184e-08, -3.073364496231079e-08, -2.60770320892334e-08, -2.1420419216156006e-08, -1.6763806343078613e-08, -1.210719347000122e-08, -7.450580596923828e-09, -2.7939677238464355e-09, 1.862645149230957e-09, 6.51925802230835e-09, 1.1175870895385742e-08, 1.5832483768463135e-08, 2.0489096641540527e-08, 2.514570951461792e-08, 2.9802322387695312e-08, 3.4458935260772705e-08, 3.91155481338501e-08, 4.377216100692749e-08, 4.842877388000488e-08, 5.3085386753082275e-08, 5.774199962615967e-08, 6.239861249923706e-08, 6.705522537231445e-08, 7.171183824539185e-08, 7.636845111846924e-08, 8.102506399154663e-08, 8.568167686462402e-08, 9.033828973770142e-08, 9.499490261077881e-08, 9.96515154838562e-08, 1.043081283569336e-07, 1.0896474123001099e-07, 1.1362135410308838e-07, 1.1827796697616577e-07, 1.2293457984924316e-07, 1.2759119272232056e-07, 1.3224780559539795e-07, 1.3690441846847534e-07, 1.4156103134155273e-07, 1.4621764421463013e-07, 1.5087425708770752e-07, 1.555308699607849e-07, 1.601874828338623e-07, 1.648440957069397e-07, 1.695007085800171e-07, 1.7415732145309448e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0, 4.0, 5.0, 8.0, 0.0, 28.0, 0.0, 2.0, 6.0, 45.0, 56.0, 468.0, 3761.0, 1013982.0, 25755.0, 4200.0, 114.0, 29.0, 41.0, 4.0, 0.0, 14.0, 17.0, 5.0, 3.0, 0.0, 11.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7550926208496094e-06, -3.6582350730895996e-06, -3.56137752532959e-06, -3.46451997756958e-06, -3.3676624298095703e-06, -3.2708048820495605e-06, -3.1739473342895508e-06, -3.077089786529541e-06, -2.9802322387695312e-06, -2.8833746910095215e-06, -2.7865171432495117e-06, -2.689659595489502e-06, -2.592802047729492e-06, -2.4959444999694824e-06, -2.3990869522094727e-06, -2.302229404449463e-06, -2.205371856689453e-06, -2.1085143089294434e-06, -2.0116567611694336e-06, -1.914799213409424e-06, -1.817941665649414e-06, -1.7210841178894043e-06, -1.6242265701293945e-06, -1.5273690223693848e-06, -1.430511474609375e-06, -1.3336539268493652e-06, -1.2367963790893555e-06, -1.1399388313293457e-06, -1.043081283569336e-06, -9.462237358093262e-07, -8.493661880493164e-07, -7.525086402893066e-07, -6.556510925292969e-07, -5.587935447692871e-07, -4.6193599700927734e-07, -3.650784492492676e-07, -2.682209014892578e-07, -1.7136335372924805e-07, -7.450580596923828e-08, 2.2351741790771484e-08, 1.1920928955078125e-07, 2.1606683731079102e-07, 3.129243850708008e-07, 4.0978193283081055e-07, 5.066394805908203e-07, 6.034970283508301e-07, 7.003545761108398e-07, 7.972121238708496e-07, 8.940696716308594e-07, 9.909272193908691e-07, 1.087784767150879e-06, 1.1846423149108887e-06, 1.2814998626708984e-06, 1.3783574104309082e-06, 1.475214958190918e-06, 1.5720725059509277e-06, 1.6689300537109375e-06, 1.7657876014709473e-06, 1.862645149230957e-06, 1.959502696990967e-06, 2.0563602447509766e-06, 2.1532177925109863e-06, 2.250075340270996e-06, 2.346932888031006e-06, 2.4437904357910156e-06]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 4.0, 8.0, 8.0, 4.0, 12.0, 9.0, 15.0, 13.0, 16.0, 19.0, 24.0, 19.0, 32.0, 30.0, 34.0, 36.0, 45.0, 38.0, 33.0, 43.0, 50.0, 41.0, 43.0, 42.0, 37.0, 36.0, 39.0, 36.0, 30.0, 36.0, 30.0, 26.0, 18.0, 21.0, 15.0, 10.0, 7.0, 10.0, 7.0, 5.0, 4.0, 5.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.51953125, -2.436309814453125, -2.35308837890625, -2.269866943359375, -2.1866455078125, -2.103424072265625, -2.02020263671875, -1.936981201171875, -1.853759765625, -1.770538330078125, -1.68731689453125, -1.604095458984375, -1.5208740234375, -1.437652587890625, -1.35443115234375, -1.271209716796875, -1.18798828125, -1.104766845703125, -1.02154541015625, -0.938323974609375, -0.8551025390625, -0.771881103515625, -0.68865966796875, -0.605438232421875, -0.522216796875, -0.438995361328125, -0.35577392578125, -0.272552490234375, -0.1893310546875, -0.106109619140625, -0.02288818359375, 0.060333251953125, 0.1435546875, 0.226776123046875, 0.30999755859375, 0.393218994140625, 0.4764404296875, 0.559661865234375, 0.64288330078125, 0.726104736328125, 0.809326171875, 0.892547607421875, 0.97576904296875, 1.058990478515625, 1.1422119140625, 1.225433349609375, 1.30865478515625, 1.391876220703125, 1.47509765625, 1.558319091796875, 1.64154052734375, 1.724761962890625, 1.8079833984375, 1.891204833984375, 1.97442626953125, 2.057647705078125, 2.140869140625, 2.224090576171875, 2.30731201171875, 2.390533447265625, 2.4737548828125, 2.556976318359375, 2.64019775390625, 2.723419189453125, 2.806640625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 7.0, 14.0, 8.0, 18.0, 28.0, 50.0, 79.0, 117.0, 214.0, 294.0, 482.0, 700.0, 1053.0, 1685.0, 2555.0, 3662.0, 5641.0, 8608.0, 13509.0, 23390.0, 45808.0, 110490.0, 331359.0, 297673.0, 99670.0, 42131.0, 21985.0, 12964.0, 8418.0, 5465.0, 3564.0, 2361.0, 1609.0, 1016.0, 647.0, 459.0, 305.0, 193.0, 119.0, 82.0, 52.0, 25.0, 21.0, 12.0, 12.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9248046875, -1.8506317138671875, -1.776458740234375, -1.7022857666015625, -1.62811279296875, -1.5539398193359375, -1.479766845703125, -1.4055938720703125, -1.3314208984375, -1.2572479248046875, -1.183074951171875, -1.1089019775390625, -1.03472900390625, -0.9605560302734375, -0.886383056640625, -0.8122100830078125, -0.738037109375, -0.6638641357421875, -0.589691162109375, -0.5155181884765625, -0.44134521484375, -0.3671722412109375, -0.292999267578125, -0.2188262939453125, -0.1446533203125, -0.0704803466796875, 0.003692626953125, 0.0778656005859375, 0.15203857421875, 0.2262115478515625, 0.300384521484375, 0.3745574951171875, 0.44873046875, 0.5229034423828125, 0.597076416015625, 0.6712493896484375, 0.74542236328125, 0.8195953369140625, 0.893768310546875, 0.9679412841796875, 1.0421142578125, 1.1162872314453125, 1.190460205078125, 1.2646331787109375, 1.33880615234375, 1.4129791259765625, 1.487152099609375, 1.5613250732421875, 1.635498046875, 1.7096710205078125, 1.783843994140625, 1.8580169677734375, 1.93218994140625, 2.0063629150390625, 2.080535888671875, 2.1547088623046875, 2.2288818359375, 2.3030548095703125, 2.377227783203125, 2.4514007568359375, 2.52557373046875, 2.5997467041015625, 2.673919677734375, 2.7480926513671875, 2.822265625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 1.0, 4.0, 1.0, 11.0, 4.0, 6.0, 7.0, 8.0, 10.0, 22.0, 22.0, 31.0, 27.0, 30.0, 34.0, 41.0, 49.0, 33.0, 74.0, 102.0, 226.0, 1545.0, 208.0, 107.0, 58.0, 67.0, 56.0, 38.0, 32.0, 43.0, 27.0, 25.0, 22.0, 13.0, 13.0, 17.0, 9.0, 8.0, 5.0, 4.0, 1.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.0234375, -9.741455078125, -9.45947265625, -9.177490234375, -8.8955078125, -8.613525390625, -8.33154296875, -8.049560546875, -7.767578125, -7.485595703125, -7.20361328125, -6.921630859375, -6.6396484375, -6.357666015625, -6.07568359375, -5.793701171875, -5.51171875, -5.229736328125, -4.94775390625, -4.665771484375, -4.3837890625, -4.101806640625, -3.81982421875, -3.537841796875, -3.255859375, -2.973876953125, -2.69189453125, -2.409912109375, -2.1279296875, -1.845947265625, -1.56396484375, -1.281982421875, -1.0, -0.718017578125, -0.43603515625, -0.154052734375, 0.1279296875, 0.409912109375, 0.69189453125, 0.973876953125, 1.255859375, 1.537841796875, 1.81982421875, 2.101806640625, 2.3837890625, 2.665771484375, 2.94775390625, 3.229736328125, 3.51171875, 3.793701171875, 4.07568359375, 4.357666015625, 4.6396484375, 4.921630859375, 5.20361328125, 5.485595703125, 5.767578125, 6.049560546875, 6.33154296875, 6.613525390625, 6.8955078125, 7.177490234375, 7.45947265625, 7.741455078125, 8.0234375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 3.0, 4.0, 7.0, 12.0, 12.0, 14.0, 25.0, 32.0, 38.0, 53.0, 62.0, 68.0, 108.0, 134.0, 174.0, 241.0, 399.0, 1074.0, 7221.0, 225166.0, 2880887.0, 25974.0, 2355.0, 489.0, 279.0, 206.0, 167.0, 98.0, 88.0, 70.0, 59.0, 42.0, 36.0, 17.0, 14.0, 20.0, 11.0, 9.0, 16.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3984375, -13.8885498046875, -13.378662109375, -12.8687744140625, -12.35888671875, -11.8489990234375, -11.339111328125, -10.8292236328125, -10.3193359375, -9.8094482421875, -9.299560546875, -8.7896728515625, -8.27978515625, -7.7698974609375, -7.260009765625, -6.7501220703125, -6.240234375, -5.7303466796875, -5.220458984375, -4.7105712890625, -4.20068359375, -3.6907958984375, -3.180908203125, -2.6710205078125, -2.1611328125, -1.6512451171875, -1.141357421875, -0.6314697265625, -0.12158203125, 0.3883056640625, 0.898193359375, 1.4080810546875, 1.91796875, 2.4278564453125, 2.937744140625, 3.4476318359375, 3.95751953125, 4.4674072265625, 4.977294921875, 5.4871826171875, 5.9970703125, 6.5069580078125, 7.016845703125, 7.5267333984375, 8.03662109375, 8.5465087890625, 9.056396484375, 9.5662841796875, 10.076171875, 10.5860595703125, 11.095947265625, 11.6058349609375, 12.11572265625, 12.6256103515625, 13.135498046875, 13.6453857421875, 14.1552734375, 14.6651611328125, 15.175048828125, 15.6849365234375, 16.19482421875, 16.7047119140625, 17.214599609375, 17.7244873046875, 18.234375]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 25.0, 122.0, 291.0, 340.0, 182.0, 48.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.730520248413086, -7.510559558868408, -6.2905988693237305, -5.0706377029418945, -3.850677013397217, -2.630716323852539, -1.4107551574707031, -0.1907949447631836, 1.0291662216186523, 2.24912691116333, 3.469087839126587, 4.689048767089844, 5.9090094566345215, 7.128970146179199, 8.348931312561035, 9.568891525268555, 10.78885269165039, 12.008813858032227, 13.228774070739746, 14.448735237121582, 15.668695449829102, 16.888656616210938, 18.108617782592773, 19.32857894897461, 20.548538208007812, 21.76849937438965, 22.988460540771484, 24.208419799804688, 25.428380966186523, 26.64834213256836, 27.868303298950195, 29.08826446533203, 30.308223724365234, 31.52818489074707, 32.748146057128906, 33.96810531616211, 35.18806838989258, 36.40802764892578, 37.62799072265625, 38.84794998168945, 40.067909240722656, 41.28786849975586, 42.50783157348633, 43.72779083251953, 44.94775390625, 46.1677131652832, 47.387672424316406, 48.607635498046875, 49.827598571777344, 51.04755783081055, 52.267520904541016, 53.48748016357422, 54.70744323730469, 55.92740249633789, 57.147361755371094, 58.36732482910156, 59.587284088134766, 60.80724334716797, 62.02720642089844, 63.24716567993164, 64.46712493896484, 65.68708801269531, 66.90705108642578, 68.12700653076172, 69.34696960449219]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 2.0, 4.0, 7.0, 9.0, 7.0, 9.0, 20.0, 14.0, 20.0, 17.0, 21.0, 24.0, 30.0, 31.0, 41.0, 41.0, 30.0, 40.0, 49.0, 37.0, 46.0, 55.0, 47.0, 51.0, 36.0, 38.0, 36.0, 40.0, 31.0, 33.0, 17.0, 18.0, 17.0, 13.0, 12.0, 13.0, 10.0, 9.0, 6.0, 3.0, 7.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.985671997070312, -23.186918258666992, -22.388166427612305, -21.589412689208984, -20.790658950805664, -19.991907119750977, -19.193153381347656, -18.39440155029297, -17.59564781188965, -16.796894073486328, -15.998141288757324, -15.19938850402832, -14.400635719299316, -13.601882934570312, -12.803129196166992, -12.004376411437988, -11.205622673034668, -10.406869888305664, -9.608116149902344, -8.80936336517334, -8.010610580444336, -7.211857318878174, -6.413104057312012, -5.614351272583008, -4.815598011016846, -4.016844749450684, -3.2180919647216797, -2.4193387031555176, -1.6205856800079346, -0.8218326568603516, -0.023079395294189453, 0.7756733894348145, 1.5744266510009766, 2.3731796741485596, 3.1719326972961426, 3.9706859588623047, 4.769438743591309, 5.568192005157471, 6.366945266723633, 7.165698051452637, 7.964451313018799, 8.763204574584961, 9.561957359313965, 10.360710144042969, 11.159463882446289, 11.958216667175293, 12.756969451904297, 13.555723190307617, 14.354475975036621, 15.153228759765625, 15.951982498168945, 16.750736236572266, 17.549488067626953, 18.348241806030273, 19.146995544433594, 19.94574737548828, 20.7445011138916, 21.543254852294922, 22.34200668334961, 23.14076042175293, 23.93951416015625, 24.738265991210938, 25.537019729614258, 26.335773468017578, 27.134525299072266]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 9.0, 9.0, 8.0, 7.0, 10.0, 12.0, 12.0, 16.0, 22.0, 21.0, 25.0, 28.0, 31.0, 30.0, 34.0, 40.0, 34.0, 44.0, 41.0, 47.0, 53.0, 29.0, 41.0, 44.0, 39.0, 35.0, 38.0, 31.0, 27.0, 30.0, 29.0, 18.0, 26.0, 12.0, 12.0, 13.0, 9.0, 6.0, 5.0, 5.0, 3.0, 3.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.6015625, -2.516021728515625, -2.43048095703125, -2.344940185546875, -2.2593994140625, -2.173858642578125, -2.08831787109375, -2.002777099609375, -1.917236328125, -1.831695556640625, -1.74615478515625, -1.660614013671875, -1.5750732421875, -1.489532470703125, -1.40399169921875, -1.318450927734375, -1.23291015625, -1.147369384765625, -1.06182861328125, -0.976287841796875, -0.8907470703125, -0.805206298828125, -0.71966552734375, -0.634124755859375, -0.548583984375, -0.463043212890625, -0.37750244140625, -0.291961669921875, -0.2064208984375, -0.120880126953125, -0.03533935546875, 0.050201416015625, 0.1357421875, 0.221282958984375, 0.30682373046875, 0.392364501953125, 0.4779052734375, 0.563446044921875, 0.64898681640625, 0.734527587890625, 0.820068359375, 0.905609130859375, 0.99114990234375, 1.076690673828125, 1.1622314453125, 1.247772216796875, 1.33331298828125, 1.418853759765625, 1.50439453125, 1.589935302734375, 1.67547607421875, 1.761016845703125, 1.8465576171875, 1.932098388671875, 2.01763916015625, 2.103179931640625, 2.188720703125, 2.274261474609375, 2.35980224609375, 2.445343017578125, 2.5308837890625, 2.616424560546875, 2.70196533203125, 2.787506103515625, 2.873046875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 8.0, 6.0, 17.0, 7.0, 9.0, 24.0, 39.0, 35.0, 68.0, 99.0, 233.0, 383.0, 828.0, 1741.0, 4370.0, 12456.0, 43219.0, 190694.0, 1057691.0, 2141286.0, 588223.0, 110633.0, 27777.0, 8451.0, 3151.0, 1368.0, 633.0, 303.0, 180.0, 100.0, 71.0, 56.0, 25.0, 19.0, 13.0, 14.0, 7.0, 6.0, 3.0, 3.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.3125, -5.1373291015625, -4.962158203125, -4.7869873046875, -4.61181640625, -4.4366455078125, -4.261474609375, -4.0863037109375, -3.9111328125, -3.7359619140625, -3.560791015625, -3.3856201171875, -3.21044921875, -3.0352783203125, -2.860107421875, -2.6849365234375, -2.509765625, -2.3345947265625, -2.159423828125, -1.9842529296875, -1.80908203125, -1.6339111328125, -1.458740234375, -1.2835693359375, -1.1083984375, -0.9332275390625, -0.758056640625, -0.5828857421875, -0.40771484375, -0.2325439453125, -0.057373046875, 0.1177978515625, 0.29296875, 0.4681396484375, 0.643310546875, 0.8184814453125, 0.99365234375, 1.1688232421875, 1.343994140625, 1.5191650390625, 1.6943359375, 1.8695068359375, 2.044677734375, 2.2198486328125, 2.39501953125, 2.5701904296875, 2.745361328125, 2.9205322265625, 3.095703125, 3.2708740234375, 3.446044921875, 3.6212158203125, 3.79638671875, 3.9715576171875, 4.146728515625, 4.3218994140625, 4.4970703125, 4.6722412109375, 4.847412109375, 5.0225830078125, 5.19775390625, 5.3729248046875, 5.548095703125, 5.7232666015625, 5.8984375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 7.0, 3.0, 11.0, 5.0, 13.0, 22.0, 27.0, 51.0, 56.0, 73.0, 83.0, 133.0, 206.0, 253.0, 310.0, 380.0, 442.0, 448.0, 380.0, 325.0, 247.0, 167.0, 123.0, 84.0, 73.0, 44.0, 34.0, 18.0, 16.0, 10.0, 13.0, 9.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3125, -5.13507080078125, -4.9576416015625, -4.78021240234375, -4.602783203125, -4.42535400390625, -4.2479248046875, -4.07049560546875, -3.89306640625, -3.71563720703125, -3.5382080078125, -3.36077880859375, -3.183349609375, -3.00592041015625, -2.8284912109375, -2.65106201171875, -2.4736328125, -2.29620361328125, -2.1187744140625, -1.94134521484375, -1.763916015625, -1.58648681640625, -1.4090576171875, -1.23162841796875, -1.05419921875, -0.87677001953125, -0.6993408203125, -0.52191162109375, -0.344482421875, -0.16705322265625, 0.0103759765625, 0.18780517578125, 0.365234375, 0.54266357421875, 0.7200927734375, 0.89752197265625, 1.074951171875, 1.25238037109375, 1.4298095703125, 1.60723876953125, 1.78466796875, 1.96209716796875, 2.1395263671875, 2.31695556640625, 2.494384765625, 2.67181396484375, 2.8492431640625, 3.02667236328125, 3.2041015625, 3.38153076171875, 3.5589599609375, 3.73638916015625, 3.913818359375, 4.09124755859375, 4.2686767578125, 4.44610595703125, 4.62353515625, 4.80096435546875, 4.9783935546875, 5.15582275390625, 5.333251953125, 5.51068115234375, 5.6881103515625, 5.86553955078125, 6.04296875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 8.0, 10.0, 3.0, 14.0, 30.0, 36.0, 56.0, 71.0, 98.0, 154.0, 199.0, 345.0, 671.0, 3431.0, 74683.0, 3127225.0, 963465.0, 20616.0, 1644.0, 513.0, 314.0, 201.0, 134.0, 83.0, 80.0, 57.0, 50.0, 33.0, 15.0, 8.0, 9.0, 8.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.046875, -19.4541015625, -18.861328125, -18.2685546875, -17.67578125, -17.0830078125, -16.490234375, -15.8974609375, -15.3046875, -14.7119140625, -14.119140625, -13.5263671875, -12.93359375, -12.3408203125, -11.748046875, -11.1552734375, -10.5625, -9.9697265625, -9.376953125, -8.7841796875, -8.19140625, -7.5986328125, -7.005859375, -6.4130859375, -5.8203125, -5.2275390625, -4.634765625, -4.0419921875, -3.44921875, -2.8564453125, -2.263671875, -1.6708984375, -1.078125, -0.4853515625, 0.107421875, 0.7001953125, 1.29296875, 1.8857421875, 2.478515625, 3.0712890625, 3.6640625, 4.2568359375, 4.849609375, 5.4423828125, 6.03515625, 6.6279296875, 7.220703125, 7.8134765625, 8.40625, 8.9990234375, 9.591796875, 10.1845703125, 10.77734375, 11.3701171875, 11.962890625, 12.5556640625, 13.1484375, 13.7412109375, 14.333984375, 14.9267578125, 15.51953125, 16.1123046875, 16.705078125, 17.2978515625, 17.890625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 14.0, 26.0, 37.0, 71.0, 99.0, 114.0, 132.0, 155.0, 136.0, 85.0, 54.0, 39.0, 24.0, 14.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.38740158081055, -34.17501449584961, -32.962623596191406, -31.75023651123047, -30.5378475189209, -29.325458526611328, -28.11307144165039, -26.90068244934082, -25.68829345703125, -24.47590446472168, -23.26351547241211, -22.051128387451172, -20.8387393951416, -19.62635040283203, -18.413963317871094, -17.201574325561523, -15.989185333251953, -14.776796340942383, -13.564408302307129, -12.352020263671875, -11.139631271362305, -9.927242279052734, -8.71485424041748, -7.502466201782227, -6.290077209472656, -5.077688694000244, -3.865300178527832, -2.65291166305542, -1.4405231475830078, -0.2281346321105957, 0.9842538833618164, 2.1966419219970703, 3.409027099609375, 4.621415615081787, 5.833804130554199, 7.046192646026611, 8.258581161499023, 9.470970153808594, 10.683358192443848, 11.895746231079102, 13.108135223388672, 14.320524215698242, 15.532912254333496, 16.74530029296875, 17.95768928527832, 19.17007827758789, 20.382465362548828, 21.5948543548584, 22.80724334716797, 24.01963233947754, 25.23202133178711, 26.444408416748047, 27.656797409057617, 28.869186401367188, 30.081573486328125, 31.293962478637695, 32.506351470947266, 33.7187385559082, 34.931129455566406, 36.143516540527344, 37.35590362548828, 38.568294525146484, 39.78068161010742, 40.993072509765625, 42.20545959472656]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 4.0, 9.0, 11.0, 9.0, 19.0, 16.0, 17.0, 22.0, 27.0, 33.0, 23.0, 21.0, 28.0, 34.0, 30.0, 47.0, 31.0, 34.0, 45.0, 44.0, 35.0, 50.0, 39.0, 39.0, 32.0, 42.0, 32.0, 24.0, 24.0, 37.0, 25.0, 12.0, 17.0, 16.0, 14.0, 14.0, 3.0, 6.0, 4.0, 5.0, 6.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.936317443847656, -17.336288452148438, -16.73625946044922, -16.13623046875, -15.536201477050781, -14.936172485351562, -14.336143493652344, -13.736114501953125, -13.136085510253906, -12.536056518554688, -11.936027526855469, -11.33599853515625, -10.735969543457031, -10.135940551757812, -9.535911560058594, -8.935882568359375, -8.335853576660156, -7.7358245849609375, -7.135795593261719, -6.5357666015625, -5.935737609863281, -5.3357086181640625, -4.735679626464844, -4.135650634765625, -3.5356216430664062, -2.9355926513671875, -2.3355636596679688, -1.73553466796875, -1.1355056762695312, -0.5354766845703125, 0.06455230712890625, 0.664581298828125, 1.2646102905273438, 1.8646392822265625, 2.4646682739257812, 3.064697265625, 3.6647262573242188, 4.2647552490234375, 4.864784240722656, 5.464813232421875, 6.064842224121094, 6.6648712158203125, 7.264900207519531, 7.86492919921875, 8.464958190917969, 9.064987182617188, 9.665016174316406, 10.265045166015625, 10.865074157714844, 11.465103149414062, 12.065132141113281, 12.6651611328125, 13.265190124511719, 13.865219116210938, 14.465248107910156, 15.065277099609375, 15.665306091308594, 16.265335083007812, 16.86536407470703, 17.46539306640625, 18.06542205810547, 18.665451049804688, 19.265480041503906, 19.865509033203125, 20.465538024902344]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 7.0, 6.0, 14.0, 18.0, 20.0, 19.0, 12.0, 21.0, 25.0, 30.0, 24.0, 27.0, 25.0, 40.0, 43.0, 38.0, 54.0, 34.0, 55.0, 38.0, 43.0, 42.0, 46.0, 32.0, 34.0, 36.0, 31.0, 27.0, 15.0, 26.0, 18.0, 15.0, 15.0, 9.0, 14.0, 6.0, 11.0, 9.0, 5.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.568359375, -2.481689453125, -2.39501953125, -2.308349609375, -2.2216796875, -2.135009765625, -2.04833984375, -1.961669921875, -1.875, -1.788330078125, -1.70166015625, -1.614990234375, -1.5283203125, -1.441650390625, -1.35498046875, -1.268310546875, -1.181640625, -1.094970703125, -1.00830078125, -0.921630859375, -0.8349609375, -0.748291015625, -0.66162109375, -0.574951171875, -0.48828125, -0.401611328125, -0.31494140625, -0.228271484375, -0.1416015625, -0.054931640625, 0.03173828125, 0.118408203125, 0.205078125, 0.291748046875, 0.37841796875, 0.465087890625, 0.5517578125, 0.638427734375, 0.72509765625, 0.811767578125, 0.8984375, 0.985107421875, 1.07177734375, 1.158447265625, 1.2451171875, 1.331787109375, 1.41845703125, 1.505126953125, 1.591796875, 1.678466796875, 1.76513671875, 1.851806640625, 1.9384765625, 2.025146484375, 2.11181640625, 2.198486328125, 2.28515625, 2.371826171875, 2.45849609375, 2.545166015625, 2.6318359375, 2.718505859375, 2.80517578125, 2.891845703125, 2.978515625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 14.0, 9.0, 18.0, 22.0, 44.0, 55.0, 88.0, 127.0, 171.0, 271.0, 344.0, 555.0, 821.0, 1236.0, 1791.0, 2620.0, 3814.0, 5661.0, 8678.0, 12995.0, 19501.0, 30771.0, 49934.0, 87234.0, 189151.0, 312299.0, 134232.0, 68983.0, 40954.0, 25738.0, 16615.0, 11204.0, 7446.0, 4840.0, 3219.0, 2326.0, 1543.0, 1045.0, 708.0, 451.0, 321.0, 239.0, 130.0, 112.0, 80.0, 47.0, 39.0, 21.0, 17.0, 12.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0141143798828125, -0.013663530349731445, -0.01321268081665039, -0.012761831283569336, -0.012310981750488281, -0.011860132217407227, -0.011409282684326172, -0.010958433151245117, -0.010507583618164062, -0.010056734085083008, -0.009605884552001953, -0.009155035018920898, -0.008704185485839844, -0.008253335952758789, -0.007802486419677734, -0.00735163688659668, -0.006900787353515625, -0.00644993782043457, -0.005999088287353516, -0.005548238754272461, -0.005097389221191406, -0.0046465396881103516, -0.004195690155029297, -0.003744840621948242, -0.0032939910888671875, -0.002843141555786133, -0.002392292022705078, -0.0019414424896240234, -0.0014905929565429688, -0.001039743423461914, -0.0005888938903808594, -0.0001380443572998047, 0.00031280517578125, 0.0007636547088623047, 0.0012145042419433594, 0.001665353775024414, 0.0021162033081054688, 0.0025670528411865234, 0.003017902374267578, 0.003468751907348633, 0.0039196014404296875, 0.004370450973510742, 0.004821300506591797, 0.0052721500396728516, 0.005722999572753906, 0.006173849105834961, 0.006624698638916016, 0.00707554817199707, 0.007526397705078125, 0.00797724723815918, 0.008428096771240234, 0.008878946304321289, 0.009329795837402344, 0.009780645370483398, 0.010231494903564453, 0.010682344436645508, 0.011133193969726562, 0.011584043502807617, 0.012034893035888672, 0.012485742568969727, 0.012936592102050781, 0.013387441635131836, 0.01383829116821289, 0.014289140701293945, 0.014739990234375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 12.0, 4.0, 3.0, 11.0, 17.0, 11.0, 17.0, 13.0, 12.0, 27.0, 29.0, 33.0, 31.0, 26.0, 24.0, 29.0, 36.0, 42.0, 35.0, 34.0, 47.0, 1071.0, 36.0, 37.0, 41.0, 37.0, 23.0, 30.0, 31.0, 33.0, 21.0, 28.0, 15.0, 19.0, 16.0, 11.0, 17.0, 10.0, 11.0, 11.0, 10.0, 5.0, 7.0, 1.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-1.7587890625, -1.7071685791015625, -1.655548095703125, -1.6039276123046875, -1.55230712890625, -1.5006866455078125, -1.449066162109375, -1.3974456787109375, -1.3458251953125, -1.2942047119140625, -1.242584228515625, -1.1909637451171875, -1.13934326171875, -1.0877227783203125, -1.036102294921875, -0.9844818115234375, -0.932861328125, -0.8812408447265625, -0.829620361328125, -0.7779998779296875, -0.72637939453125, -0.6747589111328125, -0.623138427734375, -0.5715179443359375, -0.5198974609375, -0.4682769775390625, -0.416656494140625, -0.3650360107421875, -0.31341552734375, -0.2617950439453125, -0.210174560546875, -0.1585540771484375, -0.10693359375, -0.0553131103515625, -0.003692626953125, 0.0479278564453125, 0.09954833984375, 0.1511688232421875, 0.202789306640625, 0.2544097900390625, 0.3060302734375, 0.3576507568359375, 0.409271240234375, 0.4608917236328125, 0.51251220703125, 0.5641326904296875, 0.615753173828125, 0.6673736572265625, 0.718994140625, 0.7706146240234375, 0.822235107421875, 0.8738555908203125, 0.92547607421875, 0.9770965576171875, 1.028717041015625, 1.0803375244140625, 1.1319580078125, 1.1835784912109375, 1.235198974609375, 1.2868194580078125, 1.33843994140625, 1.3900604248046875, 1.441680908203125, 1.4933013916015625, 1.544921875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 5.0, 8.0, 11.0, 9.0, 16.0, 31.0, 47.0, 62.0, 100.0, 137.0, 219.0, 298.0, 537.0, 724.0, 1084.0, 1675.0, 2488.0, 3649.0, 5660.0, 8604.0, 13041.0, 20521.0, 31927.0, 51204.0, 86162.0, 179175.0, 1342780.0, 145159.0, 75069.0, 45057.0, 28705.0, 18420.0, 11851.0, 7598.0, 4977.0, 3347.0, 2238.0, 1476.0, 1027.0, 647.0, 426.0, 325.0, 227.0, 131.0, 95.0, 62.0, 46.0, 32.0, 22.0, 7.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.009490966796875, -0.009178519248962402, -0.008866071701049805, -0.008553624153137207, -0.00824117660522461, -0.007928729057312012, -0.007616281509399414, -0.007303833961486816, -0.006991386413574219, -0.006678938865661621, -0.0063664913177490234, -0.006054043769836426, -0.005741596221923828, -0.0054291486740112305, -0.005116701126098633, -0.004804253578186035, -0.0044918060302734375, -0.00417935848236084, -0.003866910934448242, -0.0035544633865356445, -0.003242015838623047, -0.0029295682907104492, -0.0026171207427978516, -0.002304673194885254, -0.0019922256469726562, -0.0016797780990600586, -0.001367330551147461, -0.0010548830032348633, -0.0007424354553222656, -0.00042998790740966797, -0.00011754035949707031, 0.00019490718841552734, 0.000507354736328125, 0.0008198022842407227, 0.0011322498321533203, 0.001444697380065918, 0.0017571449279785156, 0.0020695924758911133, 0.002382040023803711, 0.0026944875717163086, 0.0030069351196289062, 0.003319382667541504, 0.0036318302154541016, 0.003944277763366699, 0.004256725311279297, 0.0045691728591918945, 0.004881620407104492, 0.00519406795501709, 0.0055065155029296875, 0.005818963050842285, 0.006131410598754883, 0.0064438581466674805, 0.006756305694580078, 0.007068753242492676, 0.0073812007904052734, 0.007693648338317871, 0.008006095886230469, 0.008318543434143066, 0.008630990982055664, 0.008943438529968262, 0.00925588607788086, 0.009568333625793457, 0.009880781173706055, 0.010193228721618652, 0.01050567626953125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 931.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 11.0, 4.0, 0.0, 1.0, 20.0, 4.0, 0.0, 1.0, 1.0, 0.0, 47.0, 19.0, 21.0, 304.0, 2163.0, 20974.0, 1001317.0, 23287.0, 151.0, 98.0, 58.0, 26.0, 10.0, 1.0, 1.0, 1.0, 0.0, 11.0, 0.0, 0.0, 5.0, 0.0, 16.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2649765014648438e-06, -2.187676727771759e-06, -2.1103769540786743e-06, -2.0330771803855896e-06, -1.955777406692505e-06, -1.8784776329994202e-06, -1.8011778593063354e-06, -1.7238780856132507e-06, -1.646578311920166e-06, -1.5692785382270813e-06, -1.4919787645339966e-06, -1.4146789908409119e-06, -1.3373792171478271e-06, -1.2600794434547424e-06, -1.1827796697616577e-06, -1.105479896068573e-06, -1.0281801223754883e-06, -9.508803486824036e-07, -8.735805749893188e-07, -7.962808012962341e-07, -7.189810276031494e-07, -6.416812539100647e-07, -5.6438148021698e-07, -4.870817065238953e-07, -4.0978193283081055e-07, -3.3248215913772583e-07, -2.551823854446411e-07, -1.778826117515564e-07, -1.0058283805847168e-07, -2.3283064365386963e-08, 5.4016709327697754e-08, 1.3131648302078247e-07, 2.086162567138672e-07, 2.859160304069519e-07, 3.632158041000366e-07, 4.4051557779312134e-07, 5.178153514862061e-07, 5.951151251792908e-07, 6.724148988723755e-07, 7.497146725654602e-07, 8.270144462585449e-07, 9.043142199516296e-07, 9.816139936447144e-07, 1.058913767337799e-06, 1.1362135410308838e-06, 1.2135133147239685e-06, 1.2908130884170532e-06, 1.368112862110138e-06, 1.4454126358032227e-06, 1.5227124094963074e-06, 1.600012183189392e-06, 1.6773119568824768e-06, 1.7546117305755615e-06, 1.8319115042686462e-06, 1.909211277961731e-06, 1.9865110516548157e-06, 2.0638108253479004e-06, 2.141110599040985e-06, 2.21841037273407e-06, 2.2957101464271545e-06, 2.3730099201202393e-06, 2.450309693813324e-06, 2.5276094675064087e-06, 2.6049092411994934e-06, 2.682209014892578e-06]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 7.0, 6.0, 14.0, 18.0, 20.0, 19.0, 12.0, 21.0, 25.0, 30.0, 24.0, 27.0, 25.0, 40.0, 43.0, 38.0, 54.0, 34.0, 55.0, 38.0, 43.0, 42.0, 46.0, 32.0, 34.0, 36.0, 31.0, 27.0, 15.0, 26.0, 18.0, 15.0, 15.0, 9.0, 14.0, 6.0, 11.0, 9.0, 5.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.568359375, -2.481689453125, -2.39501953125, -2.308349609375, -2.2216796875, -2.135009765625, -2.04833984375, -1.961669921875, -1.875, -1.788330078125, -1.70166015625, -1.614990234375, -1.5283203125, -1.441650390625, -1.35498046875, -1.268310546875, -1.181640625, -1.094970703125, -1.00830078125, -0.921630859375, -0.8349609375, -0.748291015625, -0.66162109375, -0.574951171875, -0.48828125, -0.401611328125, -0.31494140625, -0.228271484375, -0.1416015625, -0.054931640625, 0.03173828125, 0.118408203125, 0.205078125, 0.291748046875, 0.37841796875, 0.465087890625, 0.5517578125, 0.638427734375, 0.72509765625, 0.811767578125, 0.8984375, 0.985107421875, 1.07177734375, 1.158447265625, 1.2451171875, 1.331787109375, 1.41845703125, 1.505126953125, 1.591796875, 1.678466796875, 1.76513671875, 1.851806640625, 1.9384765625, 2.025146484375, 2.11181640625, 2.198486328125, 2.28515625, 2.371826171875, 2.45849609375, 2.545166015625, 2.6318359375, 2.718505859375, 2.80517578125, 2.891845703125, 2.978515625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 8.0, 4.0, 19.0, 21.0, 28.0, 43.0, 67.0, 100.0, 142.0, 179.0, 271.0, 442.0, 661.0, 1022.0, 1445.0, 2268.0, 3553.0, 6085.0, 11404.0, 24282.0, 59980.0, 168454.0, 403906.0, 221807.0, 79166.0, 30564.0, 13773.0, 7207.0, 4191.0, 2528.0, 1666.0, 1050.0, 719.0, 493.0, 332.0, 209.0, 152.0, 93.0, 65.0, 45.0, 32.0, 28.0, 23.0, 8.0, 7.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.154296875, -2.08160400390625, -2.0089111328125, -1.93621826171875, -1.863525390625, -1.79083251953125, -1.7181396484375, -1.64544677734375, -1.57275390625, -1.50006103515625, -1.4273681640625, -1.35467529296875, -1.281982421875, -1.20928955078125, -1.1365966796875, -1.06390380859375, -0.9912109375, -0.91851806640625, -0.8458251953125, -0.77313232421875, -0.700439453125, -0.62774658203125, -0.5550537109375, -0.48236083984375, -0.40966796875, -0.33697509765625, -0.2642822265625, -0.19158935546875, -0.118896484375, -0.04620361328125, 0.0264892578125, 0.09918212890625, 0.171875, 0.24456787109375, 0.3172607421875, 0.38995361328125, 0.462646484375, 0.53533935546875, 0.6080322265625, 0.68072509765625, 0.75341796875, 0.82611083984375, 0.8988037109375, 0.97149658203125, 1.044189453125, 1.11688232421875, 1.1895751953125, 1.26226806640625, 1.3349609375, 1.40765380859375, 1.4803466796875, 1.55303955078125, 1.625732421875, 1.69842529296875, 1.7711181640625, 1.84381103515625, 1.91650390625, 1.98919677734375, 2.0618896484375, 2.13458251953125, 2.207275390625, 2.27996826171875, 2.3526611328125, 2.42535400390625, 2.498046875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 10.0, 11.0, 9.0, 13.0, 21.0, 12.0, 17.0, 29.0, 23.0, 42.0, 32.0, 41.0, 37.0, 42.0, 70.0, 129.0, 352.0, 1559.0, 173.0, 63.0, 62.0, 48.0, 38.0, 39.0, 26.0, 28.0, 20.0, 23.0, 12.0, 10.0, 9.0, 11.0, 10.0, 4.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.921875, -9.593017578125, -9.26416015625, -8.935302734375, -8.6064453125, -8.277587890625, -7.94873046875, -7.619873046875, -7.291015625, -6.962158203125, -6.63330078125, -6.304443359375, -5.9755859375, -5.646728515625, -5.31787109375, -4.989013671875, -4.66015625, -4.331298828125, -4.00244140625, -3.673583984375, -3.3447265625, -3.015869140625, -2.68701171875, -2.358154296875, -2.029296875, -1.700439453125, -1.37158203125, -1.042724609375, -0.7138671875, -0.385009765625, -0.05615234375, 0.272705078125, 0.6015625, 0.930419921875, 1.25927734375, 1.588134765625, 1.9169921875, 2.245849609375, 2.57470703125, 2.903564453125, 3.232421875, 3.561279296875, 3.89013671875, 4.218994140625, 4.5478515625, 4.876708984375, 5.20556640625, 5.534423828125, 5.86328125, 6.192138671875, 6.52099609375, 6.849853515625, 7.1787109375, 7.507568359375, 7.83642578125, 8.165283203125, 8.494140625, 8.822998046875, 9.15185546875, 9.480712890625, 9.8095703125, 10.138427734375, 10.46728515625, 10.796142578125, 11.125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 7.0, 5.0, 7.0, 7.0, 16.0, 12.0, 15.0, 16.0, 20.0, 38.0, 45.0, 64.0, 77.0, 108.0, 183.0, 262.0, 487.0, 1729.0, 25190.0, 3073128.0, 40612.0, 2150.0, 548.0, 279.0, 177.0, 140.0, 112.0, 69.0, 52.0, 23.0, 25.0, 17.0, 27.0, 10.0, 13.0, 13.0, 10.0, 2.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.90625, -20.283203125, -19.66015625, -19.037109375, -18.4140625, -17.791015625, -17.16796875, -16.544921875, -15.921875, -15.298828125, -14.67578125, -14.052734375, -13.4296875, -12.806640625, -12.18359375, -11.560546875, -10.9375, -10.314453125, -9.69140625, -9.068359375, -8.4453125, -7.822265625, -7.19921875, -6.576171875, -5.953125, -5.330078125, -4.70703125, -4.083984375, -3.4609375, -2.837890625, -2.21484375, -1.591796875, -0.96875, -0.345703125, 0.27734375, 0.900390625, 1.5234375, 2.146484375, 2.76953125, 3.392578125, 4.015625, 4.638671875, 5.26171875, 5.884765625, 6.5078125, 7.130859375, 7.75390625, 8.376953125, 9.0, 9.623046875, 10.24609375, 10.869140625, 11.4921875, 12.115234375, 12.73828125, 13.361328125, 13.984375, 14.607421875, 15.23046875, 15.853515625, 16.4765625, 17.099609375, 17.72265625, 18.345703125, 18.96875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 15.0, 53.0, 163.0, 300.0, 271.0, 146.0, 54.0, 12.0, 3.0], "bins": [-49.93052673339844, -49.08224105834961, -48.23395919799805, -47.38567352294922, -46.537391662597656, -45.68910598754883, -44.840824127197266, -43.99253845214844, -43.144256591796875, -42.29597091674805, -41.447689056396484, -40.599403381347656, -39.751121520996094, -38.902835845947266, -38.0545539855957, -37.206268310546875, -36.35798645019531, -35.509700775146484, -34.66141891479492, -33.813133239746094, -32.96485137939453, -32.1165657043457, -31.26828384399414, -30.420000076293945, -29.571714401245117, -28.723430633544922, -27.875146865844727, -27.02686309814453, -26.178579330444336, -25.33029556274414, -24.482011795043945, -23.63372802734375, -22.785446166992188, -21.937162399291992, -21.088878631591797, -20.2405948638916, -19.392311096191406, -18.54402732849121, -17.695743560791016, -16.84745979309082, -15.999174118041992, -15.150890350341797, -14.302606582641602, -13.454322814941406, -12.606039047241211, -11.757755279541016, -10.90947151184082, -10.061187744140625, -9.21290397644043, -8.364620208740234, -7.516336441040039, -6.668052673339844, -5.819768905639648, -4.971484661102295, -4.1232008934021, -3.2749171257019043, -2.426633358001709, -1.5783495903015137, -0.7300657033920288, 0.11821818351745605, 0.9665019512176514, 1.8147859573364258, 2.663069725036621, 3.5113534927368164, 4.359637260437012]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 8.0, 7.0, 6.0, 9.0, 11.0, 6.0, 12.0, 14.0, 15.0, 22.0, 22.0, 24.0, 30.0, 30.0, 18.0, 31.0, 21.0, 35.0, 41.0, 50.0, 39.0, 47.0, 43.0, 34.0, 40.0, 38.0, 41.0, 51.0, 50.0, 27.0, 32.0, 21.0, 17.0, 24.0, 12.0, 16.0, 10.0, 9.0, 8.0, 8.0, 6.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.588218688964844, -21.821998596191406, -21.05577850341797, -20.2895565032959, -19.52333641052246, -18.757116317749023, -17.990896224975586, -17.224674224853516, -16.458454132080078, -15.69223403930664, -14.926012992858887, -14.15979290008545, -13.393571853637695, -12.627351760864258, -11.86113166809082, -11.094910621643066, -10.328690528869629, -9.562470436096191, -8.796249389648438, -8.030029296875, -7.263808250427246, -6.497588157653809, -5.731367588043213, -4.965147018432617, -4.1989264488220215, -3.432705879211426, -2.66648530960083, -1.9002649784088135, -1.1340444087982178, -0.36782383918762207, 0.39839649200439453, 1.1646170616149902, 1.930837631225586, 2.6970582008361816, 3.4632787704467773, 4.229498863220215, 4.995719909667969, 5.761940002441406, 6.528160572052002, 7.294381141662598, 8.060602188110352, 8.826822280883789, 9.593043327331543, 10.35926342010498, 11.125484466552734, 11.891704559326172, 12.65792465209961, 13.424145698547363, 14.1903657913208, 14.956585884094238, 15.722806930541992, 16.48902702331543, 17.255247116088867, 18.021469116210938, 18.787689208984375, 19.553909301757812, 20.32012939453125, 21.086349487304688, 21.852569580078125, 22.618791580200195, 23.385011672973633, 24.15123176574707, 24.917451858520508, 25.683673858642578, 26.449893951416016]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 8.0, 3.0, 4.0, 21.0, 16.0, 12.0, 17.0, 26.0, 17.0, 19.0, 31.0, 25.0, 29.0, 40.0, 34.0, 41.0, 41.0, 51.0, 55.0, 26.0, 53.0, 53.0, 33.0, 41.0, 41.0, 32.0, 27.0, 29.0, 31.0, 17.0, 20.0, 19.0, 19.0, 7.0, 15.0, 11.0, 10.0, 9.0, 7.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.58203125, -2.4912109375, -2.400390625, -2.3095703125, -2.21875, -2.1279296875, -2.037109375, -1.9462890625, -1.85546875, -1.7646484375, -1.673828125, -1.5830078125, -1.4921875, -1.4013671875, -1.310546875, -1.2197265625, -1.12890625, -1.0380859375, -0.947265625, -0.8564453125, -0.765625, -0.6748046875, -0.583984375, -0.4931640625, -0.40234375, -0.3115234375, -0.220703125, -0.1298828125, -0.0390625, 0.0517578125, 0.142578125, 0.2333984375, 0.32421875, 0.4150390625, 0.505859375, 0.5966796875, 0.6875, 0.7783203125, 0.869140625, 0.9599609375, 1.05078125, 1.1416015625, 1.232421875, 1.3232421875, 1.4140625, 1.5048828125, 1.595703125, 1.6865234375, 1.77734375, 1.8681640625, 1.958984375, 2.0498046875, 2.140625, 2.2314453125, 2.322265625, 2.4130859375, 2.50390625, 2.5947265625, 2.685546875, 2.7763671875, 2.8671875, 2.9580078125, 3.048828125, 3.1396484375, 3.23046875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 3.0, 3.0, 10.0, 9.0, 17.0, 26.0, 23.0, 39.0, 45.0, 79.0, 93.0, 128.0, 225.0, 365.0, 749.0, 1821.0, 4851.0, 15661.0, 60400.0, 315908.0, 1685059.0, 1706224.0, 317064.0, 60947.0, 15781.0, 5065.0, 1802.0, 808.0, 361.0, 221.0, 121.0, 92.0, 70.0, 48.0, 45.0, 30.0, 21.0, 20.0, 11.0, 8.0, 8.0, 4.0, 9.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.45703125, -5.275146484375, -5.09326171875, -4.911376953125, -4.7294921875, -4.547607421875, -4.36572265625, -4.183837890625, -4.001953125, -3.820068359375, -3.63818359375, -3.456298828125, -3.2744140625, -3.092529296875, -2.91064453125, -2.728759765625, -2.546875, -2.364990234375, -2.18310546875, -2.001220703125, -1.8193359375, -1.637451171875, -1.45556640625, -1.273681640625, -1.091796875, -0.909912109375, -0.72802734375, -0.546142578125, -0.3642578125, -0.182373046875, -0.00048828125, 0.181396484375, 0.36328125, 0.545166015625, 0.72705078125, 0.908935546875, 1.0908203125, 1.272705078125, 1.45458984375, 1.636474609375, 1.818359375, 2.000244140625, 2.18212890625, 2.364013671875, 2.5458984375, 2.727783203125, 2.90966796875, 3.091552734375, 3.2734375, 3.455322265625, 3.63720703125, 3.819091796875, 4.0009765625, 4.182861328125, 4.36474609375, 4.546630859375, 4.728515625, 4.910400390625, 5.09228515625, 5.274169921875, 5.4560546875, 5.637939453125, 5.81982421875, 6.001708984375, 6.18359375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 7.0, 6.0, 10.0, 11.0, 19.0, 19.0, 25.0, 32.0, 45.0, 56.0, 80.0, 89.0, 92.0, 138.0, 151.0, 158.0, 220.0, 301.0, 311.0, 322.0, 344.0, 312.0, 209.0, 218.0, 168.0, 133.0, 122.0, 88.0, 66.0, 61.0, 45.0, 43.0, 25.0, 28.0, 20.0, 22.0, 17.0, 8.0, 11.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.94921875, -3.820556640625, -3.69189453125, -3.563232421875, -3.4345703125, -3.305908203125, -3.17724609375, -3.048583984375, -2.919921875, -2.791259765625, -2.66259765625, -2.533935546875, -2.4052734375, -2.276611328125, -2.14794921875, -2.019287109375, -1.890625, -1.761962890625, -1.63330078125, -1.504638671875, -1.3759765625, -1.247314453125, -1.11865234375, -0.989990234375, -0.861328125, -0.732666015625, -0.60400390625, -0.475341796875, -0.3466796875, -0.218017578125, -0.08935546875, 0.039306640625, 0.16796875, 0.296630859375, 0.42529296875, 0.553955078125, 0.6826171875, 0.811279296875, 0.93994140625, 1.068603515625, 1.197265625, 1.325927734375, 1.45458984375, 1.583251953125, 1.7119140625, 1.840576171875, 1.96923828125, 2.097900390625, 2.2265625, 2.355224609375, 2.48388671875, 2.612548828125, 2.7412109375, 2.869873046875, 2.99853515625, 3.127197265625, 3.255859375, 3.384521484375, 3.51318359375, 3.641845703125, 3.7705078125, 3.899169921875, 4.02783203125, 4.156494140625, 4.28515625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 2.0, 5.0, 8.0, 13.0, 12.0, 18.0, 15.0, 22.0, 32.0, 29.0, 57.0, 61.0, 81.0, 85.0, 137.0, 162.0, 221.0, 261.0, 459.0, 1990.0, 45640.0, 2631462.0, 1484296.0, 26174.0, 1508.0, 371.0, 245.0, 183.0, 160.0, 122.0, 112.0, 101.0, 47.0, 39.0, 34.0, 23.0, 26.0, 10.0, 12.0, 6.0, 11.0, 10.0, 3.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-20.671875, -20.0625, -19.453125, -18.84375, -18.234375, -17.625, -17.015625, -16.40625, -15.796875, -15.1875, -14.578125, -13.96875, -13.359375, -12.75, -12.140625, -11.53125, -10.921875, -10.3125, -9.703125, -9.09375, -8.484375, -7.875, -7.265625, -6.65625, -6.046875, -5.4375, -4.828125, -4.21875, -3.609375, -3.0, -2.390625, -1.78125, -1.171875, -0.5625, 0.046875, 0.65625, 1.265625, 1.875, 2.484375, 3.09375, 3.703125, 4.3125, 4.921875, 5.53125, 6.140625, 6.75, 7.359375, 7.96875, 8.578125, 9.1875, 9.796875, 10.40625, 11.015625, 11.625, 12.234375, 12.84375, 13.453125, 14.0625, 14.671875, 15.28125, 15.890625, 16.5, 17.109375, 17.71875, 18.328125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 11.0, 22.0, 56.0, 118.0, 188.0, 249.0, 182.0, 105.0, 55.0, 21.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.02879333496094, -81.19861602783203, -79.36843872070312, -77.53826141357422, -75.70808410644531, -73.8779067993164, -72.0477294921875, -70.21754455566406, -68.38737487792969, -66.55719757080078, -64.72702026367188, -62.89684295654297, -61.06666564941406, -59.236488342285156, -57.406307220458984, -55.57612991333008, -53.745948791503906, -51.915771484375, -50.085594177246094, -48.25541687011719, -46.42523956298828, -44.595062255859375, -42.7648811340332, -40.9347038269043, -39.10452651977539, -37.274349212646484, -35.44417190551758, -33.61399459838867, -31.783815383911133, -29.953638076782227, -28.123458862304688, -26.29328155517578, -24.46310043334961, -22.632923126220703, -20.802745819091797, -18.972566604614258, -17.14238929748535, -15.312211990356445, -13.482033729553223, -11.65185546875, -9.821678161621094, -7.991500377655029, -6.161322593688965, -4.3311448097229, -2.500967025756836, -0.6707897186279297, 1.159388542175293, 2.9895668029785156, 4.819744110107422, 6.649921894073486, 8.48009967803955, 10.310277938842773, 12.14045524597168, 13.970632553100586, 15.800810813903809, 17.63098907470703, 19.461166381835938, 21.291343688964844, 23.12152099609375, 24.95170021057129, 26.781877517700195, 28.6120548248291, 30.44223403930664, 32.27241134643555, 34.10258865356445]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 9.0, 7.0, 8.0, 7.0, 10.0, 10.0, 10.0, 11.0, 22.0, 33.0, 27.0, 26.0, 27.0, 22.0, 26.0, 33.0, 48.0, 40.0, 34.0, 42.0, 34.0, 39.0, 34.0, 43.0, 37.0, 29.0, 42.0, 34.0, 22.0, 32.0, 27.0, 23.0, 28.0, 13.0, 17.0, 15.0, 10.0, 13.0, 7.0, 8.0, 9.0, 5.0, 4.0, 5.0, 5.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.77703857421875, -16.23661994934082, -15.69620132446289, -15.155782699584961, -14.615364074707031, -14.074945449829102, -13.534526824951172, -12.994108200073242, -12.453689575195312, -11.913270950317383, -11.372852325439453, -10.832433700561523, -10.292015075683594, -9.751596450805664, -9.211177825927734, -8.670759201049805, -8.130340576171875, -7.589921951293945, -7.049503326416016, -6.509084701538086, -5.968666076660156, -5.428247451782227, -4.887828826904297, -4.347410202026367, -3.8069915771484375, -3.266572952270508, -2.726154327392578, -2.1857357025146484, -1.6453170776367188, -1.104898452758789, -0.5644798278808594, -0.024061203002929688, 0.516357421875, 1.0567760467529297, 1.5971946716308594, 2.137613296508789, 2.6780319213867188, 3.2184505462646484, 3.758869171142578, 4.299287796020508, 4.8397064208984375, 5.380125045776367, 5.920543670654297, 6.460962295532227, 7.001380920410156, 7.541799545288086, 8.082218170166016, 8.622636795043945, 9.163055419921875, 9.703474044799805, 10.243892669677734, 10.784311294555664, 11.324729919433594, 11.865148544311523, 12.405567169189453, 12.945985794067383, 13.486404418945312, 14.026823043823242, 14.567241668701172, 15.107660293579102, 15.648078918457031, 16.18849754333496, 16.72891616821289, 17.26933479309082, 17.80975341796875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 6.0, 6.0, 6.0, 7.0, 5.0, 14.0, 18.0, 11.0, 14.0, 30.0, 40.0, 26.0, 36.0, 30.0, 35.0, 34.0, 32.0, 38.0, 52.0, 44.0, 56.0, 44.0, 39.0, 46.0, 34.0, 33.0, 34.0, 25.0, 20.0, 27.0, 26.0, 17.0, 16.0, 20.0, 8.0, 11.0, 12.0, 13.0, 4.0, 6.0, 8.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.75390625, -2.66571044921875, -2.5775146484375, -2.48931884765625, -2.401123046875, -2.31292724609375, -2.2247314453125, -2.13653564453125, -2.04833984375, -1.96014404296875, -1.8719482421875, -1.78375244140625, -1.695556640625, -1.60736083984375, -1.5191650390625, -1.43096923828125, -1.3427734375, -1.25457763671875, -1.1663818359375, -1.07818603515625, -0.989990234375, -0.90179443359375, -0.8135986328125, -0.72540283203125, -0.63720703125, -0.54901123046875, -0.4608154296875, -0.37261962890625, -0.284423828125, -0.19622802734375, -0.1080322265625, -0.01983642578125, 0.068359375, 0.15655517578125, 0.2447509765625, 0.33294677734375, 0.421142578125, 0.50933837890625, 0.5975341796875, 0.68572998046875, 0.77392578125, 0.86212158203125, 0.9503173828125, 1.03851318359375, 1.126708984375, 1.21490478515625, 1.3031005859375, 1.39129638671875, 1.4794921875, 1.56768798828125, 1.6558837890625, 1.74407958984375, 1.832275390625, 1.92047119140625, 2.0086669921875, 2.09686279296875, 2.18505859375, 2.27325439453125, 2.3614501953125, 2.44964599609375, 2.537841796875, 2.62603759765625, 2.7142333984375, 2.80242919921875, 2.890625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 6.0, 12.0, 12.0, 18.0, 42.0, 56.0, 79.0, 122.0, 176.0, 282.0, 431.0, 581.0, 876.0, 1344.0, 2039.0, 2975.0, 4507.0, 6917.0, 10704.0, 16764.0, 26411.0, 42110.0, 70216.0, 135766.0, 322124.0, 184042.0, 84473.0, 49321.0, 30772.0, 19492.0, 12337.0, 7922.0, 5230.0, 3476.0, 2248.0, 1548.0, 1058.0, 680.0, 459.0, 338.0, 192.0, 139.0, 89.0, 62.0, 31.0, 29.0, 22.0, 13.0, 7.0, 4.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01522064208984375, -0.014754652976989746, -0.014288663864135742, -0.013822674751281738, -0.013356685638427734, -0.01289069652557373, -0.012424707412719727, -0.011958718299865723, -0.011492729187011719, -0.011026740074157715, -0.010560750961303711, -0.010094761848449707, -0.009628772735595703, -0.0091627836227417, -0.008696794509887695, -0.008230805397033691, -0.0077648162841796875, -0.007298827171325684, -0.00683283805847168, -0.006366848945617676, -0.005900859832763672, -0.005434870719909668, -0.004968881607055664, -0.00450289249420166, -0.004036903381347656, -0.0035709142684936523, -0.0031049251556396484, -0.0026389360427856445, -0.0021729469299316406, -0.0017069578170776367, -0.0012409687042236328, -0.0007749795913696289, -0.000308990478515625, 0.0001569986343383789, 0.0006229877471923828, 0.0010889768600463867, 0.0015549659729003906, 0.0020209550857543945, 0.0024869441986083984, 0.0029529333114624023, 0.0034189224243164062, 0.00388491153717041, 0.004350900650024414, 0.004816889762878418, 0.005282878875732422, 0.005748867988586426, 0.00621485710144043, 0.006680846214294434, 0.0071468353271484375, 0.007612824440002441, 0.008078813552856445, 0.00854480266571045, 0.009010791778564453, 0.009476780891418457, 0.009942770004272461, 0.010408759117126465, 0.010874748229980469, 0.011340737342834473, 0.011806726455688477, 0.01227271556854248, 0.012738704681396484, 0.013204693794250488, 0.013670682907104492, 0.014136672019958496, 0.0146026611328125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 5.0, 3.0, 5.0, 9.0, 11.0, 8.0, 20.0, 11.0, 24.0, 23.0, 24.0, 37.0, 30.0, 37.0, 34.0, 34.0, 41.0, 40.0, 47.0, 45.0, 1068.0, 37.0, 46.0, 36.0, 44.0, 35.0, 28.0, 30.0, 42.0, 33.0, 23.0, 19.0, 20.0, 20.0, 14.0, 11.0, 11.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.21875, -2.15606689453125, -2.0933837890625, -2.03070068359375, -1.968017578125, -1.90533447265625, -1.8426513671875, -1.77996826171875, -1.71728515625, -1.65460205078125, -1.5919189453125, -1.52923583984375, -1.466552734375, -1.40386962890625, -1.3411865234375, -1.27850341796875, -1.2158203125, -1.15313720703125, -1.0904541015625, -1.02777099609375, -0.965087890625, -0.90240478515625, -0.8397216796875, -0.77703857421875, -0.71435546875, -0.65167236328125, -0.5889892578125, -0.52630615234375, -0.463623046875, -0.40093994140625, -0.3382568359375, -0.27557373046875, -0.212890625, -0.15020751953125, -0.0875244140625, -0.02484130859375, 0.037841796875, 0.10052490234375, 0.1632080078125, 0.22589111328125, 0.28857421875, 0.35125732421875, 0.4139404296875, 0.47662353515625, 0.539306640625, 0.60198974609375, 0.6646728515625, 0.72735595703125, 0.7900390625, 0.85272216796875, 0.9154052734375, 0.97808837890625, 1.040771484375, 1.10345458984375, 1.1661376953125, 1.22882080078125, 1.29150390625, 1.35418701171875, 1.4168701171875, 1.47955322265625, 1.542236328125, 1.60491943359375, 1.6676025390625, 1.73028564453125, 1.79296875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 6.0, 9.0, 7.0, 6.0, 21.0, 23.0, 26.0, 49.0, 94.0, 111.0, 174.0, 243.0, 436.0, 637.0, 1105.0, 1766.0, 2642.0, 4671.0, 7694.0, 13119.0, 22561.0, 39368.0, 69282.0, 134906.0, 1366793.0, 212532.0, 94432.0, 52037.0, 29769.0, 17200.0, 10004.0, 6030.0, 3504.0, 2226.0, 1362.0, 835.0, 525.0, 324.0, 195.0, 157.0, 94.0, 66.0, 32.0, 25.0, 22.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01184844970703125, -0.01145017147064209, -0.01105189323425293, -0.01065361499786377, -0.01025533676147461, -0.00985705852508545, -0.009458780288696289, -0.009060502052307129, -0.008662223815917969, -0.008263945579528809, -0.007865667343139648, -0.007467389106750488, -0.007069110870361328, -0.006670832633972168, -0.006272554397583008, -0.005874276161193848, -0.0054759979248046875, -0.005077719688415527, -0.004679441452026367, -0.004281163215637207, -0.003882884979248047, -0.0034846067428588867, -0.0030863285064697266, -0.0026880502700805664, -0.0022897720336914062, -0.001891493797302246, -0.001493215560913086, -0.0010949373245239258, -0.0006966590881347656, -0.00029838085174560547, 9.989738464355469e-05, 0.0004981756210327148, 0.000896453857421875, 0.0012947320938110352, 0.0016930103302001953, 0.0020912885665893555, 0.0024895668029785156, 0.0028878450393676758, 0.003286123275756836, 0.003684401512145996, 0.004082679748535156, 0.004480957984924316, 0.0048792362213134766, 0.005277514457702637, 0.005675792694091797, 0.006074070930480957, 0.006472349166870117, 0.006870627403259277, 0.0072689056396484375, 0.007667183876037598, 0.008065462112426758, 0.008463740348815918, 0.008862018585205078, 0.009260296821594238, 0.009658575057983398, 0.010056853294372559, 0.010455131530761719, 0.010853409767150879, 0.011251688003540039, 0.0116499662399292, 0.01204824447631836, 0.01244652271270752, 0.01284480094909668, 0.01324307918548584, 0.013641357421875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 927.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.0], "bins": [-1.1920928955078125e-07, -1.1641532182693481e-07, -1.1362135410308838e-07, -1.1082738637924194e-07, -1.0803341865539551e-07, -1.0523945093154907e-07, -1.0244548320770264e-07, -9.96515154838562e-08, -9.685754776000977e-08, -9.406358003616333e-08, -9.12696123123169e-08, -8.847564458847046e-08, -8.568167686462402e-08, -8.288770914077759e-08, -8.009374141693115e-08, -7.729977369308472e-08, -7.450580596923828e-08, -7.171183824539185e-08, -6.891787052154541e-08, -6.612390279769897e-08, -6.332993507385254e-08, -6.05359673500061e-08, -5.774199962615967e-08, -5.494803190231323e-08, -5.21540641784668e-08, -4.936009645462036e-08, -4.6566128730773926e-08, -4.377216100692749e-08, -4.0978193283081055e-08, -3.818422555923462e-08, -3.5390257835388184e-08, -3.259629011154175e-08, -2.9802322387695312e-08, -2.7008354663848877e-08, -2.421438694000244e-08, -2.1420419216156006e-08, -1.862645149230957e-08, -1.5832483768463135e-08, -1.30385160446167e-08, -1.0244548320770264e-08, -7.450580596923828e-09, -4.6566128730773926e-09, -1.862645149230957e-09, 9.313225746154785e-10, 3.725290298461914e-09, 6.51925802230835e-09, 9.313225746154785e-09, 1.210719347000122e-08, 1.4901161193847656e-08, 1.7695128917694092e-08, 2.0489096641540527e-08, 2.3283064365386963e-08, 2.60770320892334e-08, 2.8870999813079834e-08, 3.166496753692627e-08, 3.4458935260772705e-08, 3.725290298461914e-08, 4.0046870708465576e-08, 4.284083843231201e-08, 4.563480615615845e-08, 4.842877388000488e-08, 5.122274160385132e-08, 5.4016709327697754e-08, 5.681067705154419e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [11.0, 0.0, 0.0, 0.0, 1.0, 0.0, 22.0, 0.0, 13.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 22.0, 26.0, 23.0, 23.0, 89.0, 212.0, 2942.0, 0.0, 23400.0, 994937.0, 23486.0, 2909.0, 224.0, 97.0, 13.0, 0.0, 24.0, 24.0, 22.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 12.0, 21.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3113021850585938e-06, -1.259148120880127e-06, -1.2069940567016602e-06, -1.1548399925231934e-06, -1.1026859283447266e-06, -1.0505318641662598e-06, -9.98377799987793e-07, -9.462237358093262e-07, -8.940696716308594e-07, -8.419156074523926e-07, -7.897615432739258e-07, -7.37607479095459e-07, -6.854534149169922e-07, -6.332993507385254e-07, -5.811452865600586e-07, -5.289912223815918e-07, -4.76837158203125e-07, -4.246830940246582e-07, -3.725290298461914e-07, -3.203749656677246e-07, -2.682209014892578e-07, -2.1606683731079102e-07, -1.6391277313232422e-07, -1.1175870895385742e-07, -5.960464477539063e-08, -7.450580596923828e-09, 4.470348358154297e-08, 9.685754776000977e-08, 1.4901161193847656e-07, 2.0116567611694336e-07, 2.5331974029541016e-07, 3.0547380447387695e-07, 3.5762786865234375e-07, 4.0978193283081055e-07, 4.6193599700927734e-07, 5.140900611877441e-07, 5.662441253662109e-07, 6.183981895446777e-07, 6.705522537231445e-07, 7.227063179016113e-07, 7.748603820800781e-07, 8.270144462585449e-07, 8.791685104370117e-07, 9.313225746154785e-07, 9.834766387939453e-07, 1.0356307029724121e-06, 1.087784767150879e-06, 1.1399388313293457e-06, 1.1920928955078125e-06, 1.2442469596862793e-06, 1.296401023864746e-06, 1.3485550880432129e-06, 1.4007091522216797e-06, 1.4528632164001465e-06, 1.5050172805786133e-06, 1.55717134475708e-06, 1.6093254089355469e-06, 1.6614794731140137e-06, 1.7136335372924805e-06, 1.7657876014709473e-06, 1.817941665649414e-06, 1.8700957298278809e-06, 1.9222497940063477e-06, 1.9744038581848145e-06, 2.0265579223632812e-06]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 6.0, 6.0, 6.0, 7.0, 5.0, 14.0, 18.0, 11.0, 14.0, 30.0, 40.0, 26.0, 36.0, 30.0, 35.0, 34.0, 32.0, 38.0, 52.0, 44.0, 56.0, 44.0, 39.0, 46.0, 34.0, 33.0, 34.0, 25.0, 20.0, 27.0, 26.0, 17.0, 16.0, 20.0, 8.0, 11.0, 12.0, 13.0, 4.0, 6.0, 8.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.75390625, -2.66571044921875, -2.5775146484375, -2.48931884765625, -2.401123046875, -2.31292724609375, -2.2247314453125, -2.13653564453125, -2.04833984375, -1.96014404296875, -1.8719482421875, -1.78375244140625, -1.695556640625, -1.60736083984375, -1.5191650390625, -1.43096923828125, -1.3427734375, -1.25457763671875, -1.1663818359375, -1.07818603515625, -0.989990234375, -0.90179443359375, -0.8135986328125, -0.72540283203125, -0.63720703125, -0.54901123046875, -0.4608154296875, -0.37261962890625, -0.284423828125, -0.19622802734375, -0.1080322265625, -0.01983642578125, 0.068359375, 0.15655517578125, 0.2447509765625, 0.33294677734375, 0.421142578125, 0.50933837890625, 0.5975341796875, 0.68572998046875, 0.77392578125, 0.86212158203125, 0.9503173828125, 1.03851318359375, 1.126708984375, 1.21490478515625, 1.3031005859375, 1.39129638671875, 1.4794921875, 1.56768798828125, 1.6558837890625, 1.74407958984375, 1.832275390625, 1.92047119140625, 2.0086669921875, 2.09686279296875, 2.18505859375, 2.27325439453125, 2.3614501953125, 2.44964599609375, 2.537841796875, 2.62603759765625, 2.7142333984375, 2.80242919921875, 2.890625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 7.0, 7.0, 12.0, 24.0, 23.0, 58.0, 74.0, 115.0, 219.0, 307.0, 553.0, 942.0, 1611.0, 2909.0, 4965.0, 8927.0, 17020.0, 34403.0, 83773.0, 320838.0, 396891.0, 96053.0, 37849.0, 18234.0, 9954.0, 5441.0, 3086.0, 1755.0, 938.0, 575.0, 365.0, 217.0, 147.0, 75.0, 57.0, 46.0, 33.0, 19.0, 15.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.90625, -2.81561279296875, -2.7249755859375, -2.63433837890625, -2.543701171875, -2.45306396484375, -2.3624267578125, -2.27178955078125, -2.18115234375, -2.09051513671875, -1.9998779296875, -1.90924072265625, -1.818603515625, -1.72796630859375, -1.6373291015625, -1.54669189453125, -1.4560546875, -1.36541748046875, -1.2747802734375, -1.18414306640625, -1.093505859375, -1.00286865234375, -0.9122314453125, -0.82159423828125, -0.73095703125, -0.64031982421875, -0.5496826171875, -0.45904541015625, -0.368408203125, -0.27777099609375, -0.1871337890625, -0.09649658203125, -0.005859375, 0.08477783203125, 0.1754150390625, 0.26605224609375, 0.356689453125, 0.44732666015625, 0.5379638671875, 0.62860107421875, 0.71923828125, 0.80987548828125, 0.9005126953125, 0.99114990234375, 1.081787109375, 1.17242431640625, 1.2630615234375, 1.35369873046875, 1.4443359375, 1.53497314453125, 1.6256103515625, 1.71624755859375, 1.806884765625, 1.89752197265625, 1.9881591796875, 2.07879638671875, 2.16943359375, 2.26007080078125, 2.3507080078125, 2.44134521484375, 2.531982421875, 2.62261962890625, 2.7132568359375, 2.80389404296875, 2.89453125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 5.0, 5.0, 6.0, 4.0, 11.0, 10.0, 12.0, 19.0, 16.0, 20.0, 21.0, 24.0, 37.0, 41.0, 42.0, 44.0, 55.0, 46.0, 77.0, 171.0, 1653.0, 215.0, 100.0, 58.0, 48.0, 42.0, 40.0, 31.0, 34.0, 20.0, 29.0, 28.0, 9.0, 13.0, 17.0, 10.0, 10.0, 10.0, 11.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.6171875, -10.3006591796875, -9.984130859375, -9.6676025390625, -9.35107421875, -9.0345458984375, -8.718017578125, -8.4014892578125, -8.0849609375, -7.7684326171875, -7.451904296875, -7.1353759765625, -6.81884765625, -6.5023193359375, -6.185791015625, -5.8692626953125, -5.552734375, -5.2362060546875, -4.919677734375, -4.6031494140625, -4.28662109375, -3.9700927734375, -3.653564453125, -3.3370361328125, -3.0205078125, -2.7039794921875, -2.387451171875, -2.0709228515625, -1.75439453125, -1.4378662109375, -1.121337890625, -0.8048095703125, -0.48828125, -0.1717529296875, 0.144775390625, 0.4613037109375, 0.77783203125, 1.0943603515625, 1.410888671875, 1.7274169921875, 2.0439453125, 2.3604736328125, 2.677001953125, 2.9935302734375, 3.31005859375, 3.6265869140625, 3.943115234375, 4.2596435546875, 4.576171875, 4.8927001953125, 5.209228515625, 5.5257568359375, 5.84228515625, 6.1588134765625, 6.475341796875, 6.7918701171875, 7.1083984375, 7.4249267578125, 7.741455078125, 8.0579833984375, 8.37451171875, 8.6910400390625, 9.007568359375, 9.3240966796875, 9.640625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 11.0, 12.0, 14.0, 11.0, 19.0, 16.0, 18.0, 35.0, 43.0, 53.0, 79.0, 86.0, 119.0, 148.0, 233.0, 455.0, 1725.0, 39345.0, 3068999.0, 31416.0, 1505.0, 435.0, 254.0, 146.0, 122.0, 100.0, 84.0, 55.0, 26.0, 35.0, 16.0, 29.0, 13.0, 15.0, 7.0, 5.0, 6.0, 8.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.859375, -21.14208984375, -20.4248046875, -19.70751953125, -18.990234375, -18.27294921875, -17.5556640625, -16.83837890625, -16.12109375, -15.40380859375, -14.6865234375, -13.96923828125, -13.251953125, -12.53466796875, -11.8173828125, -11.10009765625, -10.3828125, -9.66552734375, -8.9482421875, -8.23095703125, -7.513671875, -6.79638671875, -6.0791015625, -5.36181640625, -4.64453125, -3.92724609375, -3.2099609375, -2.49267578125, -1.775390625, -1.05810546875, -0.3408203125, 0.37646484375, 1.09375, 1.81103515625, 2.5283203125, 3.24560546875, 3.962890625, 4.68017578125, 5.3974609375, 6.11474609375, 6.83203125, 7.54931640625, 8.2666015625, 8.98388671875, 9.701171875, 10.41845703125, 11.1357421875, 11.85302734375, 12.5703125, 13.28759765625, 14.0048828125, 14.72216796875, 15.439453125, 16.15673828125, 16.8740234375, 17.59130859375, 18.30859375, 19.02587890625, 19.7431640625, 20.46044921875, 21.177734375, 21.89501953125, 22.6123046875, 23.32958984375, 24.046875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [195.0, 808.0, 15.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.190304756164551, -1.1983695030212402, 2.7935657501220703, 6.785500526428223, 10.777436256408691, 14.76937198638916, 18.761306762695312, 22.75324249267578, 26.74517822265625, 30.73711395263672, 34.72904968261719, 38.720985412597656, 42.712921142578125, 46.704856872558594, 50.6967887878418, 54.688724517822266, 58.680660247802734, 62.6725959777832, 66.6645278930664, 70.65646362304688, 74.64839935302734, 78.64033508300781, 82.63227081298828, 86.62420654296875, 90.61614227294922, 94.60807800292969, 98.60001373291016, 102.59194946289062, 106.5838851928711, 110.57582092285156, 114.5677490234375, 118.5596923828125, 122.55162048339844, 126.5435562133789, 130.53549194335938, 134.5274200439453, 138.5193634033203, 142.51129150390625, 146.50323486328125, 150.4951629638672, 154.4871063232422, 158.47903442382812, 162.47097778320312, 166.46290588378906, 170.45484924316406, 174.44677734375, 178.438720703125, 182.43064880371094, 186.42257690429688, 190.4145050048828, 194.4064483642578, 198.39837646484375, 202.39031982421875, 206.3822479248047, 210.3741912841797, 214.36611938476562, 218.35806274414062, 222.34999084472656, 226.34193420410156, 230.3338623046875, 234.3258056640625, 238.31773376464844, 242.30967712402344, 246.30160522460938, 250.29354858398438]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 5.0, 3.0, 8.0, 7.0, 12.0, 15.0, 12.0, 17.0, 13.0, 22.0, 32.0, 23.0, 25.0, 31.0, 34.0, 46.0, 30.0, 36.0, 32.0, 33.0, 51.0, 37.0, 52.0, 33.0, 31.0, 31.0, 30.0, 36.0, 28.0, 27.0, 26.0, 22.0, 24.0, 17.0, 14.0, 16.0, 13.0, 16.0, 6.0, 4.0, 17.0, 7.0, 3.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-24.78132438659668, -24.04560089111328, -23.309879302978516, -22.574155807495117, -21.83843231201172, -21.10270881652832, -20.366985321044922, -19.631263732910156, -18.895540237426758, -18.15981674194336, -17.424095153808594, -16.688371658325195, -15.952648162841797, -15.216924667358398, -14.481202125549316, -13.745479583740234, -13.009756088256836, -12.274032592773438, -11.538310050964355, -10.802587509155273, -10.066864013671875, -9.331140518188477, -8.595417976379395, -7.859694957733154, -7.123971939086914, -6.388248920440674, -5.652525901794434, -4.916802883148193, -4.181079864501953, -3.445356845855713, -2.7096338272094727, -1.9739108085632324, -1.2381877899169922, -0.502464771270752, 0.23325824737548828, 0.9689812660217285, 1.7047042846679688, 2.440427303314209, 3.176150321960449, 3.9118733406066895, 4.64759635925293, 5.38331937789917, 6.11904239654541, 6.85476541519165, 7.590488433837891, 8.326211929321289, 9.061934471130371, 9.797657012939453, 10.533380508422852, 11.26910400390625, 12.004826545715332, 12.740549087524414, 13.476272583007812, 14.211996078491211, 14.947718620300293, 15.683441162109375, 16.419164657592773, 17.154888153076172, 17.890609741210938, 18.626333236694336, 19.362056732177734, 20.097780227661133, 20.83350372314453, 21.569225311279297, 22.304948806762695]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 5.0, 3.0, 10.0, 10.0, 10.0, 16.0, 17.0, 22.0, 25.0, 24.0, 39.0, 36.0, 20.0, 40.0, 37.0, 48.0, 46.0, 47.0, 40.0, 44.0, 49.0, 50.0, 42.0, 29.0, 32.0, 30.0, 31.0, 25.0, 21.0, 24.0, 19.0, 15.0, 11.0, 11.0, 18.0, 13.0, 7.0, 4.0, 7.0, 5.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.892578125, -2.79925537109375, -2.7059326171875, -2.61260986328125, -2.519287109375, -2.42596435546875, -2.3326416015625, -2.23931884765625, -2.14599609375, -2.05267333984375, -1.9593505859375, -1.86602783203125, -1.772705078125, -1.67938232421875, -1.5860595703125, -1.49273681640625, -1.3994140625, -1.30609130859375, -1.2127685546875, -1.11944580078125, -1.026123046875, -0.93280029296875, -0.8394775390625, -0.74615478515625, -0.65283203125, -0.55950927734375, -0.4661865234375, -0.37286376953125, -0.279541015625, -0.18621826171875, -0.0928955078125, 0.00042724609375, 0.09375, 0.18707275390625, 0.2803955078125, 0.37371826171875, 0.467041015625, 0.56036376953125, 0.6536865234375, 0.74700927734375, 0.84033203125, 0.93365478515625, 1.0269775390625, 1.12030029296875, 1.213623046875, 1.30694580078125, 1.4002685546875, 1.49359130859375, 1.5869140625, 1.68023681640625, 1.7735595703125, 1.86688232421875, 1.960205078125, 2.05352783203125, 2.1468505859375, 2.24017333984375, 2.33349609375, 2.42681884765625, 2.5201416015625, 2.61346435546875, 2.706787109375, 2.80010986328125, 2.8934326171875, 2.98675537109375, 3.080078125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 6.0, 1.0, 8.0, 10.0, 16.0, 18.0, 21.0, 28.0, 35.0, 59.0, 78.0, 121.0, 299.0, 704.0, 1765.0, 5808.0, 24413.0, 139936.0, 1240918.0, 2380134.0, 336585.0, 48048.0, 10392.0, 2907.0, 1006.0, 428.0, 186.0, 100.0, 66.0, 43.0, 31.0, 13.0, 17.0, 17.0, 10.0, 11.0, 6.0, 8.0, 5.0, 2.0, 2.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.015625, -6.78338623046875, -6.5511474609375, -6.31890869140625, -6.086669921875, -5.85443115234375, -5.6221923828125, -5.38995361328125, -5.15771484375, -4.92547607421875, -4.6932373046875, -4.46099853515625, -4.228759765625, -3.99652099609375, -3.7642822265625, -3.53204345703125, -3.2998046875, -3.06756591796875, -2.8353271484375, -2.60308837890625, -2.370849609375, -2.13861083984375, -1.9063720703125, -1.67413330078125, -1.44189453125, -1.20965576171875, -0.9774169921875, -0.74517822265625, -0.512939453125, -0.28070068359375, -0.0484619140625, 0.18377685546875, 0.416015625, 0.64825439453125, 0.8804931640625, 1.11273193359375, 1.344970703125, 1.57720947265625, 1.8094482421875, 2.04168701171875, 2.27392578125, 2.50616455078125, 2.7384033203125, 2.97064208984375, 3.202880859375, 3.43511962890625, 3.6673583984375, 3.89959716796875, 4.1318359375, 4.36407470703125, 4.5963134765625, 4.82855224609375, 5.060791015625, 5.29302978515625, 5.5252685546875, 5.75750732421875, 5.98974609375, 6.22198486328125, 6.4542236328125, 6.68646240234375, 6.918701171875, 7.15093994140625, 7.3831787109375, 7.61541748046875, 7.84765625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 2.0, 9.0, 8.0, 14.0, 18.0, 25.0, 37.0, 36.0, 67.0, 86.0, 106.0, 150.0, 158.0, 254.0, 380.0, 396.0, 488.0, 440.0, 340.0, 238.0, 207.0, 171.0, 118.0, 90.0, 65.0, 45.0, 36.0, 36.0, 16.0, 11.0, 7.0, 2.0, 6.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.54296875, -5.36737060546875, -5.1917724609375, -5.01617431640625, -4.840576171875, -4.66497802734375, -4.4893798828125, -4.31378173828125, -4.13818359375, -3.96258544921875, -3.7869873046875, -3.61138916015625, -3.435791015625, -3.26019287109375, -3.0845947265625, -2.90899658203125, -2.7333984375, -2.55780029296875, -2.3822021484375, -2.20660400390625, -2.031005859375, -1.85540771484375, -1.6798095703125, -1.50421142578125, -1.32861328125, -1.15301513671875, -0.9774169921875, -0.80181884765625, -0.626220703125, -0.45062255859375, -0.2750244140625, -0.09942626953125, 0.076171875, 0.25177001953125, 0.4273681640625, 0.60296630859375, 0.778564453125, 0.95416259765625, 1.1297607421875, 1.30535888671875, 1.48095703125, 1.65655517578125, 1.8321533203125, 2.00775146484375, 2.183349609375, 2.35894775390625, 2.5345458984375, 2.71014404296875, 2.8857421875, 3.06134033203125, 3.2369384765625, 3.41253662109375, 3.588134765625, 3.76373291015625, 3.9393310546875, 4.11492919921875, 4.29052734375, 4.46612548828125, 4.6417236328125, 4.81732177734375, 4.992919921875, 5.16851806640625, 5.3441162109375, 5.51971435546875, 5.6953125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 10.0, 16.0, 9.0, 25.0, 33.0, 28.0, 75.0, 87.0, 122.0, 166.0, 249.0, 309.0, 482.0, 2192.0, 109337.0, 3897362.0, 179165.0, 2906.0, 565.0, 300.0, 248.0, 154.0, 122.0, 90.0, 55.0, 41.0, 32.0, 29.0, 21.0, 11.0, 10.0, 6.0, 5.0, 4.0, 8.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.640625, -23.859619140625, -23.07861328125, -22.297607421875, -21.5166015625, -20.735595703125, -19.95458984375, -19.173583984375, -18.392578125, -17.611572265625, -16.83056640625, -16.049560546875, -15.2685546875, -14.487548828125, -13.70654296875, -12.925537109375, -12.14453125, -11.363525390625, -10.58251953125, -9.801513671875, -9.0205078125, -8.239501953125, -7.45849609375, -6.677490234375, -5.896484375, -5.115478515625, -4.33447265625, -3.553466796875, -2.7724609375, -1.991455078125, -1.21044921875, -0.429443359375, 0.3515625, 1.132568359375, 1.91357421875, 2.694580078125, 3.4755859375, 4.256591796875, 5.03759765625, 5.818603515625, 6.599609375, 7.380615234375, 8.16162109375, 8.942626953125, 9.7236328125, 10.504638671875, 11.28564453125, 12.066650390625, 12.84765625, 13.628662109375, 14.40966796875, 15.190673828125, 15.9716796875, 16.752685546875, 17.53369140625, 18.314697265625, 19.095703125, 19.876708984375, 20.65771484375, 21.438720703125, 22.2197265625, 23.000732421875, 23.78173828125, 24.562744140625, 25.34375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 9.0, 18.0, 49.0, 60.0, 113.0, 172.0, 179.0, 142.0, 109.0, 86.0, 43.0, 17.0, 10.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.216331481933594, -14.920907020568848, -13.625482559204102, -12.330058097839355, -11.03463363647461, -9.739209175109863, -8.443784713745117, -7.148360252380371, -5.852935791015625, -4.557511329650879, -3.262086868286133, -1.9666624069213867, -0.6712379455566406, 0.6241865158081055, 1.9196109771728516, 3.2150354385375977, 4.510459899902344, 5.80588436126709, 7.101308822631836, 8.396733283996582, 9.692157745361328, 10.987582206726074, 12.28300666809082, 13.578431129455566, 14.873855590820312, 16.169281005859375, 17.464704513549805, 18.760128021240234, 20.055553436279297, 21.35097885131836, 22.64640235900879, 23.94182586669922, 25.23725128173828, 26.532676696777344, 27.828100204467773, 29.123523712158203, 30.418949127197266, 31.714374542236328, 33.009796142578125, 34.30522155761719, 35.60064697265625, 36.89607238769531, 38.191497802734375, 39.48691940307617, 40.782344818115234, 42.0777702331543, 43.373191833496094, 44.668617248535156, 45.96404266357422, 47.25946807861328, 48.554893493652344, 49.85031509399414, 51.1457405090332, 52.441165924072266, 53.73658752441406, 55.032012939453125, 56.32743835449219, 57.62286376953125, 58.91828918457031, 60.21371078491211, 61.50913619995117, 62.804561614990234, 64.09998321533203, 65.3954086303711, 66.69083404541016]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 7.0, 9.0, 4.0, 6.0, 8.0, 7.0, 21.0, 18.0, 17.0, 30.0, 26.0, 23.0, 32.0, 37.0, 36.0, 42.0, 58.0, 47.0, 55.0, 42.0, 47.0, 46.0, 49.0, 54.0, 26.0, 32.0, 34.0, 24.0, 13.0, 32.0, 24.0, 20.0, 15.0, 12.0, 12.0, 6.0, 11.0, 7.0, 10.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.41748046875, -18.791841506958008, -18.166202545166016, -17.540563583374023, -16.91492462158203, -16.289287567138672, -15.66364860534668, -15.038009643554688, -14.412370681762695, -13.786731719970703, -13.161092758178711, -12.535454750061035, -11.909815788269043, -11.28417682647705, -10.658538818359375, -10.032899856567383, -9.40726089477539, -8.781621932983398, -8.155982971191406, -7.5303449630737305, -6.904706001281738, -6.279067039489746, -5.653428554534912, -5.027790069580078, -4.402151107788086, -3.776512384414673, -3.1508736610412598, -2.5252349376678467, -1.8995962142944336, -1.2739574909210205, -0.6483187675476074, -0.022680282592773438, 0.6029586791992188, 1.2285974025726318, 1.854236125946045, 2.479874849319458, 3.105513572692871, 3.731152296066284, 4.356791019439697, 4.982429504394531, 5.608068466186523, 6.233707427978516, 6.85934591293335, 7.484984397888184, 8.110623359680176, 8.736262321472168, 9.361900329589844, 9.987539291381836, 10.613178253173828, 11.23881721496582, 11.864456176757812, 12.490094184875488, 13.11573314666748, 13.741372108459473, 14.367010116577148, 14.99264907836914, 15.618288040161133, 16.243927001953125, 16.869565963745117, 17.49520492553711, 18.12084197998047, 18.74648094177246, 19.372119903564453, 19.997758865356445, 20.623397827148438]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 4.0, 11.0, 11.0, 18.0, 20.0, 12.0, 25.0, 25.0, 33.0, 17.0, 22.0, 27.0, 34.0, 37.0, 44.0, 38.0, 55.0, 47.0, 44.0, 33.0, 37.0, 43.0, 32.0, 45.0, 32.0, 31.0, 25.0, 19.0, 23.0, 28.0, 20.0, 19.0, 11.0, 10.0, 9.0, 9.0, 11.0, 7.0, 2.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-2.955078125, -2.86663818359375, -2.7781982421875, -2.68975830078125, -2.601318359375, -2.51287841796875, -2.4244384765625, -2.33599853515625, -2.24755859375, -2.15911865234375, -2.0706787109375, -1.98223876953125, -1.893798828125, -1.80535888671875, -1.7169189453125, -1.62847900390625, -1.5400390625, -1.45159912109375, -1.3631591796875, -1.27471923828125, -1.186279296875, -1.09783935546875, -1.0093994140625, -0.92095947265625, -0.83251953125, -0.74407958984375, -0.6556396484375, -0.56719970703125, -0.478759765625, -0.39031982421875, -0.3018798828125, -0.21343994140625, -0.125, -0.03656005859375, 0.0518798828125, 0.14031982421875, 0.228759765625, 0.31719970703125, 0.4056396484375, 0.49407958984375, 0.58251953125, 0.67095947265625, 0.7593994140625, 0.84783935546875, 0.936279296875, 1.02471923828125, 1.1131591796875, 1.20159912109375, 1.2900390625, 1.37847900390625, 1.4669189453125, 1.55535888671875, 1.643798828125, 1.73223876953125, 1.8206787109375, 1.90911865234375, 1.99755859375, 2.08599853515625, 2.1744384765625, 2.26287841796875, 2.351318359375, 2.43975830078125, 2.5281982421875, 2.61663818359375, 2.705078125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 11.0, 20.0, 22.0, 31.0, 46.0, 62.0, 103.0, 141.0, 194.0, 264.0, 391.0, 559.0, 723.0, 1131.0, 1519.0, 2231.0, 3094.0, 4395.0, 6449.0, 9088.0, 12969.0, 18412.0, 26455.0, 38911.0, 61798.0, 105708.0, 231272.0, 229154.0, 105630.0, 60819.0, 38741.0, 26600.0, 18530.0, 12963.0, 9026.0, 6216.0, 4353.0, 3027.0, 2180.0, 1464.0, 1118.0, 772.0, 567.0, 417.0, 280.0, 209.0, 142.0, 114.0, 78.0, 47.0, 36.0, 30.0, 15.0, 11.0, 8.0, 5.0, 2.0, 2.0], "bins": [-0.0134124755859375, -0.013005971908569336, -0.012599468231201172, -0.012192964553833008, -0.011786460876464844, -0.01137995719909668, -0.010973453521728516, -0.010566949844360352, -0.010160446166992188, -0.009753942489624023, -0.00934743881225586, -0.008940935134887695, -0.008534431457519531, -0.008127927780151367, -0.007721424102783203, -0.007314920425415039, -0.006908416748046875, -0.006501913070678711, -0.006095409393310547, -0.005688905715942383, -0.005282402038574219, -0.004875898361206055, -0.004469394683837891, -0.0040628910064697266, -0.0036563873291015625, -0.0032498836517333984, -0.0028433799743652344, -0.0024368762969970703, -0.0020303726196289062, -0.0016238689422607422, -0.0012173652648925781, -0.0008108615875244141, -0.00040435791015625, 2.1457672119140625e-06, 0.0004086494445800781, 0.0008151531219482422, 0.0012216567993164062, 0.0016281604766845703, 0.0020346641540527344, 0.0024411678314208984, 0.0028476715087890625, 0.0032541751861572266, 0.0036606788635253906, 0.004067182540893555, 0.004473686218261719, 0.004880189895629883, 0.005286693572998047, 0.005693197250366211, 0.006099700927734375, 0.006506204605102539, 0.006912708282470703, 0.007319211959838867, 0.007725715637207031, 0.008132219314575195, 0.00853872299194336, 0.008945226669311523, 0.009351730346679688, 0.009758234024047852, 0.010164737701416016, 0.01057124137878418, 0.010977745056152344, 0.011384248733520508, 0.011790752410888672, 0.012197256088256836, 0.012603759765625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 8.0, 2.0, 6.0, 13.0, 20.0, 25.0, 23.0, 20.0, 25.0, 24.0, 35.0, 38.0, 52.0, 46.0, 42.0, 54.0, 50.0, 53.0, 1066.0, 39.0, 36.0, 41.0, 42.0, 31.0, 38.0, 27.0, 23.0, 27.0, 25.0, 19.0, 20.0, 10.0, 11.0, 12.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.18359375, -2.115631103515625, -2.04766845703125, -1.979705810546875, -1.9117431640625, -1.843780517578125, -1.77581787109375, -1.707855224609375, -1.639892578125, -1.571929931640625, -1.50396728515625, -1.436004638671875, -1.3680419921875, -1.300079345703125, -1.23211669921875, -1.164154052734375, -1.09619140625, -1.028228759765625, -0.96026611328125, -0.892303466796875, -0.8243408203125, -0.756378173828125, -0.68841552734375, -0.620452880859375, -0.552490234375, -0.484527587890625, -0.41656494140625, -0.348602294921875, -0.2806396484375, -0.212677001953125, -0.14471435546875, -0.076751708984375, -0.0087890625, 0.059173583984375, 0.12713623046875, 0.195098876953125, 0.2630615234375, 0.331024169921875, 0.39898681640625, 0.466949462890625, 0.534912109375, 0.602874755859375, 0.67083740234375, 0.738800048828125, 0.8067626953125, 0.874725341796875, 0.94268798828125, 1.010650634765625, 1.07861328125, 1.146575927734375, 1.21453857421875, 1.282501220703125, 1.3504638671875, 1.418426513671875, 1.48638916015625, 1.554351806640625, 1.622314453125, 1.690277099609375, 1.75823974609375, 1.826202392578125, 1.8941650390625, 1.962127685546875, 2.03009033203125, 2.098052978515625, 2.166015625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 9.0, 11.0, 13.0, 22.0, 41.0, 33.0, 70.0, 119.0, 181.0, 263.0, 407.0, 635.0, 1027.0, 1726.0, 2865.0, 4354.0, 7653.0, 12496.0, 21738.0, 37289.0, 67708.0, 134305.0, 1364971.0, 221020.0, 96199.0, 51020.0, 28958.0, 16738.0, 9940.0, 5922.0, 3583.0, 2166.0, 1381.0, 771.0, 498.0, 363.0, 217.0, 150.0, 95.0, 58.0, 40.0, 29.0, 17.0, 9.0, 18.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01311492919921875, -0.012702107429504395, -0.012289285659790039, -0.011876463890075684, -0.011463642120361328, -0.011050820350646973, -0.010637998580932617, -0.010225176811218262, -0.009812355041503906, -0.00939953327178955, -0.008986711502075195, -0.00857388973236084, -0.008161067962646484, -0.007748246192932129, -0.0073354244232177734, -0.006922602653503418, -0.0065097808837890625, -0.006096959114074707, -0.0056841373443603516, -0.005271315574645996, -0.004858493804931641, -0.004445672035217285, -0.00403285026550293, -0.0036200284957885742, -0.0032072067260742188, -0.0027943849563598633, -0.002381563186645508, -0.0019687414169311523, -0.0015559196472167969, -0.0011430978775024414, -0.0007302761077880859, -0.00031745433807373047, 9.5367431640625e-05, 0.0005081892013549805, 0.0009210109710693359, 0.0013338327407836914, 0.0017466545104980469, 0.0021594762802124023, 0.002572298049926758, 0.0029851198196411133, 0.0033979415893554688, 0.0038107633590698242, 0.00422358512878418, 0.004636406898498535, 0.005049228668212891, 0.005462050437927246, 0.0058748722076416016, 0.006287693977355957, 0.0067005157470703125, 0.007113337516784668, 0.0075261592864990234, 0.007938981056213379, 0.008351802825927734, 0.00876462459564209, 0.009177446365356445, 0.0095902681350708, 0.010003089904785156, 0.010415911674499512, 0.010828733444213867, 0.011241555213928223, 0.011654376983642578, 0.012067198753356934, 0.012480020523071289, 0.012892842292785645, 0.0133056640625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 881.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-07, -1.1455267667770386e-07, -1.0989606380462646e-07, -1.0523945093154907e-07, -1.0058283805847168e-07, -9.592622518539429e-08, -9.12696123123169e-08, -8.66129994392395e-08, -8.195638656616211e-08, -7.729977369308472e-08, -7.264316082000732e-08, -6.798654794692993e-08, -6.332993507385254e-08, -5.8673322200775146e-08, -5.4016709327697754e-08, -4.936009645462036e-08, -4.470348358154297e-08, -4.0046870708465576e-08, -3.5390257835388184e-08, -3.073364496231079e-08, -2.60770320892334e-08, -2.1420419216156006e-08, -1.6763806343078613e-08, -1.210719347000122e-08, -7.450580596923828e-09, -2.7939677238464355e-09, 1.862645149230957e-09, 6.51925802230835e-09, 1.1175870895385742e-08, 1.5832483768463135e-08, 2.0489096641540527e-08, 2.514570951461792e-08, 2.9802322387695312e-08, 3.4458935260772705e-08, 3.91155481338501e-08, 4.377216100692749e-08, 4.842877388000488e-08, 5.3085386753082275e-08, 5.774199962615967e-08, 6.239861249923706e-08, 6.705522537231445e-08, 7.171183824539185e-08, 7.636845111846924e-08, 8.102506399154663e-08, 8.568167686462402e-08, 9.033828973770142e-08, 9.499490261077881e-08, 9.96515154838562e-08, 1.043081283569336e-07, 1.0896474123001099e-07, 1.1362135410308838e-07, 1.1827796697616577e-07, 1.2293457984924316e-07, 1.2759119272232056e-07, 1.3224780559539795e-07, 1.3690441846847534e-07, 1.4156103134155273e-07, 1.4621764421463013e-07, 1.5087425708770752e-07, 1.555308699607849e-07, 1.601874828338623e-07, 1.648440957069397e-07, 1.695007085800171e-07, 1.7415732145309448e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 13.0, 2.0, 24.0, 17.0, 2.0, 0.0, 2.0, 6.0, 67.0, 51.0, 157.0, 3992.0, 32987.0, 1006890.0, 3978.0, 138.0, 72.0, 76.0, 3.0, 4.0, 1.0, 0.0, 11.0, 31.0, 1.0, 19.0, 12.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.993511199951172e-06, -3.893859684467316e-06, -3.7942081689834595e-06, -3.6945566534996033e-06, -3.594905138015747e-06, -3.495253622531891e-06, -3.3956021070480347e-06, -3.2959505915641785e-06, -3.1962990760803223e-06, -3.096647560596466e-06, -2.99699604511261e-06, -2.8973445296287537e-06, -2.7976930141448975e-06, -2.6980414986610413e-06, -2.598389983177185e-06, -2.498738467693329e-06, -2.3990869522094727e-06, -2.2994354367256165e-06, -2.1997839212417603e-06, -2.100132405757904e-06, -2.000480890274048e-06, -1.9008293747901917e-06, -1.8011778593063354e-06, -1.7015263438224792e-06, -1.601874828338623e-06, -1.5022233128547668e-06, -1.4025717973709106e-06, -1.3029202818870544e-06, -1.2032687664031982e-06, -1.103617250919342e-06, -1.0039657354354858e-06, -9.043142199516296e-07, -8.046627044677734e-07, -7.050111889839172e-07, -6.05359673500061e-07, -5.057081580162048e-07, -4.0605664253234863e-07, -3.0640512704849243e-07, -2.0675361156463623e-07, -1.0710209608078003e-07, -7.450580596923828e-09, 9.220093488693237e-08, 1.9185245037078857e-07, 2.915039658546448e-07, 3.91155481338501e-07, 4.908069968223572e-07, 5.904585123062134e-07, 6.901100277900696e-07, 7.897615432739258e-07, 8.89413058757782e-07, 9.890645742416382e-07, 1.0887160897254944e-06, 1.1883676052093506e-06, 1.2880191206932068e-06, 1.387670636177063e-06, 1.4873221516609192e-06, 1.5869736671447754e-06, 1.6866251826286316e-06, 1.7862766981124878e-06, 1.885928213596344e-06, 1.9855797290802e-06, 2.0852312445640564e-06, 2.1848827600479126e-06, 2.284534275531769e-06, 2.384185791015625e-06]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1022.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 9.063336747772155e-10, 1.812667349554431e-09, 2.7190010243316465e-09, 3.625334699108862e-09, 4.5316683738860775e-09, 5.438002048663293e-09, 6.3443357234405084e-09, 7.250669398217724e-09, 8.15700307299494e-09, 9.063336747772155e-09, 9.96967042254937e-09, 1.0876004097326586e-08, 1.1782337772103801e-08, 1.2688671446881017e-08, 1.3595005121658232e-08, 1.4501338796435448e-08, 1.5407671583034244e-08, 1.631400614598988e-08, 1.7220340708945514e-08, 1.812667349554431e-08, 1.9033006282143106e-08, 1.993934084509874e-08, 2.0845675408054376e-08, 2.1752008194653172e-08, 2.2658340981251968e-08, 2.3564675544207603e-08, 2.4471010107163238e-08, 2.5377342893762034e-08, 2.628367568036083e-08, 2.7190010243316465e-08, 2.80963448062721e-08, 2.9002677592870896e-08, 2.990901037946969e-08, 3.081534316606849e-08, 3.172167950538096e-08, 3.262801229197976e-08, 3.3534345078578554e-08, 3.444068141789103e-08, 3.5347014204489824e-08, 3.625334699108862e-08, 3.7159679777687415e-08, 3.806601256428621e-08, 3.8972348903598686e-08, 3.987868169019748e-08, 4.078501447679628e-08, 4.169135081610875e-08, 4.259768360270755e-08, 4.3504016389306344e-08, 4.441034917590514e-08, 4.5316681962503935e-08, 4.622301830181641e-08, 4.7129351088415206e-08, 4.8035683875014e-08, 4.8942020214326476e-08, 4.984835300092527e-08, 5.075468578752407e-08, 5.1661018574122863e-08, 5.256735136072166e-08, 5.3473687700034134e-08, 5.438002048663293e-08, 5.5286353273231725e-08, 5.61926896125442e-08, 5.7099022399142996e-08, 5.800535518574179e-08]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1022.0], "bins": [-5.960464477539063e-08, -5.8673322200775146e-08, -5.774199962615967e-08, -5.681067705154419e-08, -5.587935447692871e-08, -5.494803190231323e-08, -5.4016709327697754e-08, -5.3085386753082275e-08, -5.21540641784668e-08, -5.122274160385132e-08, -5.029141902923584e-08, -4.936009645462036e-08, -4.842877388000488e-08, -4.7497451305389404e-08, -4.6566128730773926e-08, -4.563480615615845e-08, -4.470348358154297e-08, -4.377216100692749e-08, -4.284083843231201e-08, -4.190951585769653e-08, -4.0978193283081055e-08, -4.0046870708465576e-08, -3.91155481338501e-08, -3.818422555923462e-08, -3.725290298461914e-08, -3.632158041000366e-08, -3.5390257835388184e-08, -3.4458935260772705e-08, -3.3527612686157227e-08, -3.259629011154175e-08, -3.166496753692627e-08, -3.073364496231079e-08, -2.9802322387695312e-08, -2.8870999813079834e-08, -2.7939677238464355e-08, -2.7008354663848877e-08, -2.60770320892334e-08, -2.514570951461792e-08, -2.421438694000244e-08, -2.3283064365386963e-08, -2.2351741790771484e-08, -2.1420419216156006e-08, -2.0489096641540527e-08, -1.955777406692505e-08, -1.862645149230957e-08, -1.7695128917694092e-08, -1.6763806343078613e-08, -1.5832483768463135e-08, -1.4901161193847656e-08, -1.3969838619232178e-08, -1.30385160446167e-08, -1.210719347000122e-08, -1.1175870895385742e-08, -1.0244548320770264e-08, -9.313225746154785e-09, -8.381903171539307e-09, -7.450580596923828e-09, -6.51925802230835e-09, -5.587935447692871e-09, -4.6566128730773926e-09, -3.725290298461914e-09, -2.7939677238464355e-09, -1.862645149230957e-09, -9.313225746154785e-10, 0.0]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 4.0, 11.0, 11.0, 18.0, 20.0, 12.0, 25.0, 25.0, 33.0, 17.0, 22.0, 27.0, 34.0, 37.0, 44.0, 38.0, 55.0, 47.0, 44.0, 33.0, 37.0, 43.0, 32.0, 45.0, 32.0, 31.0, 25.0, 19.0, 23.0, 28.0, 20.0, 19.0, 11.0, 10.0, 9.0, 9.0, 11.0, 7.0, 2.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-2.955078125, -2.86663818359375, -2.7781982421875, -2.68975830078125, -2.601318359375, -2.51287841796875, -2.4244384765625, -2.33599853515625, -2.24755859375, -2.15911865234375, -2.0706787109375, -1.98223876953125, -1.893798828125, -1.80535888671875, -1.7169189453125, -1.62847900390625, -1.5400390625, -1.45159912109375, -1.3631591796875, -1.27471923828125, -1.186279296875, -1.09783935546875, -1.0093994140625, -0.92095947265625, -0.83251953125, -0.74407958984375, -0.6556396484375, -0.56719970703125, -0.478759765625, -0.39031982421875, -0.3018798828125, -0.21343994140625, -0.125, -0.03656005859375, 0.0518798828125, 0.14031982421875, 0.228759765625, 0.31719970703125, 0.4056396484375, 0.49407958984375, 0.58251953125, 0.67095947265625, 0.7593994140625, 0.84783935546875, 0.936279296875, 1.02471923828125, 1.1131591796875, 1.20159912109375, 1.2900390625, 1.37847900390625, 1.4669189453125, 1.55535888671875, 1.643798828125, 1.73223876953125, 1.8206787109375, 1.90911865234375, 1.99755859375, 2.08599853515625, 2.1744384765625, 2.26287841796875, 2.351318359375, 2.43975830078125, 2.5281982421875, 2.61663818359375, 2.705078125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 6.0, 8.0, 4.0, 8.0, 11.0, 15.0, 24.0, 27.0, 38.0, 75.0, 112.0, 165.0, 286.0, 486.0, 757.0, 1297.0, 2229.0, 3887.0, 6853.0, 11985.0, 21515.0, 40704.0, 85746.0, 237032.0, 395872.0, 122653.0, 53959.0, 27429.0, 15174.0, 8462.0, 4966.0, 2741.0, 1555.0, 961.0, 553.0, 334.0, 186.0, 148.0, 99.0, 57.0, 44.0, 19.0, 18.0, 26.0, 13.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.814453125, -2.7242431640625, -2.634033203125, -2.5438232421875, -2.45361328125, -2.3634033203125, -2.273193359375, -2.1829833984375, -2.0927734375, -2.0025634765625, -1.912353515625, -1.8221435546875, -1.73193359375, -1.6417236328125, -1.551513671875, -1.4613037109375, -1.37109375, -1.2808837890625, -1.190673828125, -1.1004638671875, -1.01025390625, -0.9200439453125, -0.829833984375, -0.7396240234375, -0.6494140625, -0.5592041015625, -0.468994140625, -0.3787841796875, -0.28857421875, -0.1983642578125, -0.108154296875, -0.0179443359375, 0.072265625, 0.1624755859375, 0.252685546875, 0.3428955078125, 0.43310546875, 0.5233154296875, 0.613525390625, 0.7037353515625, 0.7939453125, 0.8841552734375, 0.974365234375, 1.0645751953125, 1.15478515625, 1.2449951171875, 1.335205078125, 1.4254150390625, 1.515625, 1.6058349609375, 1.696044921875, 1.7862548828125, 1.87646484375, 1.9666748046875, 2.056884765625, 2.1470947265625, 2.2373046875, 2.3275146484375, 2.417724609375, 2.5079345703125, 2.59814453125, 2.6883544921875, 2.778564453125, 2.8687744140625, 2.958984375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 9.0, 3.0, 7.0, 10.0, 14.0, 8.0, 10.0, 17.0, 16.0, 17.0, 38.0, 17.0, 31.0, 53.0, 46.0, 52.0, 64.0, 89.0, 214.0, 1598.0, 209.0, 85.0, 59.0, 49.0, 50.0, 51.0, 39.0, 36.0, 19.0, 31.0, 21.0, 14.0, 11.0, 23.0, 8.0, 13.0, 8.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1796875, -8.8885498046875, -8.597412109375, -8.3062744140625, -8.01513671875, -7.7239990234375, -7.432861328125, -7.1417236328125, -6.8505859375, -6.5594482421875, -6.268310546875, -5.9771728515625, -5.68603515625, -5.3948974609375, -5.103759765625, -4.8126220703125, -4.521484375, -4.2303466796875, -3.939208984375, -3.6480712890625, -3.35693359375, -3.0657958984375, -2.774658203125, -2.4835205078125, -2.1923828125, -1.9012451171875, -1.610107421875, -1.3189697265625, -1.02783203125, -0.7366943359375, -0.445556640625, -0.1544189453125, 0.13671875, 0.4278564453125, 0.718994140625, 1.0101318359375, 1.30126953125, 1.5924072265625, 1.883544921875, 2.1746826171875, 2.4658203125, 2.7569580078125, 3.048095703125, 3.3392333984375, 3.63037109375, 3.9215087890625, 4.212646484375, 4.5037841796875, 4.794921875, 5.0860595703125, 5.377197265625, 5.6683349609375, 5.95947265625, 6.2506103515625, 6.541748046875, 6.8328857421875, 7.1240234375, 7.4151611328125, 7.706298828125, 7.9974365234375, 8.28857421875, 8.5797119140625, 8.870849609375, 9.1619873046875, 9.453125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 6.0, 7.0, 6.0, 10.0, 13.0, 17.0, 25.0, 22.0, 30.0, 50.0, 61.0, 63.0, 99.0, 146.0, 182.0, 272.0, 452.0, 1532.0, 15282.0, 960764.0, 2142126.0, 21138.0, 1901.0, 463.0, 281.0, 195.0, 129.0, 98.0, 66.0, 58.0, 40.0, 34.0, 24.0, 20.0, 15.0, 19.0, 15.0, 8.0, 6.0, 7.0, 8.0, 3.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.78125, -16.2735595703125, -15.765869140625, -15.2581787109375, -14.75048828125, -14.2427978515625, -13.735107421875, -13.2274169921875, -12.7197265625, -12.2120361328125, -11.704345703125, -11.1966552734375, -10.68896484375, -10.1812744140625, -9.673583984375, -9.1658935546875, -8.658203125, -8.1505126953125, -7.642822265625, -7.1351318359375, -6.62744140625, -6.1197509765625, -5.612060546875, -5.1043701171875, -4.5966796875, -4.0889892578125, -3.581298828125, -3.0736083984375, -2.56591796875, -2.0582275390625, -1.550537109375, -1.0428466796875, -0.53515625, -0.0274658203125, 0.480224609375, 0.9879150390625, 1.49560546875, 2.0032958984375, 2.510986328125, 3.0186767578125, 3.5263671875, 4.0340576171875, 4.541748046875, 5.0494384765625, 5.55712890625, 6.0648193359375, 6.572509765625, 7.0802001953125, 7.587890625, 8.0955810546875, 8.603271484375, 9.1109619140625, 9.61865234375, 10.1263427734375, 10.634033203125, 11.1417236328125, 11.6494140625, 12.1571044921875, 12.664794921875, 13.1724853515625, 13.68017578125, 14.1878662109375, 14.695556640625, 15.2032470703125, 15.7109375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 60.0, 284.0, 454.0, 193.0, 17.0, 2.0, 1.0], "bins": [-98.02595520019531, -96.37340545654297, -94.7208480834961, -93.06829833984375, -91.4157485961914, -89.76319885253906, -88.11064147949219, -86.45809173583984, -84.8055419921875, -83.15299224853516, -81.50043487548828, -79.84788513183594, -78.1953353881836, -76.54278564453125, -74.89022827148438, -73.23767852783203, -71.58512115478516, -69.93257141113281, -68.28001403808594, -66.6274642944336, -64.97491455078125, -63.32236099243164, -61.66980743408203, -60.01725769042969, -58.36470413208008, -56.71215057373047, -55.059600830078125, -53.407047271728516, -51.754493713378906, -50.10194396972656, -48.44939041137695, -46.796836853027344, -45.144290924072266, -43.491737365722656, -41.83918762207031, -40.1866340637207, -38.534080505371094, -36.88153076171875, -35.22897720336914, -33.57642364501953, -31.923873901367188, -30.27132225036621, -28.618770599365234, -26.966217041015625, -25.31366539001465, -23.661113739013672, -22.008560180664062, -20.356008529663086, -18.70345687866211, -17.050905227661133, -15.39835262298584, -13.745800018310547, -12.09324836730957, -10.440696716308594, -8.7881441116333, -7.135591506958008, -5.483038902282715, -3.83048677444458, -2.1779346466064453, -0.5253825187683105, 1.1271696090698242, 2.779721260070801, 4.432273864746094, 6.084826469421387, 7.737378120422363]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 8.0, 4.0, 8.0, 10.0, 6.0, 9.0, 16.0, 17.0, 17.0, 18.0, 27.0, 19.0, 32.0, 40.0, 31.0, 40.0, 31.0, 37.0, 43.0, 49.0, 44.0, 51.0, 38.0, 39.0, 41.0, 46.0, 33.0, 32.0, 34.0, 31.0, 25.0, 27.0, 18.0, 18.0, 13.0, 12.0, 7.0, 8.0, 7.0, 8.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.095500946044922, -20.347705841064453, -19.59990882873535, -18.85211181640625, -18.10431671142578, -17.356521606445312, -16.60872459411621, -15.860928535461426, -15.11313247680664, -14.365336418151855, -13.61754035949707, -12.869744300842285, -12.1219482421875, -11.374152183532715, -10.62635612487793, -9.878560066223145, -9.13076400756836, -8.382967948913574, -7.635171890258789, -6.887375831604004, -6.139579772949219, -5.391783714294434, -4.643987655639648, -3.8961915969848633, -3.148395538330078, -2.400599479675293, -1.6528034210205078, -0.9050073623657227, -0.1572113037109375, 0.5905847549438477, 1.3383808135986328, 2.086176872253418, 2.833972930908203, 3.5817689895629883, 4.329565048217773, 5.077361106872559, 5.825157165527344, 6.572953224182129, 7.320749282836914, 8.0685453414917, 8.816341400146484, 9.56413745880127, 10.311933517456055, 11.05972957611084, 11.807525634765625, 12.55532169342041, 13.303117752075195, 14.05091381072998, 14.798709869384766, 15.54650592803955, 16.294301986694336, 17.042098999023438, 17.789894104003906, 18.537689208984375, 19.285486221313477, 20.033283233642578, 20.781078338623047, 21.528873443603516, 22.276670455932617, 23.02446746826172, 23.772262573242188, 24.520057678222656, 25.267854690551758, 26.01565170288086, 26.763446807861328]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 8.0, 14.0, 18.0, 18.0, 16.0, 23.0, 19.0, 25.0, 27.0, 28.0, 40.0, 41.0, 40.0, 45.0, 36.0, 50.0, 40.0, 48.0, 41.0, 41.0, 38.0, 37.0, 36.0, 39.0, 28.0, 26.0, 26.0, 30.0, 17.0, 19.0, 20.0, 10.0, 6.0, 8.0, 8.0, 12.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.19140625, -3.09185791015625, -2.9923095703125, -2.89276123046875, -2.793212890625, -2.69366455078125, -2.5941162109375, -2.49456787109375, -2.39501953125, -2.29547119140625, -2.1959228515625, -2.09637451171875, -1.996826171875, -1.89727783203125, -1.7977294921875, -1.69818115234375, -1.5986328125, -1.49908447265625, -1.3995361328125, -1.29998779296875, -1.200439453125, -1.10089111328125, -1.0013427734375, -0.90179443359375, -0.80224609375, -0.70269775390625, -0.6031494140625, -0.50360107421875, -0.404052734375, -0.30450439453125, -0.2049560546875, -0.10540771484375, -0.005859375, 0.09368896484375, 0.1932373046875, 0.29278564453125, 0.392333984375, 0.49188232421875, 0.5914306640625, 0.69097900390625, 0.79052734375, 0.89007568359375, 0.9896240234375, 1.08917236328125, 1.188720703125, 1.28826904296875, 1.3878173828125, 1.48736572265625, 1.5869140625, 1.68646240234375, 1.7860107421875, 1.88555908203125, 1.985107421875, 2.08465576171875, 2.1842041015625, 2.28375244140625, 2.38330078125, 2.48284912109375, 2.5823974609375, 2.68194580078125, 2.781494140625, 2.88104248046875, 2.9805908203125, 3.08013916015625, 3.1796875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 4.0, 7.0, 8.0, 9.0, 10.0, 15.0, 15.0, 15.0, 22.0, 29.0, 41.0, 75.0, 105.0, 281.0, 868.0, 3163.0, 16501.0, 131020.0, 1822234.0, 2046196.0, 149737.0, 18582.0, 3672.0, 960.0, 299.0, 129.0, 66.0, 53.0, 34.0, 20.0, 27.0, 19.0, 12.0, 8.0, 11.0, 10.0, 7.0, 7.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.25, -8.961181640625, -8.67236328125, -8.383544921875, -8.0947265625, -7.805908203125, -7.51708984375, -7.228271484375, -6.939453125, -6.650634765625, -6.36181640625, -6.072998046875, -5.7841796875, -5.495361328125, -5.20654296875, -4.917724609375, -4.62890625, -4.340087890625, -4.05126953125, -3.762451171875, -3.4736328125, -3.184814453125, -2.89599609375, -2.607177734375, -2.318359375, -2.029541015625, -1.74072265625, -1.451904296875, -1.1630859375, -0.874267578125, -0.58544921875, -0.296630859375, -0.0078125, 0.281005859375, 0.56982421875, 0.858642578125, 1.1474609375, 1.436279296875, 1.72509765625, 2.013916015625, 2.302734375, 2.591552734375, 2.88037109375, 3.169189453125, 3.4580078125, 3.746826171875, 4.03564453125, 4.324462890625, 4.61328125, 4.902099609375, 5.19091796875, 5.479736328125, 5.7685546875, 6.057373046875, 6.34619140625, 6.635009765625, 6.923828125, 7.212646484375, 7.50146484375, 7.790283203125, 8.0791015625, 8.367919921875, 8.65673828125, 8.945556640625, 9.234375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 8.0, 13.0, 17.0, 6.0, 17.0, 34.0, 27.0, 48.0, 48.0, 67.0, 73.0, 84.0, 150.0, 177.0, 231.0, 278.0, 348.0, 416.0, 361.0, 354.0, 308.0, 225.0, 171.0, 128.0, 83.0, 86.0, 73.0, 49.0, 37.0, 43.0, 20.0, 22.0, 16.0, 14.0, 14.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-4.3125, -4.169189453125, -4.02587890625, -3.882568359375, -3.7392578125, -3.595947265625, -3.45263671875, -3.309326171875, -3.166015625, -3.022705078125, -2.87939453125, -2.736083984375, -2.5927734375, -2.449462890625, -2.30615234375, -2.162841796875, -2.01953125, -1.876220703125, -1.73291015625, -1.589599609375, -1.4462890625, -1.302978515625, -1.15966796875, -1.016357421875, -0.873046875, -0.729736328125, -0.58642578125, -0.443115234375, -0.2998046875, -0.156494140625, -0.01318359375, 0.130126953125, 0.2734375, 0.416748046875, 0.56005859375, 0.703369140625, 0.8466796875, 0.989990234375, 1.13330078125, 1.276611328125, 1.419921875, 1.563232421875, 1.70654296875, 1.849853515625, 1.9931640625, 2.136474609375, 2.27978515625, 2.423095703125, 2.56640625, 2.709716796875, 2.85302734375, 2.996337890625, 3.1396484375, 3.282958984375, 3.42626953125, 3.569580078125, 3.712890625, 3.856201171875, 3.99951171875, 4.142822265625, 4.2861328125, 4.429443359375, 4.57275390625, 4.716064453125, 4.859375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 6.0, 16.0, 13.0, 18.0, 21.0, 25.0, 26.0, 51.0, 63.0, 82.0, 111.0, 125.0, 189.0, 252.0, 345.0, 1056.0, 24246.0, 3364574.0, 794177.0, 6955.0, 627.0, 329.0, 241.0, 196.0, 138.0, 81.0, 75.0, 65.0, 43.0, 38.0, 23.0, 19.0, 8.0, 9.0, 15.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.109375, -27.27880859375, -26.4482421875, -25.61767578125, -24.787109375, -23.95654296875, -23.1259765625, -22.29541015625, -21.46484375, -20.63427734375, -19.8037109375, -18.97314453125, -18.142578125, -17.31201171875, -16.4814453125, -15.65087890625, -14.8203125, -13.98974609375, -13.1591796875, -12.32861328125, -11.498046875, -10.66748046875, -9.8369140625, -9.00634765625, -8.17578125, -7.34521484375, -6.5146484375, -5.68408203125, -4.853515625, -4.02294921875, -3.1923828125, -2.36181640625, -1.53125, -0.70068359375, 0.1298828125, 0.96044921875, 1.791015625, 2.62158203125, 3.4521484375, 4.28271484375, 5.11328125, 5.94384765625, 6.7744140625, 7.60498046875, 8.435546875, 9.26611328125, 10.0966796875, 10.92724609375, 11.7578125, 12.58837890625, 13.4189453125, 14.24951171875, 15.080078125, 15.91064453125, 16.7412109375, 17.57177734375, 18.40234375, 19.23291015625, 20.0634765625, 20.89404296875, 21.724609375, 22.55517578125, 23.3857421875, 24.21630859375, 25.046875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 15.0, 16.0, 23.0, 34.0, 45.0, 66.0, 102.0, 103.0, 103.0, 103.0, 96.0, 93.0, 71.0, 52.0, 29.0, 23.0, 10.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.040903091430664, -24.22721290588379, -23.413524627685547, -22.599834442138672, -21.786144256591797, -20.972455978393555, -20.15876579284668, -19.345077514648438, -18.531387329101562, -17.717697143554688, -16.904008865356445, -16.09031867980957, -15.276629447937012, -14.462940216064453, -13.649250030517578, -12.83556079864502, -12.021871566772461, -11.208182334899902, -10.394493103027344, -9.580802917480469, -8.76711368560791, -7.953424453735352, -7.139734745025635, -6.326045036315918, -5.512355804443359, -4.698666572570801, -3.884976863861084, -3.0712873935699463, -2.2575979232788086, -1.44390869140625, -0.6302189826965332, 0.1834707260131836, 0.997161865234375, 1.8108513355255127, 2.6245408058166504, 3.438230276107788, 4.251919746398926, 5.065608978271484, 5.879298686981201, 6.692988395690918, 7.506677627563477, 8.320366859436035, 9.134056091308594, 9.947746276855469, 10.761435508728027, 11.575124740600586, 12.388814926147461, 13.20250415802002, 14.016193389892578, 14.829882621765137, 15.643571853637695, 16.45726203918457, 17.270950317382812, 18.084640502929688, 18.898330688476562, 19.712020874023438, 20.52570915222168, 21.339399337768555, 22.153087615966797, 22.966777801513672, 23.780467987060547, 24.59415626525879, 25.407846450805664, 26.221534729003906, 27.03522491455078]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 9.0, 3.0, 8.0, 9.0, 9.0, 12.0, 20.0, 18.0, 23.0, 27.0, 34.0, 35.0, 35.0, 43.0, 43.0, 45.0, 38.0, 46.0, 30.0, 46.0, 47.0, 46.0, 40.0, 35.0, 42.0, 39.0, 33.0, 29.0, 23.0, 26.0, 25.0, 17.0, 16.0, 16.0, 8.0, 9.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.3619384765625, -21.730127334594727, -21.098318099975586, -20.466506958007812, -19.834697723388672, -19.2028865814209, -18.571075439453125, -17.939266204833984, -17.30745506286621, -16.675643920898438, -16.043834686279297, -15.412023544311523, -14.780213356018066, -14.14840316772461, -13.516592025756836, -12.884781837463379, -12.252971649169922, -11.621161460876465, -10.989351272583008, -10.357540130615234, -9.725729942321777, -9.09391975402832, -8.462108612060547, -7.83029842376709, -7.198488235473633, -6.566678047180176, -5.9348673820495605, -5.303056716918945, -4.671246528625488, -4.039436340332031, -3.407625675201416, -2.775815010070801, -2.1440048217773438, -1.5121943950653076, -0.8803839683532715, -0.24857354164123535, 0.3832368850708008, 1.015047311782837, 1.646857738494873, 2.2786684036254883, 2.9104785919189453, 3.5422890186309814, 4.174099445343018, 4.805910110473633, 5.43772029876709, 6.069530487060547, 6.701341152191162, 7.333151817321777, 7.964962005615234, 8.596772193908691, 9.228582382202148, 9.860393524169922, 10.492203712463379, 11.124013900756836, 11.75582504272461, 12.387635231018066, 13.019445419311523, 13.65125560760498, 14.283065795898438, 14.914876937866211, 15.546687126159668, 16.178497314453125, 16.8103084564209, 17.442119598388672, 18.073928833007812]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 7.0, 11.0, 7.0, 16.0, 25.0, 35.0, 22.0, 41.0, 31.0, 30.0, 41.0, 38.0, 38.0, 47.0, 58.0, 54.0, 55.0, 53.0, 46.0, 40.0, 43.0, 40.0, 36.0, 32.0, 19.0, 31.0, 26.0, 20.0, 9.0, 8.0, 10.0, 8.0, 6.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03515625, -3.919189453125, -3.80322265625, -3.687255859375, -3.5712890625, -3.455322265625, -3.33935546875, -3.223388671875, -3.107421875, -2.991455078125, -2.87548828125, -2.759521484375, -2.6435546875, -2.527587890625, -2.41162109375, -2.295654296875, -2.1796875, -2.063720703125, -1.94775390625, -1.831787109375, -1.7158203125, -1.599853515625, -1.48388671875, -1.367919921875, -1.251953125, -1.135986328125, -1.02001953125, -0.904052734375, -0.7880859375, -0.672119140625, -0.55615234375, -0.440185546875, -0.32421875, -0.208251953125, -0.09228515625, 0.023681640625, 0.1396484375, 0.255615234375, 0.37158203125, 0.487548828125, 0.603515625, 0.719482421875, 0.83544921875, 0.951416015625, 1.0673828125, 1.183349609375, 1.29931640625, 1.415283203125, 1.53125, 1.647216796875, 1.76318359375, 1.879150390625, 1.9951171875, 2.111083984375, 2.22705078125, 2.343017578125, 2.458984375, 2.574951171875, 2.69091796875, 2.806884765625, 2.9228515625, 3.038818359375, 3.15478515625, 3.270751953125, 3.38671875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 4.0, 16.0, 15.0, 22.0, 34.0, 60.0, 82.0, 145.0, 216.0, 321.0, 610.0, 960.0, 1604.0, 2674.0, 4767.0, 8167.0, 14516.0, 25665.0, 47695.0, 94517.0, 229987.0, 352576.0, 126914.0, 61727.0, 32694.0, 18127.0, 10178.0, 6031.0, 3317.0, 1916.0, 1157.0, 715.0, 395.0, 235.0, 187.0, 93.0, 81.0, 41.0, 27.0, 22.0, 14.0, 14.0, 7.0, 4.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0242767333984375, -0.02358698844909668, -0.02289724349975586, -0.02220749855041504, -0.02151775360107422, -0.0208280086517334, -0.020138263702392578, -0.019448518753051758, -0.018758773803710938, -0.018069028854370117, -0.017379283905029297, -0.016689538955688477, -0.015999794006347656, -0.015310049057006836, -0.014620304107666016, -0.013930559158325195, -0.013240814208984375, -0.012551069259643555, -0.011861324310302734, -0.011171579360961914, -0.010481834411621094, -0.009792089462280273, -0.009102344512939453, -0.008412599563598633, -0.0077228546142578125, -0.007033109664916992, -0.006343364715576172, -0.0056536197662353516, -0.004963874816894531, -0.004274129867553711, -0.0035843849182128906, -0.0028946399688720703, -0.00220489501953125, -0.0015151500701904297, -0.0008254051208496094, -0.00013566017150878906, 0.0005540847778320312, 0.0012438297271728516, 0.0019335746765136719, 0.002623319625854492, 0.0033130645751953125, 0.004002809524536133, 0.004692554473876953, 0.0053822994232177734, 0.006072044372558594, 0.006761789321899414, 0.007451534271240234, 0.008141279220581055, 0.008831024169921875, 0.009520769119262695, 0.010210514068603516, 0.010900259017944336, 0.011590003967285156, 0.012279748916625977, 0.012969493865966797, 0.013659238815307617, 0.014348983764648438, 0.015038728713989258, 0.015728473663330078, 0.0164182186126709, 0.01710796356201172, 0.01779770851135254, 0.01848745346069336, 0.01917719841003418, 0.019866943359375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 4.0, 3.0, 3.0, 8.0, 8.0, 16.0, 16.0, 12.0, 19.0, 27.0, 24.0, 27.0, 21.0, 32.0, 39.0, 36.0, 29.0, 34.0, 27.0, 30.0, 46.0, 1061.0, 42.0, 42.0, 32.0, 37.0, 28.0, 39.0, 38.0, 27.0, 33.0, 31.0, 23.0, 26.0, 17.0, 13.0, 13.0, 12.0, 12.0, 6.0, 11.0, 4.0, 6.0, 7.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8779296875, -1.8183441162109375, -1.758758544921875, -1.6991729736328125, -1.63958740234375, -1.5800018310546875, -1.520416259765625, -1.4608306884765625, -1.4012451171875, -1.3416595458984375, -1.282073974609375, -1.2224884033203125, -1.16290283203125, -1.1033172607421875, -1.043731689453125, -0.9841461181640625, -0.924560546875, -0.8649749755859375, -0.805389404296875, -0.7458038330078125, -0.68621826171875, -0.6266326904296875, -0.567047119140625, -0.5074615478515625, -0.4478759765625, -0.3882904052734375, -0.328704833984375, -0.2691192626953125, -0.20953369140625, -0.1499481201171875, -0.090362548828125, -0.0307769775390625, 0.02880859375, 0.0883941650390625, 0.147979736328125, 0.2075653076171875, 0.26715087890625, 0.3267364501953125, 0.386322021484375, 0.4459075927734375, 0.5054931640625, 0.5650787353515625, 0.624664306640625, 0.6842498779296875, 0.74383544921875, 0.8034210205078125, 0.863006591796875, 0.9225921630859375, 0.982177734375, 1.0417633056640625, 1.101348876953125, 1.1609344482421875, 1.22052001953125, 1.2801055908203125, 1.339691162109375, 1.3992767333984375, 1.4588623046875, 1.5184478759765625, 1.578033447265625, 1.6376190185546875, 1.69720458984375, 1.7567901611328125, 1.816375732421875, 1.8759613037109375, 1.935546875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 4.0, 14.0, 29.0, 35.0, 46.0, 48.0, 95.0, 168.0, 247.0, 358.0, 506.0, 797.0, 1264.0, 1928.0, 2914.0, 4449.0, 7161.0, 11035.0, 17574.0, 28485.0, 46274.0, 77277.0, 142260.0, 1338332.0, 182168.0, 91030.0, 53894.0, 32694.0, 20331.0, 12802.0, 8132.0, 5059.0, 3361.0, 2196.0, 1377.0, 918.0, 610.0, 451.0, 276.0, 185.0, 119.0, 89.0, 43.0, 30.0, 23.0, 19.0, 9.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0118408203125, -0.011478185653686523, -0.011115550994873047, -0.01075291633605957, -0.010390281677246094, -0.010027647018432617, -0.00966501235961914, -0.009302377700805664, -0.008939743041992188, -0.008577108383178711, -0.008214473724365234, -0.007851839065551758, -0.007489204406738281, -0.007126569747924805, -0.006763935089111328, -0.0064013004302978516, -0.006038665771484375, -0.0056760311126708984, -0.005313396453857422, -0.004950761795043945, -0.004588127136230469, -0.004225492477416992, -0.0038628578186035156, -0.003500223159790039, -0.0031375885009765625, -0.002774953842163086, -0.0024123191833496094, -0.002049684524536133, -0.0016870498657226562, -0.0013244152069091797, -0.0009617805480957031, -0.0005991458892822266, -0.00023651123046875, 0.00012612342834472656, 0.0004887580871582031, 0.0008513927459716797, 0.0012140274047851562, 0.0015766620635986328, 0.0019392967224121094, 0.002301931381225586, 0.0026645660400390625, 0.003027200698852539, 0.0033898353576660156, 0.003752470016479492, 0.004115104675292969, 0.004477739334106445, 0.004840373992919922, 0.0052030086517333984, 0.005565643310546875, 0.0059282779693603516, 0.006290912628173828, 0.006653547286987305, 0.007016181945800781, 0.007378816604614258, 0.007741451263427734, 0.008104085922241211, 0.008466720581054688, 0.008829355239868164, 0.00919198989868164, 0.009554624557495117, 0.009917259216308594, 0.01027989387512207, 0.010642528533935547, 0.011005163192749023, 0.0113677978515625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 839.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-07, -1.7229467630386353e-07, -1.6577541828155518e-07, -1.5925616025924683e-07, -1.5273690223693848e-07, -1.4621764421463013e-07, -1.3969838619232178e-07, -1.3317912817001343e-07, -1.2665987014770508e-07, -1.2014061212539673e-07, -1.1362135410308838e-07, -1.0710209608078003e-07, -1.0058283805847168e-07, -9.406358003616333e-08, -8.754432201385498e-08, -8.102506399154663e-08, -7.450580596923828e-08, -6.798654794692993e-08, -6.146728992462158e-08, -5.494803190231323e-08, -4.842877388000488e-08, -4.190951585769653e-08, -3.5390257835388184e-08, -2.8870999813079834e-08, -2.2351741790771484e-08, -1.5832483768463135e-08, -9.313225746154785e-09, -2.7939677238464355e-09, 3.725290298461914e-09, 1.0244548320770264e-08, 1.6763806343078613e-08, 2.3283064365386963e-08, 2.9802322387695312e-08, 3.632158041000366e-08, 4.284083843231201e-08, 4.936009645462036e-08, 5.587935447692871e-08, 6.239861249923706e-08, 6.891787052154541e-08, 7.543712854385376e-08, 8.195638656616211e-08, 8.847564458847046e-08, 9.499490261077881e-08, 1.0151416063308716e-07, 1.0803341865539551e-07, 1.1455267667770386e-07, 1.210719347000122e-07, 1.2759119272232056e-07, 1.341104507446289e-07, 1.4062970876693726e-07, 1.471489667892456e-07, 1.5366822481155396e-07, 1.601874828338623e-07, 1.6670674085617065e-07, 1.73225998878479e-07, 1.7974525690078735e-07, 1.862645149230957e-07, 1.9278377294540405e-07, 1.993030309677124e-07, 2.0582228899002075e-07, 2.123415470123291e-07, 2.1886080503463745e-07, 2.253800630569458e-07, 2.3189932107925415e-07, 2.384185791015625e-07]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 14.0, 25.0, 30.0, 22.0, 1.0, 2.0, 11.0, 85.0, 116.0, 558.0, 46634.0, 1000180.0, 573.0, 112.0, 52.0, 50.0, 3.0, 0.0, 21.0, 19.0, 34.0, 17.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-06, -4.636123776435852e-06, -4.503875970840454e-06, -4.371628165245056e-06, -4.239380359649658e-06, -4.10713255405426e-06, -3.974884748458862e-06, -3.842636942863464e-06, -3.7103891372680664e-06, -3.5781413316726685e-06, -3.4458935260772705e-06, -3.3136457204818726e-06, -3.1813979148864746e-06, -3.0491501092910767e-06, -2.9169023036956787e-06, -2.7846544981002808e-06, -2.652406692504883e-06, -2.520158886909485e-06, -2.387911081314087e-06, -2.255663275718689e-06, -2.123415470123291e-06, -1.991167664527893e-06, -1.8589198589324951e-06, -1.7266720533370972e-06, -1.5944242477416992e-06, -1.4621764421463013e-06, -1.3299286365509033e-06, -1.1976808309555054e-06, -1.0654330253601074e-06, -9.331852197647095e-07, -8.009374141693115e-07, -6.686896085739136e-07, -5.364418029785156e-07, -4.041939973831177e-07, -2.7194619178771973e-07, -1.3969838619232178e-07, -7.450580596923828e-09, 1.2479722499847412e-07, 2.5704503059387207e-07, 3.8929283618927e-07, 5.21540641784668e-07, 6.537884473800659e-07, 7.860362529754639e-07, 9.182840585708618e-07, 1.0505318641662598e-06, 1.1827796697616577e-06, 1.3150274753570557e-06, 1.4472752809524536e-06, 1.5795230865478516e-06, 1.7117708921432495e-06, 1.8440186977386475e-06, 1.9762665033340454e-06, 2.1085143089294434e-06, 2.2407621145248413e-06, 2.3730099201202393e-06, 2.505257725715637e-06, 2.637505531311035e-06, 2.769753336906433e-06, 2.902001142501831e-06, 3.034248948097229e-06, 3.166496753692627e-06, 3.298744559288025e-06, 3.430992364883423e-06, 3.563240170478821e-06, 3.6954879760742188e-06]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1023.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 2.3011285932295067e-10, 4.6022571864590134e-10, 6.903385640910642e-10, 9.204514372918027e-10, 1.1505643104925412e-09, 1.3806771281821284e-09, 1.6107900568940181e-09, 1.8409028745836054e-09, 2.071015803295495e-09, 2.3011286209850823e-09, 2.5312414386746696e-09, 2.761354256364257e-09, 2.991467074053844e-09, 3.2215798917434313e-09, 3.4516929314776235e-09, 3.6818057491672107e-09, 3.911918788901403e-09, 4.14203160659099e-09, 4.372144424280577e-09, 4.602257241970165e-09, 4.832370059659752e-09, 5.062482877349339e-09, 5.292595695038926e-09, 5.522708512728514e-09, 5.752821330418101e-09, 5.982934148107688e-09, 6.213046965797275e-09, 6.4431597834868626e-09, 6.67327260117645e-09, 6.903385418866037e-09, 7.133498680644834e-09, 7.363611498334421e-09, 7.593724760113219e-09, 7.823837577802806e-09, 8.053950395492393e-09, 8.28406321318198e-09, 8.514176030871567e-09, 8.744288848561155e-09, 8.974401666250742e-09, 9.20451448394033e-09, 9.434627301629916e-09, 9.664740119319504e-09, 9.894852937009091e-09, 1.0124965754698678e-08, 1.0355078572388265e-08, 1.0585191390077853e-08, 1.081530420776744e-08, 1.1045417025457027e-08, 1.1275529843146614e-08, 1.1505642660836202e-08, 1.1735755478525789e-08, 1.1965868296215376e-08, 1.2195981113904963e-08, 1.242609393159455e-08, 1.2656206749284138e-08, 1.2886320455152145e-08, 1.3116433272841732e-08, 1.334654609053132e-08, 1.3576658908220907e-08, 1.3806771725910494e-08, 1.4036884543600081e-08, 1.4266997361289668e-08, 1.4497110178979256e-08, 1.4727222996668843e-08]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1023.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 9.313225746154785e-10, 1.862645149230957e-09, 2.7939677238464355e-09, 3.725290298461914e-09, 4.6566128730773926e-09, 5.587935447692871e-09, 6.51925802230835e-09, 7.450580596923828e-09, 8.381903171539307e-09, 9.313225746154785e-09, 1.0244548320770264e-08, 1.1175870895385742e-08, 1.210719347000122e-08, 1.30385160446167e-08, 1.3969838619232178e-08, 1.4901161193847656e-08, 1.5832483768463135e-08, 1.6763806343078613e-08, 1.7695128917694092e-08, 1.862645149230957e-08, 1.955777406692505e-08, 2.0489096641540527e-08, 2.1420419216156006e-08, 2.2351741790771484e-08, 2.3283064365386963e-08, 2.421438694000244e-08, 2.514570951461792e-08, 2.60770320892334e-08, 2.7008354663848877e-08, 2.7939677238464355e-08, 2.8870999813079834e-08, 2.9802322387695312e-08, 3.073364496231079e-08, 3.166496753692627e-08, 3.259629011154175e-08, 3.3527612686157227e-08, 3.4458935260772705e-08, 3.5390257835388184e-08, 3.632158041000366e-08, 3.725290298461914e-08, 3.818422555923462e-08, 3.91155481338501e-08, 4.0046870708465576e-08, 4.0978193283081055e-08, 4.190951585769653e-08, 4.284083843231201e-08, 4.377216100692749e-08, 4.470348358154297e-08, 4.563480615615845e-08, 4.6566128730773926e-08, 4.7497451305389404e-08, 4.842877388000488e-08, 4.936009645462036e-08, 5.029141902923584e-08, 5.122274160385132e-08, 5.21540641784668e-08, 5.3085386753082275e-08, 5.4016709327697754e-08, 5.494803190231323e-08, 5.587935447692871e-08, 5.681067705154419e-08, 5.774199962615967e-08, 5.8673322200775146e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 7.0, 11.0, 7.0, 16.0, 25.0, 35.0, 22.0, 41.0, 31.0, 30.0, 41.0, 38.0, 38.0, 47.0, 58.0, 54.0, 55.0, 53.0, 46.0, 40.0, 43.0, 40.0, 36.0, 32.0, 19.0, 31.0, 26.0, 20.0, 9.0, 8.0, 10.0, 8.0, 6.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03515625, -3.919189453125, -3.80322265625, -3.687255859375, -3.5712890625, -3.455322265625, -3.33935546875, -3.223388671875, -3.107421875, -2.991455078125, -2.87548828125, -2.759521484375, -2.6435546875, -2.527587890625, -2.41162109375, -2.295654296875, -2.1796875, -2.063720703125, -1.94775390625, -1.831787109375, -1.7158203125, -1.599853515625, -1.48388671875, -1.367919921875, -1.251953125, -1.135986328125, -1.02001953125, -0.904052734375, -0.7880859375, -0.672119140625, -0.55615234375, -0.440185546875, -0.32421875, -0.208251953125, -0.09228515625, 0.023681640625, 0.1396484375, 0.255615234375, 0.37158203125, 0.487548828125, 0.603515625, 0.719482421875, 0.83544921875, 0.951416015625, 1.0673828125, 1.183349609375, 1.29931640625, 1.415283203125, 1.53125, 1.647216796875, 1.76318359375, 1.879150390625, 1.9951171875, 2.111083984375, 2.22705078125, 2.343017578125, 2.458984375, 2.574951171875, 2.69091796875, 2.806884765625, 2.9228515625, 3.038818359375, 3.15478515625, 3.270751953125, 3.38671875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 8.0, 13.0, 15.0, 14.0, 27.0, 49.0, 62.0, 85.0, 132.0, 216.0, 442.0, 1056.0, 2814.0, 7952.0, 22928.0, 100084.0, 715148.0, 152961.0, 28944.0, 9695.0, 3434.0, 1301.0, 503.0, 252.0, 135.0, 77.0, 53.0, 51.0, 28.0, 16.0, 16.0, 11.0, 9.0, 6.0, 10.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69921875, -5.53448486328125, -5.3697509765625, -5.20501708984375, -5.040283203125, -4.87554931640625, -4.7108154296875, -4.54608154296875, -4.38134765625, -4.21661376953125, -4.0518798828125, -3.88714599609375, -3.722412109375, -3.55767822265625, -3.3929443359375, -3.22821044921875, -3.0634765625, -2.89874267578125, -2.7340087890625, -2.56927490234375, -2.404541015625, -2.23980712890625, -2.0750732421875, -1.91033935546875, -1.74560546875, -1.58087158203125, -1.4161376953125, -1.25140380859375, -1.086669921875, -0.92193603515625, -0.7572021484375, -0.59246826171875, -0.427734375, -0.26300048828125, -0.0982666015625, 0.06646728515625, 0.231201171875, 0.39593505859375, 0.5606689453125, 0.72540283203125, 0.89013671875, 1.05487060546875, 1.2196044921875, 1.38433837890625, 1.549072265625, 1.71380615234375, 1.8785400390625, 2.04327392578125, 2.2080078125, 2.37274169921875, 2.5374755859375, 2.70220947265625, 2.866943359375, 3.03167724609375, 3.1964111328125, 3.36114501953125, 3.52587890625, 3.69061279296875, 3.8553466796875, 4.02008056640625, 4.184814453125, 4.34954833984375, 4.5142822265625, 4.67901611328125, 4.84375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 7.0, 6.0, 9.0, 8.0, 7.0, 5.0, 17.0, 11.0, 17.0, 10.0, 12.0, 17.0, 25.0, 28.0, 33.0, 38.0, 31.0, 33.0, 58.0, 55.0, 97.0, 221.0, 1656.0, 163.0, 75.0, 48.0, 35.0, 40.0, 35.0, 38.0, 22.0, 19.0, 31.0, 23.0, 20.0, 16.0, 20.0, 14.0, 10.0, 12.0, 11.0, 8.0, 5.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.78125, -8.4920654296875, -8.202880859375, -7.9136962890625, -7.62451171875, -7.3353271484375, -7.046142578125, -6.7569580078125, -6.4677734375, -6.1785888671875, -5.889404296875, -5.6002197265625, -5.31103515625, -5.0218505859375, -4.732666015625, -4.4434814453125, -4.154296875, -3.8651123046875, -3.575927734375, -3.2867431640625, -2.99755859375, -2.7083740234375, -2.419189453125, -2.1300048828125, -1.8408203125, -1.5516357421875, -1.262451171875, -0.9732666015625, -0.68408203125, -0.3948974609375, -0.105712890625, 0.1834716796875, 0.47265625, 0.7618408203125, 1.051025390625, 1.3402099609375, 1.62939453125, 1.9185791015625, 2.207763671875, 2.4969482421875, 2.7861328125, 3.0753173828125, 3.364501953125, 3.6536865234375, 3.94287109375, 4.2320556640625, 4.521240234375, 4.8104248046875, 5.099609375, 5.3887939453125, 5.677978515625, 5.9671630859375, 6.25634765625, 6.5455322265625, 6.834716796875, 7.1239013671875, 7.4130859375, 7.7022705078125, 7.991455078125, 8.2806396484375, 8.56982421875, 8.8590087890625, 9.148193359375, 9.4373779296875, 9.7265625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 0.0, 5.0, 4.0, 6.0, 14.0, 8.0, 15.0, 12.0, 24.0, 18.0, 23.0, 40.0, 29.0, 35.0, 49.0, 65.0, 115.0, 140.0, 255.0, 650.0, 4288.0, 703249.0, 2428852.0, 6155.0, 778.0, 262.0, 162.0, 109.0, 77.0, 51.0, 43.0, 27.0, 21.0, 14.0, 13.0, 16.0, 14.0, 14.0, 13.0, 6.0, 6.0, 12.0, 6.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-23.53125, -22.84033203125, -22.1494140625, -21.45849609375, -20.767578125, -20.07666015625, -19.3857421875, -18.69482421875, -18.00390625, -17.31298828125, -16.6220703125, -15.93115234375, -15.240234375, -14.54931640625, -13.8583984375, -13.16748046875, -12.4765625, -11.78564453125, -11.0947265625, -10.40380859375, -9.712890625, -9.02197265625, -8.3310546875, -7.64013671875, -6.94921875, -6.25830078125, -5.5673828125, -4.87646484375, -4.185546875, -3.49462890625, -2.8037109375, -2.11279296875, -1.421875, -0.73095703125, -0.0400390625, 0.65087890625, 1.341796875, 2.03271484375, 2.7236328125, 3.41455078125, 4.10546875, 4.79638671875, 5.4873046875, 6.17822265625, 6.869140625, 7.56005859375, 8.2509765625, 8.94189453125, 9.6328125, 10.32373046875, 11.0146484375, 11.70556640625, 12.396484375, 13.08740234375, 13.7783203125, 14.46923828125, 15.16015625, 15.85107421875, 16.5419921875, 17.23291015625, 17.923828125, 18.61474609375, 19.3056640625, 19.99658203125, 20.6875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 18.0, 39.0, 70.0, 96.0, 116.0, 152.0, 154.0, 139.0, 81.0, 65.0, 30.0, 23.0, 8.0, 8.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.624663352966309, -5.2265753746032715, -4.828487396240234, -4.4303998947143555, -4.032311916351318, -3.6342239379882812, -3.2361361980438232, -2.8380484580993652, -2.439960479736328, -2.041872501373291, -1.643784761428833, -1.2456969022750854, -0.8476090431213379, -0.44952118396759033, -0.05143332481384277, 0.34665441513061523, 0.7447423934936523, 1.1428302526474, 1.5409181118011475, 1.939005970954895, 2.3370938301086426, 2.7351818084716797, 3.1332695484161377, 3.5313572883605957, 3.929445266723633, 4.32753324508667, 4.725621223449707, 5.123708724975586, 5.521796703338623, 5.91988468170166, 6.317972183227539, 6.716060161590576, 7.11414909362793, 7.512237071990967, 7.910325050354004, 8.308412551879883, 8.706501007080078, 9.104588508605957, 9.502676010131836, 9.900764465332031, 10.29885196685791, 10.696939468383789, 11.095027923583984, 11.493115425109863, 11.891202926635742, 12.289291381835938, 12.687378883361816, 13.085466384887695, 13.48355484008789, 13.88164234161377, 14.279730796813965, 14.677818298339844, 15.075906753540039, 15.473994255065918, 15.872081756591797, 16.270170211791992, 16.668258666992188, 17.066347122192383, 17.464433670043945, 17.86252212524414, 18.260610580444336, 18.6586971282959, 19.056785583496094, 19.45487403869629, 19.85296058654785]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 9.0, 4.0, 9.0, 17.0, 14.0, 19.0, 17.0, 29.0, 22.0, 38.0, 29.0, 30.0, 38.0, 47.0, 49.0, 44.0, 44.0, 53.0, 44.0, 41.0, 44.0, 43.0, 46.0, 33.0, 44.0, 33.0, 25.0, 20.0, 19.0, 22.0, 15.0, 13.0, 8.0, 12.0, 5.0, 3.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.866119384765625, -33.842620849609375, -32.81912612915039, -31.79562759399414, -30.77212905883789, -29.748632431030273, -28.725135803222656, -27.701637268066406, -26.67814064025879, -25.654644012451172, -24.631145477294922, -23.607648849487305, -22.584152221679688, -21.560653686523438, -20.53715705871582, -19.513660430908203, -18.490161895751953, -17.466665267944336, -16.443166732788086, -15.419670104980469, -14.396172523498535, -13.372674942016602, -12.349178314208984, -11.32568073272705, -10.302183151245117, -9.278685569763184, -8.25518798828125, -7.231691360473633, -6.208193778991699, -5.184696197509766, -4.16119909286499, -3.137701988220215, -2.114208221435547, -1.0907108783721924, -0.06721353530883789, 0.9562838077545166, 1.979781150817871, 3.0032787322998047, 4.02677583694458, 5.0502729415893555, 6.073770523071289, 7.097268104553223, 8.120765686035156, 9.144262313842773, 10.167759895324707, 11.19125747680664, 12.214754104614258, 13.238251686096191, 14.261749267578125, 15.285246849060059, 16.308744430541992, 17.33224105834961, 18.35573959350586, 19.379236221313477, 20.402732849121094, 21.426231384277344, 22.44972801208496, 23.473224639892578, 24.496723175048828, 25.520219802856445, 26.543716430664062, 27.567214965820312, 28.59071159362793, 29.614208221435547, 30.637706756591797]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 9.0, 6.0, 5.0, 12.0, 9.0, 20.0, 32.0, 33.0, 26.0, 37.0, 34.0, 37.0, 41.0, 46.0, 40.0, 52.0, 57.0, 53.0, 48.0, 47.0, 52.0, 42.0, 30.0, 38.0, 28.0, 31.0, 30.0, 25.0, 29.0, 14.0, 8.0, 10.0, 10.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.083953857421875, -3.96087646484375, -3.837799072265625, -3.7147216796875, -3.591644287109375, -3.46856689453125, -3.345489501953125, -3.222412109375, -3.099334716796875, -2.97625732421875, -2.853179931640625, -2.7301025390625, -2.607025146484375, -2.48394775390625, -2.360870361328125, -2.23779296875, -2.114715576171875, -1.99163818359375, -1.868560791015625, -1.7454833984375, -1.622406005859375, -1.49932861328125, -1.376251220703125, -1.253173828125, -1.130096435546875, -1.00701904296875, -0.883941650390625, -0.7608642578125, -0.637786865234375, -0.51470947265625, -0.391632080078125, -0.2685546875, -0.145477294921875, -0.02239990234375, 0.100677490234375, 0.2237548828125, 0.346832275390625, 0.46990966796875, 0.592987060546875, 0.716064453125, 0.839141845703125, 0.96221923828125, 1.085296630859375, 1.2083740234375, 1.331451416015625, 1.45452880859375, 1.577606201171875, 1.70068359375, 1.823760986328125, 1.94683837890625, 2.069915771484375, 2.1929931640625, 2.316070556640625, 2.43914794921875, 2.562225341796875, 2.685302734375, 2.808380126953125, 2.93145751953125, 3.054534912109375, 3.1776123046875, 3.300689697265625, 3.42376708984375, 3.546844482421875, 3.669921875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 8.0, 22.0, 23.0, 33.0, 48.0, 75.0, 130.0, 212.0, 318.0, 485.0, 852.0, 1439.0, 2629.0, 5074.0, 10092.0, 20514.0, 44757.0, 104572.0, 266941.0, 675883.0, 1258672.0, 1037679.0, 452914.0, 175046.0, 72178.0, 31965.0, 15352.0, 7430.0, 3914.0, 2116.0, 1094.0, 678.0, 424.0, 254.0, 169.0, 97.0, 62.0, 43.0, 26.0, 22.0, 12.0, 7.0, 5.0, 8.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.625, -3.520782470703125, -3.41656494140625, -3.312347412109375, -3.2081298828125, -3.103912353515625, -2.99969482421875, -2.895477294921875, -2.791259765625, -2.687042236328125, -2.58282470703125, -2.478607177734375, -2.3743896484375, -2.270172119140625, -2.16595458984375, -2.061737060546875, -1.95751953125, -1.853302001953125, -1.74908447265625, -1.644866943359375, -1.5406494140625, -1.436431884765625, -1.33221435546875, -1.227996826171875, -1.123779296875, -1.019561767578125, -0.91534423828125, -0.811126708984375, -0.7069091796875, -0.602691650390625, -0.49847412109375, -0.394256591796875, -0.2900390625, -0.185821533203125, -0.08160400390625, 0.022613525390625, 0.1268310546875, 0.231048583984375, 0.33526611328125, 0.439483642578125, 0.543701171875, 0.647918701171875, 0.75213623046875, 0.856353759765625, 0.9605712890625, 1.064788818359375, 1.16900634765625, 1.273223876953125, 1.37744140625, 1.481658935546875, 1.58587646484375, 1.690093994140625, 1.7943115234375, 1.898529052734375, 2.00274658203125, 2.106964111328125, 2.211181640625, 2.315399169921875, 2.41961669921875, 2.523834228515625, 2.6280517578125, 2.732269287109375, 2.83648681640625, 2.940704345703125, 3.044921875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 6.0, 14.0, 15.0, 17.0, 28.0, 38.0, 38.0, 64.0, 69.0, 85.0, 102.0, 135.0, 180.0, 251.0, 272.0, 337.0, 372.0, 399.0, 318.0, 249.0, 228.0, 167.0, 132.0, 106.0, 92.0, 74.0, 50.0, 51.0, 42.0, 28.0, 13.0, 18.0, 19.0, 12.0, 4.0, 10.0, 11.0, 4.0, 5.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.77734375, -4.62762451171875, -4.4779052734375, -4.32818603515625, -4.178466796875, -4.02874755859375, -3.8790283203125, -3.72930908203125, -3.57958984375, -3.42987060546875, -3.2801513671875, -3.13043212890625, -2.980712890625, -2.83099365234375, -2.6812744140625, -2.53155517578125, -2.3818359375, -2.23211669921875, -2.0823974609375, -1.93267822265625, -1.782958984375, -1.63323974609375, -1.4835205078125, -1.33380126953125, -1.18408203125, -1.03436279296875, -0.8846435546875, -0.73492431640625, -0.585205078125, -0.43548583984375, -0.2857666015625, -0.13604736328125, 0.013671875, 0.16339111328125, 0.3131103515625, 0.46282958984375, 0.612548828125, 0.76226806640625, 0.9119873046875, 1.06170654296875, 1.21142578125, 1.36114501953125, 1.5108642578125, 1.66058349609375, 1.810302734375, 1.96002197265625, 2.1097412109375, 2.25946044921875, 2.4091796875, 2.55889892578125, 2.7086181640625, 2.85833740234375, 3.008056640625, 3.15777587890625, 3.3074951171875, 3.45721435546875, 3.60693359375, 3.75665283203125, 3.9063720703125, 4.05609130859375, 4.205810546875, 4.35552978515625, 4.5052490234375, 4.65496826171875, 4.8046875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 9.0, 5.0, 4.0, 9.0, 16.0, 6.0, 20.0, 21.0, 31.0, 29.0, 51.0, 64.0, 92.0, 98.0, 149.0, 197.0, 265.0, 379.0, 722.0, 3108.0, 76417.0, 3370893.0, 724153.0, 14518.0, 1361.0, 496.0, 325.0, 240.0, 136.0, 118.0, 103.0, 63.0, 50.0, 42.0, 28.0, 22.0, 16.0, 10.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.953125, -18.337158203125, -17.72119140625, -17.105224609375, -16.4892578125, -15.873291015625, -15.25732421875, -14.641357421875, -14.025390625, -13.409423828125, -12.79345703125, -12.177490234375, -11.5615234375, -10.945556640625, -10.32958984375, -9.713623046875, -9.09765625, -8.481689453125, -7.86572265625, -7.249755859375, -6.6337890625, -6.017822265625, -5.40185546875, -4.785888671875, -4.169921875, -3.553955078125, -2.93798828125, -2.322021484375, -1.7060546875, -1.090087890625, -0.47412109375, 0.141845703125, 0.7578125, 1.373779296875, 1.98974609375, 2.605712890625, 3.2216796875, 3.837646484375, 4.45361328125, 5.069580078125, 5.685546875, 6.301513671875, 6.91748046875, 7.533447265625, 8.1494140625, 8.765380859375, 9.38134765625, 9.997314453125, 10.61328125, 11.229248046875, 11.84521484375, 12.461181640625, 13.0771484375, 13.693115234375, 14.30908203125, 14.925048828125, 15.541015625, 16.156982421875, 16.77294921875, 17.388916015625, 18.0048828125, 18.620849609375, 19.23681640625, 19.852783203125, 20.46875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 12.0, 47.0, 166.0, 322.0, 263.0, 148.0, 38.0, 15.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.80194091796875, -109.36416625976562, -106.92639923095703, -104.4886245727539, -102.05085754394531, -99.61308288574219, -97.17530822753906, -94.73754119873047, -92.29976654052734, -89.86199188232422, -87.42422485351562, -84.9864501953125, -82.5486831665039, -80.11090850830078, -77.67314147949219, -75.23536682128906, -72.79759216308594, -70.35981750488281, -67.92205047607422, -65.4842758178711, -63.046504974365234, -60.608734130859375, -58.170963287353516, -55.733192443847656, -53.29542541503906, -50.8576545715332, -48.419883728027344, -45.98210906982422, -43.54433822631836, -41.1065673828125, -38.66879653930664, -36.23102569580078, -33.793251037597656, -31.355480194091797, -28.917707443237305, -26.479936599731445, -24.042163848876953, -21.604393005371094, -19.166622161865234, -16.728849411010742, -14.291078567504883, -11.853306770324707, -9.415534973144531, -6.977764129638672, -4.539992332458496, -2.1022205352783203, 0.33555030822753906, 2.7733230590820312, 5.211093902587891, 7.648865699768066, 10.086637496948242, 12.524408340454102, 14.962180137634277, 17.399951934814453, 19.837722778320312, 22.275495529174805, 24.713266372680664, 27.151037216186523, 29.588809967041016, 32.026580810546875, 34.464351654052734, 36.902122497558594, 39.33989715576172, 41.77766799926758, 44.21543884277344]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 1.0, 5.0, 10.0, 3.0, 9.0, 7.0, 18.0, 13.0, 14.0, 20.0, 20.0, 13.0, 23.0, 24.0, 36.0, 28.0, 34.0, 52.0, 38.0, 37.0, 38.0, 54.0, 39.0, 41.0, 38.0, 46.0, 41.0, 42.0, 36.0, 34.0, 32.0, 30.0, 21.0, 25.0, 17.0, 5.0, 12.0, 8.0, 9.0, 9.0, 8.0, 4.0, 5.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5845947265625, -18.91526222229004, -18.245929718017578, -17.576597213745117, -16.907264709472656, -16.237934112548828, -15.568601608276367, -14.899269104003906, -14.229936599731445, -13.560604095458984, -12.891271591186523, -12.221940040588379, -11.552607536315918, -10.883275032043457, -10.213943481445312, -9.544610977172852, -8.87527847290039, -8.20594596862793, -7.536613941192627, -6.867281913757324, -6.197949409484863, -5.528616905212402, -4.8592848777771, -4.189952850341797, -3.520620346069336, -2.851288080215454, -2.1819558143615723, -1.5126235485076904, -0.8432912826538086, -0.17395901679992676, 0.4953732490539551, 1.1647052764892578, 1.8340377807617188, 2.5033700466156006, 3.1727023124694824, 3.8420345783233643, 4.511366844177246, 5.180699348449707, 5.85003137588501, 6.5193634033203125, 7.188695907592773, 7.858028411865234, 8.527360916137695, 9.19669246673584, 9.8660249710083, 10.535357475280762, 11.204689025878906, 11.874021530151367, 12.543354034423828, 13.212686538696289, 13.88201904296875, 14.551350593566895, 15.220683097839355, 15.890015602111816, 16.55934715270996, 17.228679656982422, 17.898012161254883, 18.567344665527344, 19.236677169799805, 19.906009674072266, 20.575340270996094, 21.244672775268555, 21.914005279541016, 22.583337783813477, 23.252670288085938]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 11.0, 11.0, 7.0, 21.0, 12.0, 24.0, 45.0, 32.0, 25.0, 39.0, 42.0, 33.0, 35.0, 41.0, 58.0, 58.0, 55.0, 43.0, 42.0, 45.0, 45.0, 45.0, 37.0, 29.0, 28.0, 23.0, 23.0, 19.0, 19.0, 12.0, 15.0, 6.0, 8.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.08984375, -3.97320556640625, -3.8565673828125, -3.73992919921875, -3.623291015625, -3.50665283203125, -3.3900146484375, -3.27337646484375, -3.15673828125, -3.04010009765625, -2.9234619140625, -2.80682373046875, -2.690185546875, -2.57354736328125, -2.4569091796875, -2.34027099609375, -2.2236328125, -2.10699462890625, -1.9903564453125, -1.87371826171875, -1.757080078125, -1.64044189453125, -1.5238037109375, -1.40716552734375, -1.29052734375, -1.17388916015625, -1.0572509765625, -0.94061279296875, -0.823974609375, -0.70733642578125, -0.5906982421875, -0.47406005859375, -0.357421875, -0.24078369140625, -0.1241455078125, -0.00750732421875, 0.109130859375, 0.22576904296875, 0.3424072265625, 0.45904541015625, 0.57568359375, 0.69232177734375, 0.8089599609375, 0.92559814453125, 1.042236328125, 1.15887451171875, 1.2755126953125, 1.39215087890625, 1.5087890625, 1.62542724609375, 1.7420654296875, 1.85870361328125, 1.975341796875, 2.09197998046875, 2.2086181640625, 2.32525634765625, 2.44189453125, 2.55853271484375, 2.6751708984375, 2.79180908203125, 2.908447265625, 3.02508544921875, 3.1417236328125, 3.25836181640625, 3.375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 9.0, 20.0, 25.0, 32.0, 43.0, 63.0, 115.0, 155.0, 227.0, 309.0, 528.0, 805.0, 1330.0, 2078.0, 3358.0, 5349.0, 8659.0, 13979.0, 22794.0, 37245.0, 62672.0, 113493.0, 280613.0, 243714.0, 102683.0, 57764.0, 34673.0, 21025.0, 13150.0, 8210.0, 4954.0, 3078.0, 1933.0, 1244.0, 771.0, 459.0, 334.0, 213.0, 131.0, 94.0, 59.0, 47.0, 24.0, 26.0, 25.0, 14.0, 8.0, 6.0, 7.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.018951416015625, -0.01839280128479004, -0.017834186553955078, -0.017275571823120117, -0.016716957092285156, -0.016158342361450195, -0.015599727630615234, -0.015041112899780273, -0.014482498168945312, -0.013923883438110352, -0.01336526870727539, -0.01280665397644043, -0.012248039245605469, -0.011689424514770508, -0.011130809783935547, -0.010572195053100586, -0.010013580322265625, -0.009454965591430664, -0.008896350860595703, -0.008337736129760742, -0.007779121398925781, -0.00722050666809082, -0.006661891937255859, -0.0061032772064208984, -0.0055446624755859375, -0.0049860477447509766, -0.004427433013916016, -0.0038688182830810547, -0.0033102035522460938, -0.002751588821411133, -0.002192974090576172, -0.001634359359741211, -0.00107574462890625, -0.0005171298980712891, 4.1484832763671875e-05, 0.0006000995635986328, 0.0011587142944335938, 0.0017173290252685547, 0.0022759437561035156, 0.0028345584869384766, 0.0033931732177734375, 0.0039517879486083984, 0.004510402679443359, 0.00506901741027832, 0.005627632141113281, 0.006186246871948242, 0.006744861602783203, 0.007303476333618164, 0.007862091064453125, 0.008420705795288086, 0.008979320526123047, 0.009537935256958008, 0.010096549987792969, 0.01065516471862793, 0.01121377944946289, 0.011772394180297852, 0.012331008911132812, 0.012889623641967773, 0.013448238372802734, 0.014006853103637695, 0.014565467834472656, 0.015124082565307617, 0.015682697296142578, 0.01624131202697754, 0.0167999267578125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 6.0, 0.0, 6.0, 6.0, 9.0, 8.0, 14.0, 17.0, 16.0, 21.0, 28.0, 26.0, 30.0, 38.0, 37.0, 36.0, 37.0, 50.0, 45.0, 50.0, 1075.0, 38.0, 47.0, 47.0, 35.0, 37.0, 31.0, 39.0, 32.0, 22.0, 21.0, 19.0, 14.0, 22.0, 13.0, 9.0, 7.0, 10.0, 8.0, 7.0, 4.0, 3.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9892578125, -1.9214935302734375, -1.853729248046875, -1.7859649658203125, -1.71820068359375, -1.6504364013671875, -1.582672119140625, -1.5149078369140625, -1.4471435546875, -1.3793792724609375, -1.311614990234375, -1.2438507080078125, -1.17608642578125, -1.1083221435546875, -1.040557861328125, -0.9727935791015625, -0.905029296875, -0.8372650146484375, -0.769500732421875, -0.7017364501953125, -0.63397216796875, -0.5662078857421875, -0.498443603515625, -0.4306793212890625, -0.3629150390625, -0.2951507568359375, -0.227386474609375, -0.1596221923828125, -0.09185791015625, -0.0240936279296875, 0.043670654296875, 0.1114349365234375, 0.17919921875, 0.2469635009765625, 0.314727783203125, 0.3824920654296875, 0.45025634765625, 0.5180206298828125, 0.585784912109375, 0.6535491943359375, 0.7213134765625, 0.7890777587890625, 0.856842041015625, 0.9246063232421875, 0.99237060546875, 1.0601348876953125, 1.127899169921875, 1.1956634521484375, 1.263427734375, 1.3311920166015625, 1.398956298828125, 1.4667205810546875, 1.53448486328125, 1.6022491455078125, 1.670013427734375, 1.7377777099609375, 1.8055419921875, 1.8733062744140625, 1.941070556640625, 2.0088348388671875, 2.07659912109375, 2.1443634033203125, 2.212127685546875, 2.2798919677734375, 2.34765625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 11.0, 15.0, 32.0, 26.0, 50.0, 64.0, 109.0, 218.0, 326.0, 480.0, 742.0, 1237.0, 2025.0, 3129.0, 5036.0, 8290.0, 13582.0, 22869.0, 39567.0, 71621.0, 148211.0, 1388718.0, 192988.0, 84839.0, 46151.0, 26424.0, 15471.0, 9598.0, 5488.0, 3618.0, 2255.0, 1408.0, 908.0, 594.0, 367.0, 239.0, 168.0, 107.0, 44.0, 31.0, 26.0, 17.0, 15.0, 8.0, 9.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.014434814453125, -0.014005661010742188, -0.013576507568359375, -0.013147354125976562, -0.01271820068359375, -0.012289047241210938, -0.011859893798828125, -0.011430740356445312, -0.0110015869140625, -0.010572433471679688, -0.010143280029296875, -0.009714126586914062, -0.00928497314453125, -0.008855819702148438, -0.008426666259765625, -0.007997512817382812, -0.007568359375, -0.0071392059326171875, -0.006710052490234375, -0.0062808990478515625, -0.00585174560546875, -0.0054225921630859375, -0.004993438720703125, -0.0045642852783203125, -0.0041351318359375, -0.0037059783935546875, -0.003276824951171875, -0.0028476715087890625, -0.00241851806640625, -0.0019893646240234375, -0.001560211181640625, -0.0011310577392578125, -0.000701904296875, -0.0002727508544921875, 0.000156402587890625, 0.0005855560302734375, 0.00101470947265625, 0.0014438629150390625, 0.001873016357421875, 0.0023021697998046875, 0.0027313232421875, 0.0031604766845703125, 0.003589630126953125, 0.0040187835693359375, 0.00444793701171875, 0.0048770904541015625, 0.005306243896484375, 0.0057353973388671875, 0.00616455078125, 0.0065937042236328125, 0.007022857666015625, 0.0074520111083984375, 0.00788116455078125, 0.008310317993164062, 0.008739471435546875, 0.009168624877929688, 0.0095977783203125, 0.010026931762695312, 0.010456085205078125, 0.010885238647460938, 0.01131439208984375, 0.011743545532226562, 0.012172698974609375, 0.012601852416992188, 0.013031005859375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 815.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-07, -1.73225998878479e-07, -1.6763806343078613e-07, -1.6205012798309326e-07, -1.564621925354004e-07, -1.5087425708770752e-07, -1.4528632164001465e-07, -1.3969838619232178e-07, -1.341104507446289e-07, -1.2852251529693604e-07, -1.2293457984924316e-07, -1.1734664440155029e-07, -1.1175870895385742e-07, -1.0617077350616455e-07, -1.0058283805847168e-07, -9.499490261077881e-08, -8.940696716308594e-08, -8.381903171539307e-08, -7.82310962677002e-08, -7.264316082000732e-08, -6.705522537231445e-08, -6.146728992462158e-08, -5.587935447692871e-08, -5.029141902923584e-08, -4.470348358154297e-08, -3.91155481338501e-08, -3.3527612686157227e-08, -2.7939677238464355e-08, -2.2351741790771484e-08, -1.6763806343078613e-08, -1.1175870895385742e-08, -5.587935447692871e-09, 0.0, 5.587935447692871e-09, 1.1175870895385742e-08, 1.6763806343078613e-08, 2.2351741790771484e-08, 2.7939677238464355e-08, 3.3527612686157227e-08, 3.91155481338501e-08, 4.470348358154297e-08, 5.029141902923584e-08, 5.587935447692871e-08, 6.146728992462158e-08, 6.705522537231445e-08, 7.264316082000732e-08, 7.82310962677002e-08, 8.381903171539307e-08, 8.940696716308594e-08, 9.499490261077881e-08, 1.0058283805847168e-07, 1.0617077350616455e-07, 1.1175870895385742e-07, 1.1734664440155029e-07, 1.2293457984924316e-07, 1.2852251529693604e-07, 1.341104507446289e-07, 1.3969838619232178e-07, 1.4528632164001465e-07, 1.5087425708770752e-07, 1.564621925354004e-07, 1.6205012798309326e-07, 1.6763806343078613e-07, 1.73225998878479e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 13.0, 44.0, 15.0, 23.0, 10.0, 0.0, 7.0, 41.0, 67.0, 65.0, 257.0, 4954.0, 991059.0, 51461.0, 257.0, 48.0, 75.0, 41.0, 4.0, 2.0, 6.0, 21.0, 21.0, 37.0, 16.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.874301910400391e-06, -3.7513673305511475e-06, -3.6284327507019043e-06, -3.505498170852661e-06, -3.382563591003418e-06, -3.259629011154175e-06, -3.1366944313049316e-06, -3.0137598514556885e-06, -2.8908252716064453e-06, -2.767890691757202e-06, -2.644956111907959e-06, -2.522021532058716e-06, -2.3990869522094727e-06, -2.2761523723602295e-06, -2.1532177925109863e-06, -2.030283212661743e-06, -1.9073486328125e-06, -1.7844140529632568e-06, -1.6614794731140137e-06, -1.5385448932647705e-06, -1.4156103134155273e-06, -1.2926757335662842e-06, -1.169741153717041e-06, -1.0468065738677979e-06, -9.238719940185547e-07, -8.009374141693115e-07, -6.780028343200684e-07, -5.550682544708252e-07, -4.3213367462158203e-07, -3.0919909477233887e-07, -1.862645149230957e-07, -6.332993507385254e-08, 5.960464477539063e-08, 1.825392246246338e-07, 3.0547380447387695e-07, 4.284083843231201e-07, 5.513429641723633e-07, 6.742775440216064e-07, 7.972121238708496e-07, 9.201467037200928e-07, 1.043081283569336e-06, 1.166015863418579e-06, 1.2889504432678223e-06, 1.4118850231170654e-06, 1.5348196029663086e-06, 1.6577541828155518e-06, 1.780688762664795e-06, 1.903623342514038e-06, 2.0265579223632812e-06, 2.1494925022125244e-06, 2.2724270820617676e-06, 2.3953616619110107e-06, 2.518296241760254e-06, 2.641230821609497e-06, 2.7641654014587402e-06, 2.8870999813079834e-06, 3.0100345611572266e-06, 3.1329691410064697e-06, 3.255903720855713e-06, 3.378838300704956e-06, 3.5017728805541992e-06, 3.6247074604034424e-06, 3.7476420402526855e-06, 3.870576620101929e-06, 3.993511199951172e-06]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1022.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.357754773172019e-08, -5.245936307574084e-08, -5.134118197247517e-08, -5.022299731649582e-08, -4.910481266051647e-08, -4.7986628004537124e-08, -4.6868446901271454e-08, -4.5750262245292106e-08, -4.463207758931276e-08, -4.351389293333341e-08, -4.239571183006774e-08, -4.127752717408839e-08, -4.015934251810904e-08, -3.9041157862129694e-08, -3.7922976758864024e-08, -3.6804792102884676e-08, -3.5686610999619006e-08, -3.456842634363966e-08, -3.345024524037399e-08, -3.233206058439464e-08, -3.121387592841529e-08, -3.009569127243594e-08, -2.8977510169170273e-08, -2.7859325513190925e-08, -2.6741140857211576e-08, -2.5622957977589067e-08, -2.450477332160972e-08, -2.338659044198721e-08, -2.226840578600786e-08, -2.1150222906385352e-08, -2.0032040026762843e-08, -1.8913855370783494e-08, -1.7795668938447307e-08, -1.6677486058824798e-08, -1.555930140284545e-08, -1.444111852322294e-08, -1.3322933867243592e-08, -1.2204750987621082e-08, -1.1086567219820154e-08, -9.968383452019225e-09, -8.850199684218296e-09, -7.732015916417367e-09, -6.613832148616439e-09, -5.49564882490472e-09, -4.377465057103791e-09, -3.259281289302862e-09, -2.1410979655911433e-09, -1.0229141977902145e-09, 9.526957001071423e-11, 1.2134532267893405e-09, 2.331636883567967e-09, 3.4498204293242907e-09, 4.5680041971252194e-09, 5.686187964926148e-09, 6.804371288637867e-09, 7.922555056438796e-09, 9.040738824239725e-09, 1.0158922592040653e-08, 1.1277106359841582e-08, 1.2395290127642511e-08, 1.351347300726502e-08, 1.4631657663244368e-08, 1.5749840542866878e-08, 1.6868025198846226e-08, 1.7986208078468735e-08]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1022.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [0.0, 9.313225746154785e-10, 1.862645149230957e-09, 2.7939677238464355e-09, 3.725290298461914e-09, 4.6566128730773926e-09, 5.587935447692871e-09, 6.51925802230835e-09, 7.450580596923828e-09, 8.381903171539307e-09, 9.313225746154785e-09, 1.0244548320770264e-08, 1.1175870895385742e-08, 1.210719347000122e-08, 1.30385160446167e-08, 1.3969838619232178e-08, 1.4901161193847656e-08, 1.5832483768463135e-08, 1.6763806343078613e-08, 1.7695128917694092e-08, 1.862645149230957e-08, 1.955777406692505e-08, 2.0489096641540527e-08, 2.1420419216156006e-08, 2.2351741790771484e-08, 2.3283064365386963e-08, 2.421438694000244e-08, 2.514570951461792e-08, 2.60770320892334e-08, 2.7008354663848877e-08, 2.7939677238464355e-08, 2.8870999813079834e-08, 2.9802322387695312e-08, 3.073364496231079e-08, 3.166496753692627e-08, 3.259629011154175e-08, 3.3527612686157227e-08, 3.4458935260772705e-08, 3.5390257835388184e-08, 3.632158041000366e-08, 3.725290298461914e-08, 3.818422555923462e-08, 3.91155481338501e-08, 4.0046870708465576e-08, 4.0978193283081055e-08, 4.190951585769653e-08, 4.284083843231201e-08, 4.377216100692749e-08, 4.470348358154297e-08, 4.563480615615845e-08, 4.6566128730773926e-08, 4.7497451305389404e-08, 4.842877388000488e-08, 4.936009645462036e-08, 5.029141902923584e-08, 5.122274160385132e-08, 5.21540641784668e-08, 5.3085386753082275e-08, 5.4016709327697754e-08, 5.494803190231323e-08, 5.587935447692871e-08, 5.681067705154419e-08, 5.774199962615967e-08, 5.8673322200775146e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 11.0, 11.0, 7.0, 21.0, 12.0, 24.0, 45.0, 32.0, 25.0, 39.0, 42.0, 33.0, 35.0, 41.0, 58.0, 58.0, 55.0, 43.0, 42.0, 45.0, 45.0, 45.0, 37.0, 29.0, 28.0, 23.0, 23.0, 19.0, 19.0, 12.0, 15.0, 6.0, 8.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.08984375, -3.97320556640625, -3.8565673828125, -3.73992919921875, -3.623291015625, -3.50665283203125, -3.3900146484375, -3.27337646484375, -3.15673828125, -3.04010009765625, -2.9234619140625, -2.80682373046875, -2.690185546875, -2.57354736328125, -2.4569091796875, -2.34027099609375, -2.2236328125, -2.10699462890625, -1.9903564453125, -1.87371826171875, -1.757080078125, -1.64044189453125, -1.5238037109375, -1.40716552734375, -1.29052734375, -1.17388916015625, -1.0572509765625, -0.94061279296875, -0.823974609375, -0.70733642578125, -0.5906982421875, -0.47406005859375, -0.357421875, -0.24078369140625, -0.1241455078125, -0.00750732421875, 0.109130859375, 0.22576904296875, 0.3424072265625, 0.45904541015625, 0.57568359375, 0.69232177734375, 0.8089599609375, 0.92559814453125, 1.042236328125, 1.15887451171875, 1.2755126953125, 1.39215087890625, 1.5087890625, 1.62542724609375, 1.7420654296875, 1.85870361328125, 1.975341796875, 2.09197998046875, 2.2086181640625, 2.32525634765625, 2.44189453125, 2.55853271484375, 2.6751708984375, 2.79180908203125, 2.908447265625, 3.02508544921875, 3.1417236328125, 3.25836181640625, 3.375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 10.0, 22.0, 27.0, 48.0, 47.0, 89.0, 134.0, 244.0, 343.0, 551.0, 834.0, 1221.0, 1916.0, 2766.0, 4489.0, 6857.0, 10968.0, 18066.0, 29198.0, 50138.0, 92572.0, 191853.0, 287498.0, 157782.0, 78270.0, 43655.0, 25924.0, 15704.0, 9562.0, 6251.0, 4081.0, 2633.0, 1638.0, 1104.0, 695.0, 457.0, 324.0, 207.0, 116.0, 101.0, 57.0, 34.0, 19.0, 16.0, 9.0, 8.0, 5.0, 6.0, 2.0, 5.0, 0.0, 1.0], "bins": [-2.546875, -2.4727783203125, -2.398681640625, -2.3245849609375, -2.25048828125, -2.1763916015625, -2.102294921875, -2.0281982421875, -1.9541015625, -1.8800048828125, -1.805908203125, -1.7318115234375, -1.65771484375, -1.5836181640625, -1.509521484375, -1.4354248046875, -1.361328125, -1.2872314453125, -1.213134765625, -1.1390380859375, -1.06494140625, -0.9908447265625, -0.916748046875, -0.8426513671875, -0.7685546875, -0.6944580078125, -0.620361328125, -0.5462646484375, -0.47216796875, -0.3980712890625, -0.323974609375, -0.2498779296875, -0.17578125, -0.1016845703125, -0.027587890625, 0.0465087890625, 0.12060546875, 0.1947021484375, 0.268798828125, 0.3428955078125, 0.4169921875, 0.4910888671875, 0.565185546875, 0.6392822265625, 0.71337890625, 0.7874755859375, 0.861572265625, 0.9356689453125, 1.009765625, 1.0838623046875, 1.157958984375, 1.2320556640625, 1.30615234375, 1.3802490234375, 1.454345703125, 1.5284423828125, 1.6025390625, 1.6766357421875, 1.750732421875, 1.8248291015625, 1.89892578125, 1.9730224609375, 2.047119140625, 2.1212158203125, 2.1953125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 5.0, 3.0, 6.0, 8.0, 6.0, 7.0, 11.0, 5.0, 12.0, 12.0, 10.0, 13.0, 24.0, 25.0, 27.0, 32.0, 23.0, 24.0, 42.0, 35.0, 48.0, 58.0, 141.0, 329.0, 1411.0, 187.0, 85.0, 54.0, 49.0, 41.0, 34.0, 51.0, 28.0, 25.0, 21.0, 23.0, 17.0, 24.0, 24.0, 8.0, 11.0, 15.0, 10.0, 6.0, 6.0, 5.0, 4.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-8.9375, -8.66796875, -8.3984375, -8.12890625, -7.859375, -7.58984375, -7.3203125, -7.05078125, -6.78125, -6.51171875, -6.2421875, -5.97265625, -5.703125, -5.43359375, -5.1640625, -4.89453125, -4.625, -4.35546875, -4.0859375, -3.81640625, -3.546875, -3.27734375, -3.0078125, -2.73828125, -2.46875, -2.19921875, -1.9296875, -1.66015625, -1.390625, -1.12109375, -0.8515625, -0.58203125, -0.3125, -0.04296875, 0.2265625, 0.49609375, 0.765625, 1.03515625, 1.3046875, 1.57421875, 1.84375, 2.11328125, 2.3828125, 2.65234375, 2.921875, 3.19140625, 3.4609375, 3.73046875, 4.0, 4.26953125, 4.5390625, 4.80859375, 5.078125, 5.34765625, 5.6171875, 5.88671875, 6.15625, 6.42578125, 6.6953125, 6.96484375, 7.234375, 7.50390625, 7.7734375, 8.04296875, 8.3125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 7.0, 6.0, 4.0, 13.0, 19.0, 18.0, 13.0, 16.0, 35.0, 30.0, 40.0, 36.0, 71.0, 74.0, 105.0, 165.0, 163.0, 300.0, 528.0, 1841.0, 11717.0, 136702.0, 2772118.0, 202294.0, 15721.0, 2064.0, 548.0, 297.0, 165.0, 120.0, 107.0, 75.0, 69.0, 52.0, 39.0, 24.0, 22.0, 21.0, 11.0, 7.0, 9.0, 9.0, 5.0, 7.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.5078125, -11.1431884765625, -10.778564453125, -10.4139404296875, -10.04931640625, -9.6846923828125, -9.320068359375, -8.9554443359375, -8.5908203125, -8.2261962890625, -7.861572265625, -7.4969482421875, -7.13232421875, -6.7677001953125, -6.403076171875, -6.0384521484375, -5.673828125, -5.3092041015625, -4.944580078125, -4.5799560546875, -4.21533203125, -3.8507080078125, -3.486083984375, -3.1214599609375, -2.7568359375, -2.3922119140625, -2.027587890625, -1.6629638671875, -1.29833984375, -0.9337158203125, -0.569091796875, -0.2044677734375, 0.16015625, 0.5247802734375, 0.889404296875, 1.2540283203125, 1.61865234375, 1.9832763671875, 2.347900390625, 2.7125244140625, 3.0771484375, 3.4417724609375, 3.806396484375, 4.1710205078125, 4.53564453125, 4.9002685546875, 5.264892578125, 5.6295166015625, 5.994140625, 6.3587646484375, 6.723388671875, 7.0880126953125, 7.45263671875, 7.8172607421875, 8.181884765625, 8.5465087890625, 8.9111328125, 9.2757568359375, 9.640380859375, 10.0050048828125, 10.36962890625, 10.7342529296875, 11.098876953125, 11.4635009765625, 11.828125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [197.0, 780.0, 40.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.472397327423096, -1.4493160247802734, 2.573765277862549, 6.596847057342529, 10.619928359985352, 14.643009185791016, 18.666091918945312, 22.689172744750977, 26.71225357055664, 30.735334396362305, 34.75841522216797, 38.781497955322266, 42.80458068847656, 46.827659606933594, 50.85074234008789, 54.87382507324219, 58.89690399169922, 62.919986724853516, 66.94306945800781, 70.96614837646484, 74.98922729492188, 79.01231384277344, 83.03539276123047, 87.0584716796875, 91.08155059814453, 95.10462951660156, 99.12771606445312, 103.15079498291016, 107.17387390136719, 111.19696044921875, 115.22003936767578, 119.24311828613281, 123.26618957519531, 127.28926849365234, 131.31234741210938, 135.33543395996094, 139.3585205078125, 143.381591796875, 147.40467834472656, 151.42776489257812, 155.45083618164062, 159.4739227294922, 163.4969940185547, 167.52008056640625, 171.5431671142578, 175.5662384033203, 179.58932495117188, 183.61241149902344, 187.635498046875, 191.65858459472656, 195.68165588378906, 199.70474243164062, 203.7278289794922, 207.7509002685547, 211.77398681640625, 215.7970733642578, 219.8201446533203, 223.84323120117188, 227.86630249023438, 231.88938903808594, 235.9124755859375, 239.935546875, 243.95863342285156, 247.98171997070312, 252.00479125976562]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 4.0, 7.0, 6.0, 4.0, 6.0, 6.0, 8.0, 8.0, 11.0, 12.0, 13.0, 14.0, 13.0, 24.0, 13.0, 15.0, 29.0, 26.0, 26.0, 25.0, 24.0, 28.0, 29.0, 35.0, 35.0, 26.0, 34.0, 54.0, 42.0, 35.0, 40.0, 24.0, 32.0, 22.0, 36.0, 29.0, 17.0, 21.0, 27.0, 21.0, 19.0, 18.0, 11.0, 16.0, 14.0, 10.0, 7.0, 4.0, 4.0, 8.0, 3.0, 6.0, 2.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-21.229881286621094, -20.539918899536133, -19.84995460510254, -19.159992218017578, -18.470027923583984, -17.780065536499023, -17.090103149414062, -16.40013885498047, -15.710175514221191, -15.020212173461914, -14.330248832702637, -13.64028549194336, -12.950323104858398, -12.260358810424805, -11.570396423339844, -10.880433082580566, -10.190469741821289, -9.500506401062012, -8.810543060302734, -8.120580673217773, -7.430616855621338, -6.7406535148620605, -6.050690650939941, -5.360727310180664, -4.670763969421387, -3.9808006286621094, -3.290837526321411, -2.600874423980713, -1.9109110832214355, -1.2209477424621582, -0.5309848785400391, 0.15897846221923828, 0.8489437103271484, 1.5389069318771362, 2.228870153427124, 2.9188332557678223, 3.6087965965270996, 4.298759937286377, 4.988722801208496, 5.678686141967773, 6.368649482727051, 7.058612823486328, 7.7485761642456055, 8.438539505004883, 9.128501892089844, 9.818466186523438, 10.508428573608398, 11.198391914367676, 11.888355255126953, 12.57831859588623, 13.268281936645508, 13.958244323730469, 14.648208618164062, 15.338171005249023, 16.028133392333984, 16.718097686767578, 17.408061981201172, 18.098024368286133, 18.787988662719727, 19.477951049804688, 20.16791534423828, 20.857877731323242, 21.547840118408203, 22.237804412841797, 22.927766799926758]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 7.0, 2.0, 10.0, 15.0, 14.0, 13.0, 28.0, 26.0, 34.0, 42.0, 27.0, 31.0, 42.0, 34.0, 45.0, 54.0, 46.0, 43.0, 62.0, 39.0, 42.0, 41.0, 43.0, 39.0, 38.0, 24.0, 22.0, 29.0, 21.0, 18.0, 18.0, 11.0, 9.0, 13.0, 6.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.140625, -4.024261474609375, -3.90789794921875, -3.791534423828125, -3.6751708984375, -3.558807373046875, -3.44244384765625, -3.326080322265625, -3.209716796875, -3.093353271484375, -2.97698974609375, -2.860626220703125, -2.7442626953125, -2.627899169921875, -2.51153564453125, -2.395172119140625, -2.27880859375, -2.162445068359375, -2.04608154296875, -1.929718017578125, -1.8133544921875, -1.696990966796875, -1.58062744140625, -1.464263916015625, -1.347900390625, -1.231536865234375, -1.11517333984375, -0.998809814453125, -0.8824462890625, -0.766082763671875, -0.64971923828125, -0.533355712890625, -0.4169921875, -0.300628662109375, -0.18426513671875, -0.067901611328125, 0.0484619140625, 0.164825439453125, 0.28118896484375, 0.397552490234375, 0.513916015625, 0.630279541015625, 0.74664306640625, 0.863006591796875, 0.9793701171875, 1.095733642578125, 1.21209716796875, 1.328460693359375, 1.44482421875, 1.561187744140625, 1.67755126953125, 1.793914794921875, 1.9102783203125, 2.026641845703125, 2.14300537109375, 2.259368896484375, 2.375732421875, 2.492095947265625, 2.60845947265625, 2.724822998046875, 2.8411865234375, 2.957550048828125, 3.07391357421875, 3.190277099609375, 3.306640625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 5.0, 3.0, 1.0, 9.0, 7.0, 9.0, 13.0, 21.0, 20.0, 18.0, 23.0, 33.0, 36.0, 51.0, 96.0, 279.0, 823.0, 3291.0, 15294.0, 99169.0, 1134971.0, 2634752.0, 263464.0, 32956.0, 6483.0, 1566.0, 453.0, 152.0, 69.0, 56.0, 33.0, 20.0, 22.0, 14.0, 13.0, 12.0, 15.0, 13.0, 3.0, 7.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.125, -7.846923828125, -7.56884765625, -7.290771484375, -7.0126953125, -6.734619140625, -6.45654296875, -6.178466796875, -5.900390625, -5.622314453125, -5.34423828125, -5.066162109375, -4.7880859375, -4.510009765625, -4.23193359375, -3.953857421875, -3.67578125, -3.397705078125, -3.11962890625, -2.841552734375, -2.5634765625, -2.285400390625, -2.00732421875, -1.729248046875, -1.451171875, -1.173095703125, -0.89501953125, -0.616943359375, -0.3388671875, -0.060791015625, 0.21728515625, 0.495361328125, 0.7734375, 1.051513671875, 1.32958984375, 1.607666015625, 1.8857421875, 2.163818359375, 2.44189453125, 2.719970703125, 2.998046875, 3.276123046875, 3.55419921875, 3.832275390625, 4.1103515625, 4.388427734375, 4.66650390625, 4.944580078125, 5.22265625, 5.500732421875, 5.77880859375, 6.056884765625, 6.3349609375, 6.613037109375, 6.89111328125, 7.169189453125, 7.447265625, 7.725341796875, 8.00341796875, 8.281494140625, 8.5595703125, 8.837646484375, 9.11572265625, 9.393798828125, 9.671875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 6.0, 13.0, 13.0, 27.0, 32.0, 47.0, 64.0, 94.0, 116.0, 137.0, 235.0, 318.0, 437.0, 540.0, 510.0, 408.0, 306.0, 212.0, 145.0, 110.0, 84.0, 59.0, 37.0, 27.0, 28.0, 25.0, 5.0, 7.0, 13.0, 2.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.0078125, -6.8123779296875, -6.616943359375, -6.4215087890625, -6.22607421875, -6.0306396484375, -5.835205078125, -5.6397705078125, -5.4443359375, -5.2489013671875, -5.053466796875, -4.8580322265625, -4.66259765625, -4.4671630859375, -4.271728515625, -4.0762939453125, -3.880859375, -3.6854248046875, -3.489990234375, -3.2945556640625, -3.09912109375, -2.9036865234375, -2.708251953125, -2.5128173828125, -2.3173828125, -2.1219482421875, -1.926513671875, -1.7310791015625, -1.53564453125, -1.3402099609375, -1.144775390625, -0.9493408203125, -0.75390625, -0.5584716796875, -0.363037109375, -0.1676025390625, 0.02783203125, 0.2232666015625, 0.418701171875, 0.6141357421875, 0.8095703125, 1.0050048828125, 1.200439453125, 1.3958740234375, 1.59130859375, 1.7867431640625, 1.982177734375, 2.1776123046875, 2.373046875, 2.5684814453125, 2.763916015625, 2.9593505859375, 3.15478515625, 3.3502197265625, 3.545654296875, 3.7410888671875, 3.9365234375, 4.1319580078125, 4.327392578125, 4.5228271484375, 4.71826171875, 4.9136962890625, 5.109130859375, 5.3045654296875, 5.5]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 2.0, 5.0, 6.0, 7.0, 8.0, 21.0, 10.0, 25.0, 35.0, 42.0, 51.0, 65.0, 86.0, 127.0, 191.0, 199.0, 357.0, 740.0, 4168.0, 86896.0, 3520138.0, 564348.0, 13923.0, 1397.0, 468.0, 265.0, 181.0, 125.0, 105.0, 98.0, 55.0, 39.0, 38.0, 14.0, 20.0, 9.0, 11.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.875, -18.218017578125, -17.56103515625, -16.904052734375, -16.2470703125, -15.590087890625, -14.93310546875, -14.276123046875, -13.619140625, -12.962158203125, -12.30517578125, -11.648193359375, -10.9912109375, -10.334228515625, -9.67724609375, -9.020263671875, -8.36328125, -7.706298828125, -7.04931640625, -6.392333984375, -5.7353515625, -5.078369140625, -4.42138671875, -3.764404296875, -3.107421875, -2.450439453125, -1.79345703125, -1.136474609375, -0.4794921875, 0.177490234375, 0.83447265625, 1.491455078125, 2.1484375, 2.805419921875, 3.46240234375, 4.119384765625, 4.7763671875, 5.433349609375, 6.09033203125, 6.747314453125, 7.404296875, 8.061279296875, 8.71826171875, 9.375244140625, 10.0322265625, 10.689208984375, 11.34619140625, 12.003173828125, 12.66015625, 13.317138671875, 13.97412109375, 14.631103515625, 15.2880859375, 15.945068359375, 16.60205078125, 17.259033203125, 17.916015625, 18.572998046875, 19.22998046875, 19.886962890625, 20.5439453125, 21.200927734375, 21.85791015625, 22.514892578125, 23.171875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 19.0, 28.0, 59.0, 83.0, 116.0, 136.0, 144.0, 138.0, 110.0, 72.0, 49.0, 25.0, 12.0, 9.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.35489273071289, -45.3507080078125, -44.346527099609375, -43.342342376708984, -42.338157653808594, -41.3339729309082, -40.32978820800781, -39.32560729980469, -38.3214225769043, -37.317237854003906, -36.31305694580078, -35.30887222290039, -34.3046875, -33.30050277709961, -32.29631805419922, -31.292137145996094, -30.287952423095703, -29.283767700195312, -28.279584884643555, -27.275402069091797, -26.271217346191406, -25.267032623291016, -24.262849807739258, -23.2586669921875, -22.25448226928711, -21.25029754638672, -20.24611473083496, -19.241931915283203, -18.237747192382812, -17.233562469482422, -16.229379653930664, -15.22519588470459, -14.22100830078125, -13.216824531555176, -12.212640762329102, -11.208456993103027, -10.204273223876953, -9.200089454650879, -8.195905685424805, -7.1917219161987305, -6.187538146972656, -5.183354377746582, -4.179170608520508, -3.1749868392944336, -2.1708030700683594, -1.1666193008422852, -0.16243553161621094, 0.8417482376098633, 1.8459320068359375, 2.8501157760620117, 3.854299545288086, 4.85848331451416, 5.862667083740234, 6.866850852966309, 7.871034622192383, 8.875218391418457, 9.879402160644531, 10.883585929870605, 11.88776969909668, 12.891953468322754, 13.896137237548828, 14.900321006774902, 15.904504776000977, 16.908687591552734, 17.912872314453125]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 2.0, 3.0, 4.0, 6.0, 10.0, 9.0, 11.0, 15.0, 19.0, 24.0, 22.0, 29.0, 21.0, 38.0, 39.0, 26.0, 33.0, 44.0, 39.0, 42.0, 50.0, 43.0, 36.0, 41.0, 38.0, 35.0, 28.0, 35.0, 43.0, 19.0, 26.0, 27.0, 20.0, 22.0, 14.0, 21.0, 17.0, 16.0, 7.0, 10.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.529922485351562, -18.9344539642334, -18.338987350463867, -17.743518829345703, -17.148052215576172, -16.552583694458008, -15.957115173339844, -15.361647605895996, -14.766180038452148, -14.1707124710083, -13.575244903564453, -12.979776382446289, -12.384308815002441, -11.788841247558594, -11.19337272644043, -10.597905158996582, -10.002437591552734, -9.406970024108887, -8.811502456665039, -8.216033935546875, -7.620566368103027, -7.02509880065918, -6.429630756378174, -5.834162712097168, -5.23869514465332, -4.643227577209473, -4.047759532928467, -3.45229172706604, -2.8568239212036133, -2.2613561153411865, -1.6658883094787598, -1.070420265197754, -0.47495269775390625, 0.12051510810852051, 0.7159829139709473, 1.311450719833374, 1.9069185256958008, 2.5023863315582275, 3.0978541374206543, 3.69332218170166, 4.288789749145508, 4.8842573165893555, 5.479725360870361, 6.075193405151367, 6.670660972595215, 7.2661285400390625, 7.861596584320068, 8.457064628601074, 9.052532196044922, 9.64799976348877, 10.243467330932617, 10.838935852050781, 11.434403419494629, 12.029870986938477, 12.62533950805664, 13.220807075500488, 13.816274642944336, 14.411742210388184, 15.007209777832031, 15.602678298950195, 16.19814682006836, 16.79361343383789, 17.389081954956055, 17.98455047607422, 18.58001708984375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 10.0, 10.0, 15.0, 12.0, 17.0, 20.0, 29.0, 30.0, 29.0, 31.0, 41.0, 39.0, 42.0, 51.0, 51.0, 45.0, 43.0, 43.0, 40.0, 52.0, 45.0, 44.0, 34.0, 33.0, 31.0, 28.0, 18.0, 17.0, 18.0, 17.0, 14.0, 8.0, 12.0, 10.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.41796875, -4.300048828125, -4.18212890625, -4.064208984375, -3.9462890625, -3.828369140625, -3.71044921875, -3.592529296875, -3.474609375, -3.356689453125, -3.23876953125, -3.120849609375, -3.0029296875, -2.885009765625, -2.76708984375, -2.649169921875, -2.53125, -2.413330078125, -2.29541015625, -2.177490234375, -2.0595703125, -1.941650390625, -1.82373046875, -1.705810546875, -1.587890625, -1.469970703125, -1.35205078125, -1.234130859375, -1.1162109375, -0.998291015625, -0.88037109375, -0.762451171875, -0.64453125, -0.526611328125, -0.40869140625, -0.290771484375, -0.1728515625, -0.054931640625, 0.06298828125, 0.180908203125, 0.298828125, 0.416748046875, 0.53466796875, 0.652587890625, 0.7705078125, 0.888427734375, 1.00634765625, 1.124267578125, 1.2421875, 1.360107421875, 1.47802734375, 1.595947265625, 1.7138671875, 1.831787109375, 1.94970703125, 2.067626953125, 2.185546875, 2.303466796875, 2.42138671875, 2.539306640625, 2.6572265625, 2.775146484375, 2.89306640625, 3.010986328125, 3.12890625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 6.0, 10.0, 12.0, 23.0, 29.0, 56.0, 69.0, 90.0, 169.0, 248.0, 396.0, 578.0, 963.0, 1432.0, 2373.0, 3590.0, 5747.0, 9156.0, 14667.0, 24134.0, 39981.0, 69366.0, 134177.0, 312686.0, 202415.0, 93838.0, 51823.0, 30774.0, 18649.0, 11419.0, 7153.0, 4603.0, 2862.0, 1819.0, 1121.0, 756.0, 464.0, 330.0, 188.0, 135.0, 86.0, 55.0, 31.0, 30.0, 15.0, 13.0, 5.0, 8.0, 4.0, 1.0, 3.0, 0.0, 1.0, 4.0], "bins": [-0.020111083984375, -0.019515037536621094, -0.018918991088867188, -0.01832294464111328, -0.017726898193359375, -0.01713085174560547, -0.016534805297851562, -0.015938758850097656, -0.01534271240234375, -0.014746665954589844, -0.014150619506835938, -0.013554573059082031, -0.012958526611328125, -0.012362480163574219, -0.011766433715820312, -0.011170387268066406, -0.0105743408203125, -0.009978294372558594, -0.009382247924804688, -0.008786201477050781, -0.008190155029296875, -0.007594108581542969, -0.0069980621337890625, -0.006402015686035156, -0.00580596923828125, -0.005209922790527344, -0.0046138763427734375, -0.004017829895019531, -0.003421783447265625, -0.0028257369995117188, -0.0022296905517578125, -0.0016336441040039062, -0.00103759765625, -0.00044155120849609375, 0.0001544952392578125, 0.0007505416870117188, 0.001346588134765625, 0.0019426345825195312, 0.0025386810302734375, 0.0031347274780273438, 0.00373077392578125, 0.004326820373535156, 0.0049228668212890625, 0.005518913269042969, 0.006114959716796875, 0.006711006164550781, 0.0073070526123046875, 0.007903099060058594, 0.0084991455078125, 0.009095191955566406, 0.009691238403320312, 0.010287284851074219, 0.010883331298828125, 0.011479377746582031, 0.012075424194335938, 0.012671470642089844, 0.01326751708984375, 0.013863563537597656, 0.014459609985351562, 0.015055656433105469, 0.015651702880859375, 0.01624774932861328, 0.016843795776367188, 0.017439842224121094, 0.018035888671875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 11.0, 4.0, 9.0, 5.0, 2.0, 7.0, 11.0, 16.0, 24.0, 20.0, 31.0, 23.0, 26.0, 37.0, 33.0, 59.0, 41.0, 49.0, 40.0, 48.0, 1067.0, 45.0, 29.0, 48.0, 49.0, 34.0, 47.0, 30.0, 25.0, 32.0, 28.0, 18.0, 12.0, 13.0, 13.0, 14.0, 9.0, 8.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.23828125, -2.16455078125, -2.0908203125, -2.01708984375, -1.943359375, -1.86962890625, -1.7958984375, -1.72216796875, -1.6484375, -1.57470703125, -1.5009765625, -1.42724609375, -1.353515625, -1.27978515625, -1.2060546875, -1.13232421875, -1.05859375, -0.98486328125, -0.9111328125, -0.83740234375, -0.763671875, -0.68994140625, -0.6162109375, -0.54248046875, -0.46875, -0.39501953125, -0.3212890625, -0.24755859375, -0.173828125, -0.10009765625, -0.0263671875, 0.04736328125, 0.12109375, 0.19482421875, 0.2685546875, 0.34228515625, 0.416015625, 0.48974609375, 0.5634765625, 0.63720703125, 0.7109375, 0.78466796875, 0.8583984375, 0.93212890625, 1.005859375, 1.07958984375, 1.1533203125, 1.22705078125, 1.30078125, 1.37451171875, 1.4482421875, 1.52197265625, 1.595703125, 1.66943359375, 1.7431640625, 1.81689453125, 1.890625, 1.96435546875, 2.0380859375, 2.11181640625, 2.185546875, 2.25927734375, 2.3330078125, 2.40673828125, 2.48046875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 11.0, 15.0, 34.0, 49.0, 59.0, 98.0, 109.0, 191.0, 305.0, 456.0, 638.0, 1001.0, 1557.0, 2583.0, 3988.0, 6580.0, 10695.0, 18159.0, 31321.0, 55978.0, 106821.0, 251026.0, 1336967.0, 121379.0, 61876.0, 34422.0, 19891.0, 11864.0, 6995.0, 4352.0, 2743.0, 1705.0, 1141.0, 712.0, 483.0, 306.0, 181.0, 128.0, 79.0, 56.0, 46.0, 46.0, 29.0, 17.0, 11.0, 7.0, 7.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.0148773193359375, -0.014427661895751953, -0.013978004455566406, -0.01352834701538086, -0.013078689575195312, -0.012629032135009766, -0.012179374694824219, -0.011729717254638672, -0.011280059814453125, -0.010830402374267578, -0.010380744934082031, -0.009931087493896484, -0.009481430053710938, -0.00903177261352539, -0.008582115173339844, -0.008132457733154297, -0.00768280029296875, -0.007233142852783203, -0.006783485412597656, -0.006333827972412109, -0.0058841705322265625, -0.005434513092041016, -0.004984855651855469, -0.004535198211669922, -0.004085540771484375, -0.003635883331298828, -0.0031862258911132812, -0.0027365684509277344, -0.0022869110107421875, -0.0018372535705566406, -0.0013875961303710938, -0.0009379386901855469, -0.00048828125, -3.8623809814453125e-05, 0.00041103363037109375, 0.0008606910705566406, 0.0013103485107421875, 0.0017600059509277344, 0.0022096633911132812, 0.002659320831298828, 0.003108978271484375, 0.003558635711669922, 0.004008293151855469, 0.004457950592041016, 0.0049076080322265625, 0.005357265472412109, 0.005806922912597656, 0.006256580352783203, 0.00670623779296875, 0.007155895233154297, 0.007605552673339844, 0.00805521011352539, 0.008504867553710938, 0.008954524993896484, 0.009404182434082031, 0.009853839874267578, 0.010303497314453125, 0.010753154754638672, 0.011202812194824219, 0.011652469635009766, 0.012102127075195312, 0.01255178451538086, 0.013001441955566406, 0.013451099395751953, 0.0139007568359375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 109.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 776.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 105.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0], "bins": [-1.7881393432617188e-07, -1.7415732145309448e-07, -1.695007085800171e-07, -1.648440957069397e-07, -1.601874828338623e-07, -1.555308699607849e-07, -1.5087425708770752e-07, -1.4621764421463013e-07, -1.4156103134155273e-07, -1.3690441846847534e-07, -1.3224780559539795e-07, -1.2759119272232056e-07, -1.2293457984924316e-07, -1.1827796697616577e-07, -1.1362135410308838e-07, -1.0896474123001099e-07, -1.043081283569336e-07, -9.96515154838562e-08, -9.499490261077881e-08, -9.033828973770142e-08, -8.568167686462402e-08, -8.102506399154663e-08, -7.636845111846924e-08, -7.171183824539185e-08, -6.705522537231445e-08, -6.239861249923706e-08, -5.774199962615967e-08, -5.3085386753082275e-08, -4.842877388000488e-08, -4.377216100692749e-08, -3.91155481338501e-08, -3.4458935260772705e-08, -2.9802322387695312e-08, -2.514570951461792e-08, -2.0489096641540527e-08, -1.5832483768463135e-08, -1.1175870895385742e-08, -6.51925802230835e-09, -1.862645149230957e-09, 2.7939677238464355e-09, 7.450580596923828e-09, 1.210719347000122e-08, 1.6763806343078613e-08, 2.1420419216156006e-08, 2.60770320892334e-08, 3.073364496231079e-08, 3.5390257835388184e-08, 4.0046870708465576e-08, 4.470348358154297e-08, 4.936009645462036e-08, 5.4016709327697754e-08, 5.8673322200775146e-08, 6.332993507385254e-08, 6.798654794692993e-08, 7.264316082000732e-08, 7.729977369308472e-08, 8.195638656616211e-08, 8.66129994392395e-08, 9.12696123123169e-08, 9.592622518539429e-08, 1.0058283805847168e-07, 1.0523945093154907e-07, 1.0989606380462646e-07, 1.1455267667770386e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 35.0, 44.0, 27.0, 6.0, 2.0, 0.0, 1.0, 85.0, 51.0, 89.0, 307.0, 4777.0, 986377.0, 55593.0, 464.0, 312.0, 93.0, 54.0, 82.0, 7.0, 0.0, 1.0, 21.0, 14.0, 31.0, 47.0, 11.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9206275939941406e-06, -2.8079375624656677e-06, -2.695247530937195e-06, -2.582557499408722e-06, -2.469867467880249e-06, -2.357177436351776e-06, -2.2444874048233032e-06, -2.1317973732948303e-06, -2.0191073417663574e-06, -1.9064173102378845e-06, -1.7937272787094116e-06, -1.6810372471809387e-06, -1.5683472156524658e-06, -1.455657184123993e-06, -1.34296715259552e-06, -1.2302771210670471e-06, -1.1175870895385742e-06, -1.0048970580101013e-06, -8.922070264816284e-07, -7.795169949531555e-07, -6.668269634246826e-07, -5.541369318962097e-07, -4.414469003677368e-07, -3.287568688392639e-07, -2.1606683731079102e-07, -1.0337680578231812e-07, 9.313225746154785e-09, 1.2200325727462769e-07, 2.3469328880310059e-07, 3.473833203315735e-07, 4.600733518600464e-07, 5.727633833885193e-07, 6.854534149169922e-07, 7.981434464454651e-07, 9.10833477973938e-07, 1.0235235095024109e-06, 1.1362135410308838e-06, 1.2489035725593567e-06, 1.3615936040878296e-06, 1.4742836356163025e-06, 1.5869736671447754e-06, 1.6996636986732483e-06, 1.8123537302017212e-06, 1.925043761730194e-06, 2.037733793258667e-06, 2.15042382478714e-06, 2.263113856315613e-06, 2.3758038878440857e-06, 2.4884939193725586e-06, 2.6011839509010315e-06, 2.7138739824295044e-06, 2.8265640139579773e-06, 2.93925404548645e-06, 3.051944077014923e-06, 3.164634108543396e-06, 3.277324140071869e-06, 3.390014171600342e-06, 3.5027042031288147e-06, 3.6153942346572876e-06, 3.7280842661857605e-06, 3.840774297714233e-06, 3.953464329242706e-06, 4.066154360771179e-06, 4.178844392299652e-06, 4.291534423828125e-06]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 10.0, 10.0, 15.0, 12.0, 17.0, 20.0, 29.0, 30.0, 29.0, 31.0, 41.0, 39.0, 42.0, 51.0, 51.0, 45.0, 43.0, 43.0, 40.0, 52.0, 45.0, 44.0, 34.0, 33.0, 31.0, 28.0, 18.0, 17.0, 18.0, 17.0, 14.0, 8.0, 12.0, 10.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.41796875, -4.300048828125, -4.18212890625, -4.064208984375, -3.9462890625, -3.828369140625, -3.71044921875, -3.592529296875, -3.474609375, -3.356689453125, -3.23876953125, -3.120849609375, -3.0029296875, -2.885009765625, -2.76708984375, -2.649169921875, -2.53125, -2.413330078125, -2.29541015625, -2.177490234375, -2.0595703125, -1.941650390625, -1.82373046875, -1.705810546875, -1.587890625, -1.469970703125, -1.35205078125, -1.234130859375, -1.1162109375, -0.998291015625, -0.88037109375, -0.762451171875, -0.64453125, -0.526611328125, -0.40869140625, -0.290771484375, -0.1728515625, -0.054931640625, 0.06298828125, 0.180908203125, 0.298828125, 0.416748046875, 0.53466796875, 0.652587890625, 0.7705078125, 0.888427734375, 1.00634765625, 1.124267578125, 1.2421875, 1.360107421875, 1.47802734375, 1.595947265625, 1.7138671875, 1.831787109375, 1.94970703125, 2.067626953125, 2.185546875, 2.303466796875, 2.42138671875, 2.539306640625, 2.6572265625, 2.775146484375, 2.89306640625, 3.010986328125, 3.12890625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 10.0, 17.0, 15.0, 21.0, 22.0, 48.0, 56.0, 95.0, 139.0, 248.0, 498.0, 1304.0, 3274.0, 8835.0, 25915.0, 96336.0, 645350.0, 203489.0, 41143.0, 13318.0, 4959.0, 1918.0, 724.0, 334.0, 172.0, 86.0, 61.0, 35.0, 28.0, 23.0, 20.0, 9.0, 18.0, 9.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-7.484375, -7.28582763671875, -7.0872802734375, -6.88873291015625, -6.690185546875, -6.49163818359375, -6.2930908203125, -6.09454345703125, -5.89599609375, -5.69744873046875, -5.4989013671875, -5.30035400390625, -5.101806640625, -4.90325927734375, -4.7047119140625, -4.50616455078125, -4.3076171875, -4.10906982421875, -3.9105224609375, -3.71197509765625, -3.513427734375, -3.31488037109375, -3.1163330078125, -2.91778564453125, -2.71923828125, -2.52069091796875, -2.3221435546875, -2.12359619140625, -1.925048828125, -1.72650146484375, -1.5279541015625, -1.32940673828125, -1.130859375, -0.93231201171875, -0.7337646484375, -0.53521728515625, -0.336669921875, -0.13812255859375, 0.0604248046875, 0.25897216796875, 0.45751953125, 0.65606689453125, 0.8546142578125, 1.05316162109375, 1.251708984375, 1.45025634765625, 1.6488037109375, 1.84735107421875, 2.0458984375, 2.24444580078125, 2.4429931640625, 2.64154052734375, 2.840087890625, 3.03863525390625, 3.2371826171875, 3.43572998046875, 3.63427734375, 3.83282470703125, 4.0313720703125, 4.22991943359375, 4.428466796875, 4.62701416015625, 4.8255615234375, 5.02410888671875, 5.22265625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 2.0, 4.0, 5.0, 12.0, 11.0, 19.0, 17.0, 19.0, 30.0, 28.0, 37.0, 32.0, 36.0, 51.0, 52.0, 52.0, 108.0, 453.0, 1536.0, 119.0, 60.0, 69.0, 33.0, 31.0, 39.0, 34.0, 23.0, 21.0, 22.0, 21.0, 9.0, 15.0, 8.0, 16.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.7734375, -11.3946533203125, -11.015869140625, -10.6370849609375, -10.25830078125, -9.8795166015625, -9.500732421875, -9.1219482421875, -8.7431640625, -8.3643798828125, -7.985595703125, -7.6068115234375, -7.22802734375, -6.8492431640625, -6.470458984375, -6.0916748046875, -5.712890625, -5.3341064453125, -4.955322265625, -4.5765380859375, -4.19775390625, -3.8189697265625, -3.440185546875, -3.0614013671875, -2.6826171875, -2.3038330078125, -1.925048828125, -1.5462646484375, -1.16748046875, -0.7886962890625, -0.409912109375, -0.0311279296875, 0.34765625, 0.7264404296875, 1.105224609375, 1.4840087890625, 1.86279296875, 2.2415771484375, 2.620361328125, 2.9991455078125, 3.3779296875, 3.7567138671875, 4.135498046875, 4.5142822265625, 4.89306640625, 5.2718505859375, 5.650634765625, 6.0294189453125, 6.408203125, 6.7869873046875, 7.165771484375, 7.5445556640625, 7.92333984375, 8.3021240234375, 8.680908203125, 9.0596923828125, 9.4384765625, 9.8172607421875, 10.196044921875, 10.5748291015625, 10.95361328125, 11.3323974609375, 11.711181640625, 12.0899658203125, 12.46875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 7.0, 15.0, 7.0, 15.0, 10.0, 20.0, 27.0, 27.0, 44.0, 52.0, 60.0, 89.0, 124.0, 282.0, 830.0, 5757.0, 227039.0, 2892944.0, 15800.0, 1564.0, 358.0, 180.0, 104.0, 91.0, 60.0, 41.0, 28.0, 31.0, 25.0, 16.0, 17.0, 11.0, 9.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-22.875, -22.185791015625, -21.49658203125, -20.807373046875, -20.1181640625, -19.428955078125, -18.73974609375, -18.050537109375, -17.361328125, -16.672119140625, -15.98291015625, -15.293701171875, -14.6044921875, -13.915283203125, -13.22607421875, -12.536865234375, -11.84765625, -11.158447265625, -10.46923828125, -9.780029296875, -9.0908203125, -8.401611328125, -7.71240234375, -7.023193359375, -6.333984375, -5.644775390625, -4.95556640625, -4.266357421875, -3.5771484375, -2.887939453125, -2.19873046875, -1.509521484375, -0.8203125, -0.131103515625, 0.55810546875, 1.247314453125, 1.9365234375, 2.625732421875, 3.31494140625, 4.004150390625, 4.693359375, 5.382568359375, 6.07177734375, 6.760986328125, 7.4501953125, 8.139404296875, 8.82861328125, 9.517822265625, 10.20703125, 10.896240234375, 11.58544921875, 12.274658203125, 12.9638671875, 13.653076171875, 14.34228515625, 15.031494140625, 15.720703125, 16.409912109375, 17.09912109375, 17.788330078125, 18.4775390625, 19.166748046875, 19.85595703125, 20.545166015625, 21.234375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [28.0, 143.0, 432.0, 319.0, 81.0, 14.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.330500602722168, -2.7925734519958496, -1.2546460628509521, 0.2832813262939453, 1.8212084770202637, 3.359135627746582, 4.897063255310059, 6.434989929199219, 7.972917556762695, 9.510845184326172, 11.048771858215332, 12.586699485778809, 14.124626159667969, 15.662553787231445, 17.200481414794922, 18.738407135009766, 20.276336669921875, 21.81426429748535, 23.352191925048828, 24.890117645263672, 26.42804527282715, 27.965972900390625, 29.5039005279541, 31.041828155517578, 32.57975387573242, 34.117679595947266, 35.655609130859375, 37.19353485107422, 38.73146438598633, 40.26939010620117, 41.80731964111328, 43.345245361328125, 44.883174896240234, 46.42110061645508, 47.95903015136719, 49.49695587158203, 51.03488540649414, 52.572811126708984, 54.110740661621094, 55.64866638183594, 57.18659210205078, 58.724517822265625, 60.262447357177734, 61.80037307739258, 63.33830261230469, 64.87622833251953, 66.41415405273438, 67.95207977294922, 69.4900131225586, 71.02793884277344, 72.56586456298828, 74.10379791259766, 75.6417236328125, 77.17964935302734, 78.71757507324219, 80.25550079345703, 81.79342651367188, 83.33135223388672, 84.86927795410156, 86.40721130371094, 87.94513702392578, 89.48306274414062, 91.02098846435547, 92.55891418457031, 94.09684753417969]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 5.0, 16.0, 7.0, 12.0, 13.0, 13.0, 30.0, 34.0, 31.0, 46.0, 43.0, 51.0, 51.0, 46.0, 49.0, 54.0, 49.0, 46.0, 51.0, 45.0, 54.0, 45.0, 34.0, 37.0, 35.0, 26.0, 22.0, 8.0, 12.0, 6.0, 14.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.21537399291992, -39.067710876464844, -37.920047760009766, -36.77238082885742, -35.624717712402344, -34.477054595947266, -33.32939147949219, -32.181724548339844, -31.034061431884766, -29.886398315429688, -28.738733291625977, -27.5910701751709, -26.443405151367188, -25.29574203491211, -24.14807891845703, -23.00041389465332, -21.852750778198242, -20.705087661743164, -19.557422637939453, -18.409759521484375, -17.262094497680664, -16.114431381225586, -14.966767311096191, -13.819103240966797, -12.671439170837402, -11.523775100708008, -10.376111030578613, -9.228446960449219, -8.08078384399414, -6.933119297027588, -5.785455703735352, -4.637791633605957, -3.4901275634765625, -2.342463493347168, -1.1947996616363525, -0.04713582992553711, 1.1005282402038574, 2.248192310333252, 3.3958559036254883, 4.543519973754883, 5.691184043884277, 6.838848114013672, 7.986512184143066, 9.134176254272461, 10.281839370727539, 11.42950439453125, 12.577167510986328, 13.724831581115723, 14.872495651245117, 16.020158767700195, 17.167823791503906, 18.315486907958984, 19.463151931762695, 20.610815048217773, 21.758480072021484, 22.906143188476562, 24.05380630493164, 25.20146942138672, 26.34913444519043, 27.496797561645508, 28.64446258544922, 29.792125701904297, 30.939788818359375, 32.08745574951172, 33.2351188659668]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 8.0, 7.0, 5.0, 11.0, 20.0, 22.0, 16.0, 19.0, 28.0, 23.0, 32.0, 34.0, 39.0, 46.0, 41.0, 48.0, 40.0, 44.0, 50.0, 40.0, 51.0, 48.0, 34.0, 34.0, 41.0, 36.0, 35.0, 19.0, 16.0, 15.0, 25.0, 17.0, 15.0, 10.0, 9.0, 12.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-4.48828125, -4.3675537109375, -4.246826171875, -4.1260986328125, -4.00537109375, -3.8846435546875, -3.763916015625, -3.6431884765625, -3.5224609375, -3.4017333984375, -3.281005859375, -3.1602783203125, -3.03955078125, -2.9188232421875, -2.798095703125, -2.6773681640625, -2.556640625, -2.4359130859375, -2.315185546875, -2.1944580078125, -2.07373046875, -1.9530029296875, -1.832275390625, -1.7115478515625, -1.5908203125, -1.4700927734375, -1.349365234375, -1.2286376953125, -1.10791015625, -0.9871826171875, -0.866455078125, -0.7457275390625, -0.625, -0.5042724609375, -0.383544921875, -0.2628173828125, -0.14208984375, -0.0213623046875, 0.099365234375, 0.2200927734375, 0.3408203125, 0.4615478515625, 0.582275390625, 0.7030029296875, 0.82373046875, 0.9444580078125, 1.065185546875, 1.1859130859375, 1.306640625, 1.4273681640625, 1.548095703125, 1.6688232421875, 1.78955078125, 1.9102783203125, 2.031005859375, 2.1517333984375, 2.2724609375, 2.3931884765625, 2.513916015625, 2.6346435546875, 2.75537109375, 2.8760986328125, 2.996826171875, 3.1175537109375, 3.23828125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 2.0, 4.0, 11.0, 16.0, 12.0, 18.0, 24.0, 22.0, 40.0, 37.0, 89.0, 152.0, 273.0, 722.0, 2000.0, 6019.0, 22149.0, 104480.0, 726278.0, 2583257.0, 623733.0, 94328.0, 21291.0, 5958.0, 1926.0, 708.0, 316.0, 146.0, 78.0, 37.0, 43.0, 28.0, 17.0, 11.0, 13.0, 12.0, 10.0, 6.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.59765625, -7.3636474609375, -7.129638671875, -6.8956298828125, -6.66162109375, -6.4276123046875, -6.193603515625, -5.9595947265625, -5.7255859375, -5.4915771484375, -5.257568359375, -5.0235595703125, -4.78955078125, -4.5555419921875, -4.321533203125, -4.0875244140625, -3.853515625, -3.6195068359375, -3.385498046875, -3.1514892578125, -2.91748046875, -2.6834716796875, -2.449462890625, -2.2154541015625, -1.9814453125, -1.7474365234375, -1.513427734375, -1.2794189453125, -1.04541015625, -0.8114013671875, -0.577392578125, -0.3433837890625, -0.109375, 0.1246337890625, 0.358642578125, 0.5926513671875, 0.82666015625, 1.0606689453125, 1.294677734375, 1.5286865234375, 1.7626953125, 1.9967041015625, 2.230712890625, 2.4647216796875, 2.69873046875, 2.9327392578125, 3.166748046875, 3.4007568359375, 3.634765625, 3.8687744140625, 4.102783203125, 4.3367919921875, 4.57080078125, 4.8048095703125, 5.038818359375, 5.2728271484375, 5.5068359375, 5.7408447265625, 5.974853515625, 6.2088623046875, 6.44287109375, 6.6768798828125, 6.910888671875, 7.1448974609375, 7.37890625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 6.0, 4.0, 10.0, 15.0, 14.0, 14.0, 35.0, 39.0, 37.0, 48.0, 58.0, 102.0, 124.0, 147.0, 203.0, 265.0, 318.0, 420.0, 391.0, 399.0, 327.0, 247.0, 184.0, 160.0, 125.0, 78.0, 68.0, 61.0, 46.0, 32.0, 26.0, 18.0, 12.0, 9.0, 5.0, 8.0, 7.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.3671875, -5.21148681640625, -5.0557861328125, -4.90008544921875, -4.744384765625, -4.58868408203125, -4.4329833984375, -4.27728271484375, -4.12158203125, -3.96588134765625, -3.8101806640625, -3.65447998046875, -3.498779296875, -3.34307861328125, -3.1873779296875, -3.03167724609375, -2.8759765625, -2.72027587890625, -2.5645751953125, -2.40887451171875, -2.253173828125, -2.09747314453125, -1.9417724609375, -1.78607177734375, -1.63037109375, -1.47467041015625, -1.3189697265625, -1.16326904296875, -1.007568359375, -0.85186767578125, -0.6961669921875, -0.54046630859375, -0.384765625, -0.22906494140625, -0.0733642578125, 0.08233642578125, 0.238037109375, 0.39373779296875, 0.5494384765625, 0.70513916015625, 0.86083984375, 1.01654052734375, 1.1722412109375, 1.32794189453125, 1.483642578125, 1.63934326171875, 1.7950439453125, 1.95074462890625, 2.1064453125, 2.26214599609375, 2.4178466796875, 2.57354736328125, 2.729248046875, 2.88494873046875, 3.0406494140625, 3.19635009765625, 3.35205078125, 3.50775146484375, 3.6634521484375, 3.81915283203125, 3.974853515625, 4.13055419921875, 4.2862548828125, 4.44195556640625, 4.59765625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 7.0, 7.0, 13.0, 16.0, 20.0, 23.0, 34.0, 41.0, 67.0, 68.0, 103.0, 129.0, 184.0, 244.0, 477.0, 1327.0, 6561.0, 62774.0, 1332953.0, 2658710.0, 116775.0, 10319.0, 1814.0, 594.0, 281.0, 191.0, 132.0, 93.0, 90.0, 67.0, 36.0, 35.0, 25.0, 19.0, 9.0, 8.0, 8.0, 6.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.953125, -13.473876953125, -12.99462890625, -12.515380859375, -12.0361328125, -11.556884765625, -11.07763671875, -10.598388671875, -10.119140625, -9.639892578125, -9.16064453125, -8.681396484375, -8.2021484375, -7.722900390625, -7.24365234375, -6.764404296875, -6.28515625, -5.805908203125, -5.32666015625, -4.847412109375, -4.3681640625, -3.888916015625, -3.40966796875, -2.930419921875, -2.451171875, -1.971923828125, -1.49267578125, -1.013427734375, -0.5341796875, -0.054931640625, 0.42431640625, 0.903564453125, 1.3828125, 1.862060546875, 2.34130859375, 2.820556640625, 3.2998046875, 3.779052734375, 4.25830078125, 4.737548828125, 5.216796875, 5.696044921875, 6.17529296875, 6.654541015625, 7.1337890625, 7.613037109375, 8.09228515625, 8.571533203125, 9.05078125, 9.530029296875, 10.00927734375, 10.488525390625, 10.9677734375, 11.447021484375, 11.92626953125, 12.405517578125, 12.884765625, 13.364013671875, 13.84326171875, 14.322509765625, 14.8017578125, 15.281005859375, 15.76025390625, 16.239501953125, 16.71875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 12.0, 28.0, 41.0, 83.0, 146.0, 188.0, 187.0, 143.0, 92.0, 53.0, 16.0, 13.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.303102493286133, -10.067081451416016, -8.831060409545898, -7.595038890838623, -6.359017848968506, -5.122996807098389, -3.8869752883911133, -2.650954246520996, -1.414933204650879, -0.17891204357147217, 1.0571091175079346, 2.293130397796631, 3.529151439666748, 4.765172481536865, 6.001194000244141, 7.237215042114258, 8.473236083984375, 9.709257125854492, 10.94527816772461, 12.181299209594727, 13.417320251464844, 14.653341293334961, 15.889363288879395, 17.125385284423828, 18.361404418945312, 19.59742546081543, 20.833446502685547, 22.069467544555664, 23.30548858642578, 24.5415096282959, 25.777530670166016, 27.013553619384766, 28.249576568603516, 29.485597610473633, 30.72161865234375, 31.957639694213867, 33.193660736083984, 34.429683685302734, 35.66570281982422, 36.90172576904297, 38.13774490356445, 39.3737678527832, 40.60978698730469, 41.84580993652344, 43.08182907104492, 44.31785202026367, 45.553871154785156, 46.789894104003906, 48.025917053222656, 49.261940002441406, 50.49795913696289, 51.73398208618164, 52.970001220703125, 54.206024169921875, 55.44204330444336, 56.67806625366211, 57.914085388183594, 59.150108337402344, 60.38612747192383, 61.62215042114258, 62.85816955566406, 64.09419250488281, 65.33021545410156, 66.56623077392578, 67.80225372314453]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 4.0, 3.0, 11.0, 16.0, 10.0, 13.0, 20.0, 12.0, 23.0, 19.0, 25.0, 24.0, 32.0, 31.0, 27.0, 35.0, 42.0, 37.0, 45.0, 50.0, 33.0, 40.0, 46.0, 38.0, 50.0, 38.0, 30.0, 33.0, 21.0, 35.0, 31.0, 21.0, 14.0, 11.0, 12.0, 12.0, 14.0, 6.0, 8.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.468196868896484, -15.89360237121582, -15.319007873535156, -14.744413375854492, -14.169818878173828, -13.595224380493164, -13.0206298828125, -12.446035385131836, -11.871440887451172, -11.296846389770508, -10.722251892089844, -10.14765739440918, -9.573062896728516, -8.998468399047852, -8.423873901367188, -7.849279880523682, -7.274685859680176, -6.700091361999512, -6.125496864318848, -5.550902366638184, -4.9763078689575195, -4.4017133712768555, -3.8271193504333496, -3.2525248527526855, -2.6779303550720215, -2.1033358573913574, -1.528741478919983, -0.9541471004486084, -0.37955260276794434, 0.19504189491271973, 0.7696361541748047, 1.3442306518554688, 1.9188251495361328, 2.493419647216797, 3.068014144897461, 3.642608404159546, 4.217203140258789, 4.791797637939453, 5.366391658782959, 5.940986156463623, 6.515580654144287, 7.090175151824951, 7.664769649505615, 8.239363670349121, 8.813958168029785, 9.38855266571045, 9.963147163391113, 10.537741661071777, 11.112336158752441, 11.686930656433105, 12.26152515411377, 12.836119651794434, 13.410714149475098, 13.985308647155762, 14.55990219116211, 15.134496688842773, 15.709091186523438, 16.2836856842041, 16.858280181884766, 17.43287467956543, 18.007469177246094, 18.582063674926758, 19.156658172607422, 19.731252670288086, 20.30584716796875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 0.0, 2.0, 2.0, 4.0, 15.0, 10.0, 16.0, 20.0, 12.0, 17.0, 23.0, 22.0, 23.0, 31.0, 29.0, 40.0, 41.0, 25.0, 45.0, 55.0, 42.0, 39.0, 40.0, 39.0, 34.0, 48.0, 28.0, 45.0, 33.0, 33.0, 25.0, 22.0, 24.0, 16.0, 18.0, 16.0, 20.0, 15.0, 3.0, 6.0, 4.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.625, -3.514434814453125, -3.40386962890625, -3.293304443359375, -3.1827392578125, -3.072174072265625, -2.96160888671875, -2.851043701171875, -2.740478515625, -2.629913330078125, -2.51934814453125, -2.408782958984375, -2.2982177734375, -2.187652587890625, -2.07708740234375, -1.966522216796875, -1.85595703125, -1.745391845703125, -1.63482666015625, -1.524261474609375, -1.4136962890625, -1.303131103515625, -1.19256591796875, -1.082000732421875, -0.971435546875, -0.860870361328125, -0.75030517578125, -0.639739990234375, -0.5291748046875, -0.418609619140625, -0.30804443359375, -0.197479248046875, -0.0869140625, 0.023651123046875, 0.13421630859375, 0.244781494140625, 0.3553466796875, 0.465911865234375, 0.57647705078125, 0.687042236328125, 0.797607421875, 0.908172607421875, 1.01873779296875, 1.129302978515625, 1.2398681640625, 1.350433349609375, 1.46099853515625, 1.571563720703125, 1.68212890625, 1.792694091796875, 1.90325927734375, 2.013824462890625, 2.1243896484375, 2.234954833984375, 2.34552001953125, 2.456085205078125, 2.566650390625, 2.677215576171875, 2.78778076171875, 2.898345947265625, 3.0089111328125, 3.119476318359375, 3.23004150390625, 3.340606689453125, 3.451171875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 7.0, 6.0, 8.0, 9.0, 12.0, 30.0, 35.0, 50.0, 74.0, 103.0, 161.0, 181.0, 296.0, 383.0, 606.0, 758.0, 1221.0, 1636.0, 2405.0, 3604.0, 5046.0, 7224.0, 10639.0, 15811.0, 24064.0, 35783.0, 56084.0, 92623.0, 181005.0, 264275.0, 131486.0, 73998.0, 45826.0, 30291.0, 20135.0, 13322.0, 9001.0, 6068.0, 4445.0, 3001.0, 2176.0, 1327.0, 981.0, 693.0, 528.0, 332.0, 242.0, 171.0, 108.0, 102.0, 61.0, 47.0, 32.0, 21.0, 12.0, 10.0, 4.0, 4.0, 5.0, 2.0, 2.0], "bins": [-0.016387939453125, -0.015880346298217773, -0.015372753143310547, -0.01486515998840332, -0.014357566833496094, -0.013849973678588867, -0.01334238052368164, -0.012834787368774414, -0.012327194213867188, -0.011819601058959961, -0.011312007904052734, -0.010804414749145508, -0.010296821594238281, -0.009789228439331055, -0.009281635284423828, -0.008774042129516602, -0.008266448974609375, -0.0077588558197021484, -0.007251262664794922, -0.006743669509887695, -0.006236076354980469, -0.005728483200073242, -0.005220890045166016, -0.004713296890258789, -0.0042057037353515625, -0.003698110580444336, -0.0031905174255371094, -0.002682924270629883, -0.0021753311157226562, -0.0016677379608154297, -0.0011601448059082031, -0.0006525516510009766, -0.00014495849609375, 0.00036263465881347656, 0.0008702278137207031, 0.0013778209686279297, 0.0018854141235351562, 0.002393007278442383, 0.0029006004333496094, 0.003408193588256836, 0.0039157867431640625, 0.004423379898071289, 0.004930973052978516, 0.005438566207885742, 0.005946159362792969, 0.006453752517700195, 0.006961345672607422, 0.0074689388275146484, 0.007976531982421875, 0.008484125137329102, 0.008991718292236328, 0.009499311447143555, 0.010006904602050781, 0.010514497756958008, 0.011022090911865234, 0.011529684066772461, 0.012037277221679688, 0.012544870376586914, 0.01305246353149414, 0.013560056686401367, 0.014067649841308594, 0.01457524299621582, 0.015082836151123047, 0.015590429306030273, 0.0160980224609375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 4.0, 6.0, 3.0, 3.0, 6.0, 8.0, 8.0, 16.0, 16.0, 18.0, 17.0, 22.0, 22.0, 25.0, 34.0, 42.0, 39.0, 42.0, 38.0, 58.0, 50.0, 1073.0, 40.0, 57.0, 47.0, 43.0, 56.0, 38.0, 29.0, 27.0, 18.0, 31.0, 19.0, 13.0, 16.0, 11.0, 8.0, 6.0, 7.0, 2.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4296875, -2.351715087890625, -2.27374267578125, -2.195770263671875, -2.1177978515625, -2.039825439453125, -1.96185302734375, -1.883880615234375, -1.805908203125, -1.727935791015625, -1.64996337890625, -1.571990966796875, -1.4940185546875, -1.416046142578125, -1.33807373046875, -1.260101318359375, -1.18212890625, -1.104156494140625, -1.02618408203125, -0.948211669921875, -0.8702392578125, -0.792266845703125, -0.71429443359375, -0.636322021484375, -0.558349609375, -0.480377197265625, -0.40240478515625, -0.324432373046875, -0.2464599609375, -0.168487548828125, -0.09051513671875, -0.012542724609375, 0.0654296875, 0.143402099609375, 0.22137451171875, 0.299346923828125, 0.3773193359375, 0.455291748046875, 0.53326416015625, 0.611236572265625, 0.689208984375, 0.767181396484375, 0.84515380859375, 0.923126220703125, 1.0010986328125, 1.079071044921875, 1.15704345703125, 1.235015869140625, 1.31298828125, 1.390960693359375, 1.46893310546875, 1.546905517578125, 1.6248779296875, 1.702850341796875, 1.78082275390625, 1.858795166015625, 1.936767578125, 2.014739990234375, 2.09271240234375, 2.170684814453125, 2.2486572265625, 2.326629638671875, 2.40460205078125, 2.482574462890625, 2.560546875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 9.0, 16.0, 14.0, 24.0, 30.0, 52.0, 77.0, 109.0, 156.0, 270.0, 338.0, 542.0, 858.0, 1196.0, 2023.0, 3131.0, 4907.0, 7938.0, 12719.0, 21932.0, 37702.0, 70248.0, 147672.0, 1389621.0, 197703.0, 86475.0, 45386.0, 25706.0, 15262.0, 9143.0, 5855.0, 3469.0, 2287.0, 1481.0, 919.0, 597.0, 440.0, 292.0, 197.0, 111.0, 78.0, 51.0, 34.0, 24.0, 15.0, 10.0, 6.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.01522064208984375, -0.014754533767700195, -0.01428842544555664, -0.013822317123413086, -0.013356208801269531, -0.012890100479125977, -0.012423992156982422, -0.011957883834838867, -0.011491775512695312, -0.011025667190551758, -0.010559558868408203, -0.010093450546264648, -0.009627342224121094, -0.009161233901977539, -0.008695125579833984, -0.00822901725769043, -0.007762908935546875, -0.00729680061340332, -0.006830692291259766, -0.006364583969116211, -0.005898475646972656, -0.0054323673248291016, -0.004966259002685547, -0.004500150680541992, -0.0040340423583984375, -0.003567934036254883, -0.003101825714111328, -0.0026357173919677734, -0.0021696090698242188, -0.001703500747680664, -0.0012373924255371094, -0.0007712841033935547, -0.00030517578125, 0.0001609325408935547, 0.0006270408630371094, 0.001093149185180664, 0.0015592575073242188, 0.0020253658294677734, 0.002491474151611328, 0.002957582473754883, 0.0034236907958984375, 0.003889799118041992, 0.004355907440185547, 0.0048220157623291016, 0.005288124084472656, 0.005754232406616211, 0.006220340728759766, 0.00668644905090332, 0.007152557373046875, 0.00761866569519043, 0.008084774017333984, 0.008550882339477539, 0.009016990661621094, 0.009483098983764648, 0.009949207305908203, 0.010415315628051758, 0.010881423950195312, 0.011347532272338867, 0.011813640594482422, 0.012279748916625977, 0.012745857238769531, 0.013211965560913086, 0.01367807388305664, 0.014144182205200195, 0.01461029052734375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 119.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 717.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 134.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-07, -2.300366759300232e-07, -2.2165477275848389e-07, -2.1327286958694458e-07, -2.0489096641540527e-07, -1.9650906324386597e-07, -1.8812716007232666e-07, -1.7974525690078735e-07, -1.7136335372924805e-07, -1.6298145055770874e-07, -1.5459954738616943e-07, -1.4621764421463013e-07, -1.3783574104309082e-07, -1.2945383787155151e-07, -1.210719347000122e-07, -1.126900315284729e-07, -1.043081283569336e-07, -9.592622518539429e-08, -8.754432201385498e-08, -7.916241884231567e-08, -7.078051567077637e-08, -6.239861249923706e-08, -5.4016709327697754e-08, -4.563480615615845e-08, -3.725290298461914e-08, -2.8870999813079834e-08, -2.0489096641540527e-08, -1.210719347000122e-08, -3.725290298461914e-09, 4.6566128730773926e-09, 1.30385160446167e-08, 2.1420419216156006e-08, 2.9802322387695312e-08, 3.818422555923462e-08, 4.6566128730773926e-08, 5.494803190231323e-08, 6.332993507385254e-08, 7.171183824539185e-08, 8.009374141693115e-08, 8.847564458847046e-08, 9.685754776000977e-08, 1.0523945093154907e-07, 1.1362135410308838e-07, 1.2200325727462769e-07, 1.30385160446167e-07, 1.387670636177063e-07, 1.471489667892456e-07, 1.555308699607849e-07, 1.6391277313232422e-07, 1.7229467630386353e-07, 1.8067657947540283e-07, 1.8905848264694214e-07, 1.9744038581848145e-07, 2.0582228899002075e-07, 2.1420419216156006e-07, 2.2258609533309937e-07, 2.3096799850463867e-07, 2.39349901676178e-07, 2.477318048477173e-07, 2.561137080192566e-07, 2.644956111907959e-07, 2.728775143623352e-07, 2.812594175338745e-07, 2.896413207054138e-07, 2.980232238769531e-07]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 10.0, 5.0, 2.0, 0.0, 4.0, 1.0, 17.0, 60.0, 77.0, 6.0, 6.0, 91.0, 113.0, 273.0, 8753.0, 1029750.0, 8736.0, 284.0, 103.0, 91.0, 5.0, 36.0, 88.0, 16.0, 2.0, 7.0, 1.0, 0.0, 3.0, 7.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.258487701416016e-06, -6.081536412239075e-06, -5.904585123062134e-06, -5.727633833885193e-06, -5.550682544708252e-06, -5.373731255531311e-06, -5.19677996635437e-06, -5.019828677177429e-06, -4.842877388000488e-06, -4.665926098823547e-06, -4.4889748096466064e-06, -4.3120235204696655e-06, -4.135072231292725e-06, -3.958120942115784e-06, -3.7811696529388428e-06, -3.604218363761902e-06, -3.427267074584961e-06, -3.25031578540802e-06, -3.073364496231079e-06, -2.896413207054138e-06, -2.7194619178771973e-06, -2.5425106287002563e-06, -2.3655593395233154e-06, -2.1886080503463745e-06, -2.0116567611694336e-06, -1.8347054719924927e-06, -1.6577541828155518e-06, -1.4808028936386108e-06, -1.30385160446167e-06, -1.126900315284729e-06, -9.499490261077881e-07, -7.729977369308472e-07, -5.960464477539062e-07, -4.1909515857696533e-07, -2.421438694000244e-07, -6.51925802230835e-08, 1.1175870895385742e-07, 2.8870999813079834e-07, 4.6566128730773926e-07, 6.426125764846802e-07, 8.195638656616211e-07, 9.96515154838562e-07, 1.173466444015503e-06, 1.3504177331924438e-06, 1.5273690223693848e-06, 1.7043203115463257e-06, 1.8812716007232666e-06, 2.0582228899002075e-06, 2.2351741790771484e-06, 2.4121254682540894e-06, 2.5890767574310303e-06, 2.766028046607971e-06, 2.942979335784912e-06, 3.119930624961853e-06, 3.296881914138794e-06, 3.473833203315735e-06, 3.6507844924926758e-06, 3.827735781669617e-06, 4.004687070846558e-06, 4.1816383600234985e-06, 4.3585896492004395e-06, 4.53554093837738e-06, 4.712492227554321e-06, 4.889443516731262e-06, 5.066394805908203e-06]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1004.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.492702908644787e-08, -5.963182303503345e-08, -5.4336616983619024e-08, -4.90414109322046e-08, -4.3746204880790174e-08, -3.845099882937575e-08, -3.3155792777961324e-08, -2.78605867265469e-08, -2.2565380675132474e-08, -1.727017462371805e-08, -1.1974968572303624e-08, -6.679762520889199e-09, -1.3845564694747736e-09, 3.910649581939651e-09, 9.205855633354076e-09, 1.4501061684768501e-08, 1.9796267736182926e-08, 2.509147378759735e-08, 3.0386679839011776e-08, 3.56818858904262e-08, 4.0977091941840627e-08, 4.627229799325505e-08, 5.1567504044669477e-08, 5.68627100960839e-08, 6.215791614749833e-08, 6.745312219891275e-08, 7.274832825032718e-08, 7.80435343017416e-08, 8.333874035315603e-08, 8.863394640457045e-08, 9.392915245598488e-08, 9.92243585073993e-08, 1.0451955745338637e-07, 1.098147635048008e-07, 1.1510996955621522e-07, 1.2040517560762964e-07, 1.2570038165904407e-07, 1.309955877104585e-07, 1.3629079376187292e-07, 1.4158599981328734e-07, 1.4688120586470177e-07, 1.521764119161162e-07, 1.5747161796753062e-07, 1.6276682401894504e-07, 1.6806203007035947e-07, 1.733572361217739e-07, 1.7865244217318832e-07, 1.8394764822460274e-07, 1.8924285427601717e-07, 1.945380603274316e-07, 1.9983326637884602e-07, 2.0512847243026044e-07, 2.1042367848167487e-07, 2.157188845330893e-07, 2.2101409058450372e-07, 2.2630929663591814e-07, 2.3160450268733257e-07, 2.36899708738747e-07, 2.421949147901614e-07, 2.4749010663072113e-07, 2.5278532689299027e-07, 2.580805471552594e-07, 2.633757389958191e-07, 2.6867093083637883e-07, 2.7396615109864797e-07]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1005.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 0.0, 2.0, 2.0, 4.0, 15.0, 10.0, 16.0, 20.0, 12.0, 17.0, 23.0, 22.0, 23.0, 31.0, 29.0, 40.0, 41.0, 25.0, 45.0, 55.0, 42.0, 39.0, 40.0, 39.0, 34.0, 48.0, 28.0, 45.0, 33.0, 33.0, 25.0, 22.0, 24.0, 16.0, 18.0, 16.0, 20.0, 15.0, 3.0, 6.0, 4.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.625, -3.514434814453125, -3.40386962890625, -3.293304443359375, -3.1827392578125, -3.072174072265625, -2.96160888671875, -2.851043701171875, -2.740478515625, -2.629913330078125, -2.51934814453125, -2.408782958984375, -2.2982177734375, -2.187652587890625, -2.07708740234375, -1.966522216796875, -1.85595703125, -1.745391845703125, -1.63482666015625, -1.524261474609375, -1.4136962890625, -1.303131103515625, -1.19256591796875, -1.082000732421875, -0.971435546875, -0.860870361328125, -0.75030517578125, -0.639739990234375, -0.5291748046875, -0.418609619140625, -0.30804443359375, -0.197479248046875, -0.0869140625, 0.023651123046875, 0.13421630859375, 0.244781494140625, 0.3553466796875, 0.465911865234375, 0.57647705078125, 0.687042236328125, 0.797607421875, 0.908172607421875, 1.01873779296875, 1.129302978515625, 1.2398681640625, 1.350433349609375, 1.46099853515625, 1.571563720703125, 1.68212890625, 1.792694091796875, 1.90325927734375, 2.013824462890625, 2.1243896484375, 2.234954833984375, 2.34552001953125, 2.456085205078125, 2.566650390625, 2.677215576171875, 2.78778076171875, 2.898345947265625, 3.0089111328125, 3.119476318359375, 3.23004150390625, 3.340606689453125, 3.451171875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 11.0, 0.0, 7.0, 8.0, 6.0, 24.0, 25.0, 38.0, 36.0, 50.0, 73.0, 92.0, 140.0, 188.0, 275.0, 521.0, 1042.0, 2021.0, 4326.0, 10607.0, 26822.0, 83991.0, 682849.0, 168543.0, 39908.0, 15031.0, 5978.0, 2722.0, 1330.0, 705.0, 401.0, 197.0, 136.0, 111.0, 72.0, 59.0, 44.0, 50.0, 34.0, 16.0, 17.0, 9.0, 9.0, 9.0, 7.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.890625, -6.67987060546875, -6.4691162109375, -6.25836181640625, -6.047607421875, -5.83685302734375, -5.6260986328125, -5.41534423828125, -5.20458984375, -4.99383544921875, -4.7830810546875, -4.57232666015625, -4.361572265625, -4.15081787109375, -3.9400634765625, -3.72930908203125, -3.5185546875, -3.30780029296875, -3.0970458984375, -2.88629150390625, -2.675537109375, -2.46478271484375, -2.2540283203125, -2.04327392578125, -1.83251953125, -1.62176513671875, -1.4110107421875, -1.20025634765625, -0.989501953125, -0.77874755859375, -0.5679931640625, -0.35723876953125, -0.146484375, 0.06427001953125, 0.2750244140625, 0.48577880859375, 0.696533203125, 0.90728759765625, 1.1180419921875, 1.32879638671875, 1.53955078125, 1.75030517578125, 1.9610595703125, 2.17181396484375, 2.382568359375, 2.59332275390625, 2.8040771484375, 3.01483154296875, 3.2255859375, 3.43634033203125, 3.6470947265625, 3.85784912109375, 4.068603515625, 4.27935791015625, 4.4901123046875, 4.70086669921875, 4.91162109375, 5.12237548828125, 5.3331298828125, 5.54388427734375, 5.754638671875, 5.96539306640625, 6.1761474609375, 6.38690185546875, 6.59765625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 9.0, 2.0, 2.0, 13.0, 11.0, 10.0, 24.0, 16.0, 30.0, 20.0, 30.0, 30.0, 45.0, 40.0, 49.0, 58.0, 61.0, 114.0, 1542.0, 401.0, 97.0, 52.0, 52.0, 47.0, 33.0, 43.0, 27.0, 30.0, 37.0, 25.0, 17.0, 25.0, 10.0, 6.0, 12.0, 9.0, 6.0, 7.0, 3.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.9609375, -11.6185302734375, -11.276123046875, -10.9337158203125, -10.59130859375, -10.2489013671875, -9.906494140625, -9.5640869140625, -9.2216796875, -8.8792724609375, -8.536865234375, -8.1944580078125, -7.85205078125, -7.5096435546875, -7.167236328125, -6.8248291015625, -6.482421875, -6.1400146484375, -5.797607421875, -5.4552001953125, -5.11279296875, -4.7703857421875, -4.427978515625, -4.0855712890625, -3.7431640625, -3.4007568359375, -3.058349609375, -2.7159423828125, -2.37353515625, -2.0311279296875, -1.688720703125, -1.3463134765625, -1.00390625, -0.6614990234375, -0.319091796875, 0.0233154296875, 0.36572265625, 0.7081298828125, 1.050537109375, 1.3929443359375, 1.7353515625, 2.0777587890625, 2.420166015625, 2.7625732421875, 3.10498046875, 3.4473876953125, 3.789794921875, 4.1322021484375, 4.474609375, 4.8170166015625, 5.159423828125, 5.5018310546875, 5.84423828125, 6.1866455078125, 6.529052734375, 6.8714599609375, 7.2138671875, 7.5562744140625, 7.898681640625, 8.2410888671875, 8.58349609375, 8.9259033203125, 9.268310546875, 9.6107177734375, 9.953125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 9.0, 4.0, 7.0, 14.0, 11.0, 17.0, 29.0, 15.0, 30.0, 40.0, 46.0, 56.0, 91.0, 113.0, 188.0, 343.0, 1026.0, 10175.0, 713567.0, 2404028.0, 13559.0, 1296.0, 363.0, 214.0, 120.0, 79.0, 53.0, 42.0, 35.0, 34.0, 28.0, 14.0, 18.0, 10.0, 12.0, 3.0, 3.0, 10.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.859375, -19.17578125, -18.4921875, -17.80859375, -17.125, -16.44140625, -15.7578125, -15.07421875, -14.390625, -13.70703125, -13.0234375, -12.33984375, -11.65625, -10.97265625, -10.2890625, -9.60546875, -8.921875, -8.23828125, -7.5546875, -6.87109375, -6.1875, -5.50390625, -4.8203125, -4.13671875, -3.453125, -2.76953125, -2.0859375, -1.40234375, -0.71875, -0.03515625, 0.6484375, 1.33203125, 2.015625, 2.69921875, 3.3828125, 4.06640625, 4.75, 5.43359375, 6.1171875, 6.80078125, 7.484375, 8.16796875, 8.8515625, 9.53515625, 10.21875, 10.90234375, 11.5859375, 12.26953125, 12.953125, 13.63671875, 14.3203125, 15.00390625, 15.6875, 16.37109375, 17.0546875, 17.73828125, 18.421875, 19.10546875, 19.7890625, 20.47265625, 21.15625, 21.83984375, 22.5234375, 23.20703125, 23.890625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 14.0, 31.0, 63.0, 181.0, 247.0, 248.0, 142.0, 61.0, 18.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.3286018371582, -34.506431579589844, -33.684261322021484, -32.862091064453125, -32.039920806884766, -31.21775245666504, -30.39558219909668, -29.573413848876953, -28.751243591308594, -27.929073333740234, -27.106903076171875, -26.28473472595215, -25.46256446838379, -24.64039421081543, -23.81822395324707, -22.996055603027344, -22.173885345458984, -21.351715087890625, -20.529544830322266, -19.70737648010254, -18.88520622253418, -18.06303596496582, -17.24086570739746, -16.418697357177734, -15.596525192260742, -14.774354934692383, -13.95218563079834, -13.13001537322998, -12.307846069335938, -11.485675811767578, -10.663505554199219, -9.841336250305176, -9.019166946411133, -8.196996688842773, -7.3748273849487305, -6.552657127380371, -5.730487823486328, -4.908317565917969, -4.086147785186768, -3.2639780044555664, -2.4418082237243652, -1.619638442993164, -0.7974685430526733, 0.024701356887817383, 0.8468711376190186, 1.6690411567687988, 2.4912109375, 3.313380718231201, 4.135550498962402, 4.9577202796936035, 5.779890060424805, 6.602060317993164, 7.424229621887207, 8.246399879455566, 9.06856918334961, 9.890739440917969, 10.712909698486328, 11.535079956054688, 12.35724925994873, 13.17941951751709, 14.001588821411133, 14.823759078979492, 15.645929336547852, 16.468097686767578, 17.290267944335938]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 3.0, 8.0, 10.0, 17.0, 11.0, 23.0, 28.0, 20.0, 37.0, 25.0, 38.0, 34.0, 35.0, 53.0, 52.0, 38.0, 48.0, 42.0, 39.0, 45.0, 38.0, 48.0, 35.0, 35.0, 41.0, 29.0, 30.0, 21.0, 14.0, 15.0, 14.0, 14.0, 11.0, 13.0, 6.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.01033592224121, -29.10943031311035, -28.208524703979492, -27.3076171875, -26.40671157836914, -25.50580596923828, -24.604900360107422, -23.703994750976562, -22.803089141845703, -21.902183532714844, -21.001277923583984, -20.100372314453125, -19.199464797973633, -18.298559188842773, -17.397653579711914, -16.496747970581055, -15.595840454101562, -14.694934844970703, -13.794028282165527, -12.893122673034668, -11.992216110229492, -11.091310501098633, -10.190404891967773, -9.289499282836914, -8.388592720031738, -7.487686634063721, -6.586780548095703, -5.685874938964844, -4.784968852996826, -3.8840627670288086, -2.983157157897949, -2.0822510719299316, -1.1813430786132812, -0.2804371118545532, 0.6204688549041748, 1.5213747024536133, 2.422280788421631, 3.3231868743896484, 4.224092483520508, 5.124998569488525, 6.025904655456543, 6.9268107414245605, 7.827716827392578, 8.728622436523438, 9.629528045654297, 10.530434608459473, 11.431340217590332, 12.332246780395508, 13.233152389526367, 14.134057998657227, 15.034964561462402, 15.935870170593262, 16.836776733398438, 17.737682342529297, 18.638587951660156, 19.539493560791016, 20.440399169921875, 21.341304779052734, 22.242210388183594, 23.143115997314453, 24.044023513793945, 24.944929122924805, 25.845834732055664, 26.746740341186523, 27.647647857666016]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 6.0, 11.0, 7.0, 15.0, 19.0, 10.0, 22.0, 18.0, 19.0, 24.0, 29.0, 27.0, 30.0, 35.0, 37.0, 37.0, 34.0, 43.0, 41.0, 49.0, 37.0, 42.0, 39.0, 39.0, 36.0, 36.0, 27.0, 31.0, 30.0, 27.0, 24.0, 17.0, 14.0, 16.0, 14.0, 9.0, 11.0, 7.0, 8.0, 4.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.50390625, -3.393096923828125, -3.28228759765625, -3.171478271484375, -3.0606689453125, -2.949859619140625, -2.83905029296875, -2.728240966796875, -2.617431640625, -2.506622314453125, -2.39581298828125, -2.285003662109375, -2.1741943359375, -2.063385009765625, -1.95257568359375, -1.841766357421875, -1.73095703125, -1.620147705078125, -1.50933837890625, -1.398529052734375, -1.2877197265625, -1.176910400390625, -1.06610107421875, -0.955291748046875, -0.844482421875, -0.733673095703125, -0.62286376953125, -0.512054443359375, -0.4012451171875, -0.290435791015625, -0.17962646484375, -0.068817138671875, 0.0419921875, 0.152801513671875, 0.26361083984375, 0.374420166015625, 0.4852294921875, 0.596038818359375, 0.70684814453125, 0.817657470703125, 0.928466796875, 1.039276123046875, 1.15008544921875, 1.260894775390625, 1.3717041015625, 1.482513427734375, 1.59332275390625, 1.704132080078125, 1.81494140625, 1.925750732421875, 2.03656005859375, 2.147369384765625, 2.2581787109375, 2.368988037109375, 2.47979736328125, 2.590606689453125, 2.701416015625, 2.812225341796875, 2.92303466796875, 3.033843994140625, 3.1446533203125, 3.255462646484375, 3.36627197265625, 3.477081298828125, 3.587890625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 4.0, 8.0, 7.0, 9.0, 15.0, 18.0, 24.0, 40.0, 50.0, 98.0, 181.0, 317.0, 595.0, 1354.0, 3054.0, 7793.0, 22460.0, 76467.0, 364329.0, 2091854.0, 1338226.0, 209682.0, 50908.0, 16085.0, 5997.0, 2393.0, 1069.0, 571.0, 275.0, 135.0, 87.0, 37.0, 50.0, 17.0, 24.0, 13.0, 13.0, 6.0, 5.0, 8.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.0703125, -7.84515380859375, -7.6199951171875, -7.39483642578125, -7.169677734375, -6.94451904296875, -6.7193603515625, -6.49420166015625, -6.26904296875, -6.04388427734375, -5.8187255859375, -5.59356689453125, -5.368408203125, -5.14324951171875, -4.9180908203125, -4.69293212890625, -4.4677734375, -4.24261474609375, -4.0174560546875, -3.79229736328125, -3.567138671875, -3.34197998046875, -3.1168212890625, -2.89166259765625, -2.66650390625, -2.44134521484375, -2.2161865234375, -1.99102783203125, -1.765869140625, -1.54071044921875, -1.3155517578125, -1.09039306640625, -0.865234375, -0.64007568359375, -0.4149169921875, -0.18975830078125, 0.035400390625, 0.26055908203125, 0.4857177734375, 0.71087646484375, 0.93603515625, 1.16119384765625, 1.3863525390625, 1.61151123046875, 1.836669921875, 2.06182861328125, 2.2869873046875, 2.51214599609375, 2.7373046875, 2.96246337890625, 3.1876220703125, 3.41278076171875, 3.637939453125, 3.86309814453125, 4.0882568359375, 4.31341552734375, 4.53857421875, 4.76373291015625, 4.9888916015625, 5.21405029296875, 5.439208984375, 5.66436767578125, 5.8895263671875, 6.11468505859375, 6.33984375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 6.0, 7.0, 8.0, 18.0, 22.0, 20.0, 21.0, 43.0, 55.0, 70.0, 88.0, 117.0, 129.0, 218.0, 268.0, 299.0, 386.0, 452.0, 397.0, 310.0, 261.0, 202.0, 144.0, 112.0, 88.0, 70.0, 67.0, 40.0, 31.0, 33.0, 19.0, 13.0, 17.0, 10.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.87109375, -4.71136474609375, -4.5516357421875, -4.39190673828125, -4.232177734375, -4.07244873046875, -3.9127197265625, -3.75299072265625, -3.59326171875, -3.43353271484375, -3.2738037109375, -3.11407470703125, -2.954345703125, -2.79461669921875, -2.6348876953125, -2.47515869140625, -2.3154296875, -2.15570068359375, -1.9959716796875, -1.83624267578125, -1.676513671875, -1.51678466796875, -1.3570556640625, -1.19732666015625, -1.03759765625, -0.87786865234375, -0.7181396484375, -0.55841064453125, -0.398681640625, -0.23895263671875, -0.0792236328125, 0.08050537109375, 0.240234375, 0.39996337890625, 0.5596923828125, 0.71942138671875, 0.879150390625, 1.03887939453125, 1.1986083984375, 1.35833740234375, 1.51806640625, 1.67779541015625, 1.8375244140625, 1.99725341796875, 2.156982421875, 2.31671142578125, 2.4764404296875, 2.63616943359375, 2.7958984375, 2.95562744140625, 3.1153564453125, 3.27508544921875, 3.434814453125, 3.59454345703125, 3.7542724609375, 3.91400146484375, 4.07373046875, 4.23345947265625, 4.3931884765625, 4.55291748046875, 4.712646484375, 4.87237548828125, 5.0321044921875, 5.19183349609375, 5.3515625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 10.0, 9.0, 8.0, 18.0, 18.0, 21.0, 22.0, 37.0, 60.0, 51.0, 76.0, 113.0, 153.0, 179.0, 295.0, 647.0, 2187.0, 10393.0, 77808.0, 1108773.0, 2788851.0, 178739.0, 19953.0, 3698.0, 930.0, 413.0, 208.0, 154.0, 108.0, 92.0, 57.0, 41.0, 35.0, 33.0, 26.0, 10.0, 10.0, 12.0, 11.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.140625, -13.68701171875, -13.2333984375, -12.77978515625, -12.326171875, -11.87255859375, -11.4189453125, -10.96533203125, -10.51171875, -10.05810546875, -9.6044921875, -9.15087890625, -8.697265625, -8.24365234375, -7.7900390625, -7.33642578125, -6.8828125, -6.42919921875, -5.9755859375, -5.52197265625, -5.068359375, -4.61474609375, -4.1611328125, -3.70751953125, -3.25390625, -2.80029296875, -2.3466796875, -1.89306640625, -1.439453125, -0.98583984375, -0.5322265625, -0.07861328125, 0.375, 0.82861328125, 1.2822265625, 1.73583984375, 2.189453125, 2.64306640625, 3.0966796875, 3.55029296875, 4.00390625, 4.45751953125, 4.9111328125, 5.36474609375, 5.818359375, 6.27197265625, 6.7255859375, 7.17919921875, 7.6328125, 8.08642578125, 8.5400390625, 8.99365234375, 9.447265625, 9.90087890625, 10.3544921875, 10.80810546875, 11.26171875, 11.71533203125, 12.1689453125, 12.62255859375, 13.076171875, 13.52978515625, 13.9833984375, 14.43701171875, 14.890625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 13.0, 22.0, 30.0, 41.0, 52.0, 71.0, 82.0, 86.0, 86.0, 115.0, 89.0, 79.0, 76.0, 42.0, 31.0, 31.0, 20.0, 16.0, 5.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.477941513061523, -24.74338150024414, -24.00882339477539, -23.274263381958008, -22.539703369140625, -21.805143356323242, -21.070585250854492, -20.33602523803711, -19.601465225219727, -18.866905212402344, -18.132347106933594, -17.39778709411621, -16.663227081298828, -15.928668022155762, -15.194108963012695, -14.459548950195312, -13.724989891052246, -12.99043083190918, -12.255870819091797, -11.52131175994873, -10.786751747131348, -10.052192687988281, -9.317632675170898, -8.583073616027832, -7.848514080047607, -7.113954544067383, -6.379395008087158, -5.644835472106934, -4.910276412963867, -4.175716400146484, -3.441157341003418, -2.7065978050231934, -1.9720382690429688, -1.2374787330627441, -0.5029193162918091, 0.23164010047912598, 0.9661996364593506, 1.7007591724395752, 2.4353184700012207, 3.1698780059814453, 3.90443754196167, 4.6389970779418945, 5.373556613922119, 6.108116149902344, 6.84267520904541, 7.577235221862793, 8.31179428100586, 9.046354293823242, 9.780913352966309, 10.515472412109375, 11.250032424926758, 11.984591484069824, 12.719151496887207, 13.453710556030273, 14.188270568847656, 14.922829627990723, 15.657388687133789, 16.391948699951172, 17.126506805419922, 17.861066818237305, 18.595626831054688, 19.33018684387207, 20.06474494934082, 20.799304962158203, 21.533864974975586]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 0.0, 3.0, 5.0, 10.0, 16.0, 11.0, 12.0, 12.0, 16.0, 16.0, 23.0, 22.0, 22.0, 37.0, 24.0, 35.0, 40.0, 35.0, 36.0, 50.0, 44.0, 37.0, 48.0, 45.0, 32.0, 35.0, 36.0, 46.0, 28.0, 34.0, 35.0, 28.0, 17.0, 11.0, 16.0, 20.0, 12.0, 14.0, 7.0, 10.0, 8.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-21.35034942626953, -20.72182846069336, -20.093305587768555, -19.464784622192383, -18.836261749267578, -18.207740783691406, -17.5792179107666, -16.95069694519043, -16.322174072265625, -15.693652153015137, -15.065130233764648, -14.43660831451416, -13.808086395263672, -13.1795654296875, -12.551043510437012, -11.922521591186523, -11.294000625610352, -10.665478706359863, -10.036956787109375, -9.408434867858887, -8.779912948608398, -8.151391983032227, -7.522870063781738, -6.89434814453125, -6.265826225280762, -5.637304306030273, -5.008782386779785, -4.380260944366455, -3.751739025115967, -3.1232171058654785, -2.4946954250335693, -1.8661737442016602, -1.2376518249511719, -0.6091300249099731, 0.019391775131225586, 0.6479135751724243, 1.276435375213623, 1.9049572944641113, 2.5334789752960205, 3.1620006561279297, 3.790522575378418, 4.419044494628906, 5.0475664138793945, 5.676087856292725, 6.304609775543213, 6.933131694793701, 7.561653137207031, 8.19017505645752, 8.818696975708008, 9.447218894958496, 10.075740814208984, 10.704262733459473, 11.332784652709961, 11.961305618286133, 12.589827537536621, 13.21834945678711, 13.846871376037598, 14.475393295288086, 15.103915214538574, 15.732437133789062, 16.360958099365234, 16.98948097229004, 17.61800193786621, 18.246524810791016, 18.875045776367188]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 8.0, 8.0, 9.0, 19.0, 16.0, 21.0, 22.0, 16.0, 34.0, 23.0, 39.0, 37.0, 48.0, 41.0, 43.0, 36.0, 49.0, 43.0, 50.0, 47.0, 50.0, 39.0, 41.0, 32.0, 26.0, 34.0, 28.0, 19.0, 15.0, 20.0, 11.0, 13.0, 14.0, 11.0, 11.0, 5.0, 11.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.9375, -3.81298828125, -3.6884765625, -3.56396484375, -3.439453125, -3.31494140625, -3.1904296875, -3.06591796875, -2.94140625, -2.81689453125, -2.6923828125, -2.56787109375, -2.443359375, -2.31884765625, -2.1943359375, -2.06982421875, -1.9453125, -1.82080078125, -1.6962890625, -1.57177734375, -1.447265625, -1.32275390625, -1.1982421875, -1.07373046875, -0.94921875, -0.82470703125, -0.7001953125, -0.57568359375, -0.451171875, -0.32666015625, -0.2021484375, -0.07763671875, 0.046875, 0.17138671875, 0.2958984375, 0.42041015625, 0.544921875, 0.66943359375, 0.7939453125, 0.91845703125, 1.04296875, 1.16748046875, 1.2919921875, 1.41650390625, 1.541015625, 1.66552734375, 1.7900390625, 1.91455078125, 2.0390625, 2.16357421875, 2.2880859375, 2.41259765625, 2.537109375, 2.66162109375, 2.7861328125, 2.91064453125, 3.03515625, 3.15966796875, 3.2841796875, 3.40869140625, 3.533203125, 3.65771484375, 3.7822265625, 3.90673828125, 4.03125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 9.0, 15.0, 14.0, 27.0, 42.0, 50.0, 70.0, 110.0, 183.0, 293.0, 544.0, 949.0, 1673.0, 2784.0, 5041.0, 9262.0, 17215.0, 32718.0, 67378.0, 166938.0, 427891.0, 172627.0, 69866.0, 33304.0, 17802.0, 9638.0, 5358.0, 2895.0, 1554.0, 908.0, 500.0, 336.0, 226.0, 110.0, 90.0, 49.0, 28.0, 20.0, 17.0, 8.0, 1.0, 8.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0296630859375, -0.028750896453857422, -0.027838706970214844, -0.026926517486572266, -0.026014328002929688, -0.02510213851928711, -0.02418994903564453, -0.023277759552001953, -0.022365570068359375, -0.021453380584716797, -0.02054119110107422, -0.01962900161743164, -0.018716812133789062, -0.017804622650146484, -0.016892433166503906, -0.015980243682861328, -0.01506805419921875, -0.014155864715576172, -0.013243675231933594, -0.012331485748291016, -0.011419296264648438, -0.01050710678100586, -0.009594917297363281, -0.008682727813720703, -0.007770538330078125, -0.006858348846435547, -0.005946159362792969, -0.005033969879150391, -0.0041217803955078125, -0.0032095909118652344, -0.0022974014282226562, -0.0013852119445800781, -0.0004730224609375, 0.0004391670227050781, 0.0013513565063476562, 0.0022635459899902344, 0.0031757354736328125, 0.004087924957275391, 0.005000114440917969, 0.005912303924560547, 0.006824493408203125, 0.007736682891845703, 0.008648872375488281, 0.00956106185913086, 0.010473251342773438, 0.011385440826416016, 0.012297630310058594, 0.013209819793701172, 0.01412200927734375, 0.015034198760986328, 0.015946388244628906, 0.016858577728271484, 0.017770767211914062, 0.01868295669555664, 0.01959514617919922, 0.020507335662841797, 0.021419525146484375, 0.022331714630126953, 0.02324390411376953, 0.02415609359741211, 0.025068283081054688, 0.025980472564697266, 0.026892662048339844, 0.027804851531982422, 0.028717041015625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 7.0, 10.0, 10.0, 17.0, 11.0, 14.0, 17.0, 14.0, 25.0, 26.0, 23.0, 27.0, 38.0, 37.0, 33.0, 36.0, 38.0, 33.0, 46.0, 1064.0, 40.0, 38.0, 49.0, 40.0, 37.0, 34.0, 32.0, 22.0, 24.0, 23.0, 24.0, 17.0, 21.0, 16.0, 15.0, 12.0, 12.0, 6.0, 4.0, 6.0, 4.0, 2.0, 7.0, 2.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.16015625, -2.087646484375, -2.01513671875, -1.942626953125, -1.8701171875, -1.797607421875, -1.72509765625, -1.652587890625, -1.580078125, -1.507568359375, -1.43505859375, -1.362548828125, -1.2900390625, -1.217529296875, -1.14501953125, -1.072509765625, -1.0, -0.927490234375, -0.85498046875, -0.782470703125, -0.7099609375, -0.637451171875, -0.56494140625, -0.492431640625, -0.419921875, -0.347412109375, -0.27490234375, -0.202392578125, -0.1298828125, -0.057373046875, 0.01513671875, 0.087646484375, 0.16015625, 0.232666015625, 0.30517578125, 0.377685546875, 0.4501953125, 0.522705078125, 0.59521484375, 0.667724609375, 0.740234375, 0.812744140625, 0.88525390625, 0.957763671875, 1.0302734375, 1.102783203125, 1.17529296875, 1.247802734375, 1.3203125, 1.392822265625, 1.46533203125, 1.537841796875, 1.6103515625, 1.682861328125, 1.75537109375, 1.827880859375, 1.900390625, 1.972900390625, 2.04541015625, 2.117919921875, 2.1904296875, 2.262939453125, 2.33544921875, 2.407958984375, 2.48046875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 9.0, 14.0, 13.0, 15.0, 47.0, 45.0, 118.0, 107.0, 196.0, 262.0, 427.0, 650.0, 840.0, 1362.0, 2033.0, 2897.0, 4468.0, 6875.0, 10571.0, 16489.0, 26264.0, 41700.0, 70555.0, 134304.0, 1342258.0, 199441.0, 92175.0, 52988.0, 32344.0, 20256.0, 12847.0, 8248.0, 5457.0, 3564.0, 2393.0, 1606.0, 1006.0, 704.0, 474.0, 337.0, 250.0, 160.0, 105.0, 73.0, 55.0, 47.0, 32.0, 20.0, 10.0, 6.0, 6.0, 3.0, 4.0, 3.0, 2.0], "bins": [-0.01480865478515625, -0.014369606971740723, -0.013930559158325195, -0.013491511344909668, -0.01305246353149414, -0.012613415718078613, -0.012174367904663086, -0.011735320091247559, -0.011296272277832031, -0.010857224464416504, -0.010418176651000977, -0.00997912883758545, -0.009540081024169922, -0.009101033210754395, -0.008661985397338867, -0.00822293758392334, -0.0077838897705078125, -0.007344841957092285, -0.006905794143676758, -0.0064667463302612305, -0.006027698516845703, -0.005588650703430176, -0.0051496028900146484, -0.004710555076599121, -0.004271507263183594, -0.0038324594497680664, -0.003393411636352539, -0.0029543638229370117, -0.0025153160095214844, -0.002076268196105957, -0.0016372203826904297, -0.0011981725692749023, -0.000759124755859375, -0.00032007694244384766, 0.00011897087097167969, 0.000558018684387207, 0.0009970664978027344, 0.0014361143112182617, 0.001875162124633789, 0.0023142099380493164, 0.0027532577514648438, 0.003192305564880371, 0.0036313533782958984, 0.004070401191711426, 0.004509449005126953, 0.0049484968185424805, 0.005387544631958008, 0.005826592445373535, 0.0062656402587890625, 0.00670468807220459, 0.007143735885620117, 0.0075827836990356445, 0.008021831512451172, 0.0084608793258667, 0.008899927139282227, 0.009338974952697754, 0.009778022766113281, 0.010217070579528809, 0.010656118392944336, 0.011095166206359863, 0.01153421401977539, 0.011973261833190918, 0.012412309646606445, 0.012851357460021973, 0.0132904052734375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 146.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 631.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 165.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0], "bins": [-2.980232238769531e-07, -2.905726432800293e-07, -2.8312206268310547e-07, -2.7567148208618164e-07, -2.682209014892578e-07, -2.60770320892334e-07, -2.5331974029541016e-07, -2.4586915969848633e-07, -2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 9.0, 11.0, 10.0, 5.0, 4.0, 0.0, 2.0, 14.0, 52.0, 68.0, 55.0, 11.0, 122.0, 115.0, 104.0, 409.0, 11468.0, 933672.0, 101177.0, 560.0, 213.0, 63.0, 174.0, 16.0, 8.0, 73.0, 54.0, 40.0, 8.0, 0.0, 0.0, 8.0, 4.0, 8.0, 8.0, 14.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.814697265625e-06, -3.666616976261139e-06, -3.518536686897278e-06, -3.3704563975334167e-06, -3.2223761081695557e-06, -3.0742958188056946e-06, -2.9262155294418335e-06, -2.7781352400779724e-06, -2.6300549507141113e-06, -2.4819746613502502e-06, -2.333894371986389e-06, -2.185814082622528e-06, -2.037733793258667e-06, -1.889653503894806e-06, -1.7415732145309448e-06, -1.5934929251670837e-06, -1.4454126358032227e-06, -1.2973323464393616e-06, -1.1492520570755005e-06, -1.0011717677116394e-06, -8.530914783477783e-07, -7.050111889839172e-07, -5.569308996200562e-07, -4.0885061025619507e-07, -2.60770320892334e-07, -1.126900315284729e-07, 3.5390257835388184e-08, 1.8347054719924927e-07, 3.3155083656311035e-07, 4.796311259269714e-07, 6.277114152908325e-07, 7.757917046546936e-07, 9.238719940185547e-07, 1.0719522833824158e-06, 1.2200325727462769e-06, 1.368112862110138e-06, 1.516193151473999e-06, 1.6642734408378601e-06, 1.8123537302017212e-06, 1.9604340195655823e-06, 2.1085143089294434e-06, 2.2565945982933044e-06, 2.4046748876571655e-06, 2.5527551770210266e-06, 2.7008354663848877e-06, 2.8489157557487488e-06, 2.99699604511261e-06, 3.145076334476471e-06, 3.293156623840332e-06, 3.441236913204193e-06, 3.589317202568054e-06, 3.7373974919319153e-06, 3.885477781295776e-06, 4.0335580706596375e-06, 4.1816383600234985e-06, 4.32971864938736e-06, 4.477798938751221e-06, 4.625879228115082e-06, 4.773959517478943e-06, 4.922039806842804e-06, 5.070120096206665e-06, 5.218200385570526e-06, 5.366280674934387e-06, 5.514360964298248e-06, 5.662441253662109e-06]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 978.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.877844320271834e-08, -9.563981251403675e-08, -9.25011747199278e-08, -8.936254403124622e-08, -8.622390623713727e-08, -8.308527554845568e-08, -7.99466448597741e-08, -7.680800706566515e-08, -7.36693692715562e-08, -7.053073858287462e-08, -6.739210078876567e-08, -6.425347010008409e-08, -6.111483230597514e-08, -5.7976201617293555e-08, -5.483756737589829e-08, -5.169893313450302e-08, -4.8560302445821435e-08, -4.542166820442617e-08, -4.22830339630309e-08, -3.9144403274349315e-08, -3.600576548024037e-08, -3.286713479155878e-08, -2.9728500550163517e-08, -2.658986630876825e-08, -2.3451232067372985e-08, -2.031259782597772e-08, -1.7173963584582452e-08, -1.4035331119544026e-08, -1.089669687814876e-08, -7.758062636753493e-09, -4.6194301717150665e-09, -1.4807959303198004e-09, 1.6578312056481082e-09, 4.7964650029541644e-09, 7.93509880026022e-09, 1.1073732153477067e-08, 1.4212366394872333e-08, 1.73510006362676e-08, 2.0489633101306026e-08, 2.3628267342701292e-08, 2.676690158409656e-08, 2.9905535825491825e-08, 3.304417006688709e-08, 3.618280430828236e-08, 3.9321434996963944e-08, 4.246007279107289e-08, 4.5598703479754477e-08, 4.873733772114974e-08, 5.187597196254501e-08, 5.5014606203940275e-08, 5.815324044533554e-08, 6.129187113401713e-08, 6.443050892812607e-08, 6.756913961680766e-08, 7.070777030548925e-08, 7.384640809959819e-08, 7.698504589370714e-08, 8.012367658238873e-08, 8.326231437649767e-08, 8.640094506517926e-08, 8.95395828592882e-08, 9.267821354796979e-08, 9.581684423665138e-08, 9.895548203076032e-08, 1.0209411271944191e-07]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [25.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 977.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.960464477539063e-08, -5.681067705154419e-08, -5.4016709327697754e-08, -5.122274160385132e-08, -4.842877388000488e-08, -4.563480615615845e-08, -4.284083843231201e-08, -4.0046870708465576e-08, -3.725290298461914e-08, -3.4458935260772705e-08, -3.166496753692627e-08, -2.8870999813079834e-08, -2.60770320892334e-08, -2.3283064365386963e-08, -2.0489096641540527e-08, -1.7695128917694092e-08, -1.4901161193847656e-08, -1.210719347000122e-08, -9.313225746154785e-09, -6.51925802230835e-09, -3.725290298461914e-09, -9.313225746154785e-10, 1.862645149230957e-09, 4.6566128730773926e-09, 7.450580596923828e-09, 1.0244548320770264e-08, 1.30385160446167e-08, 1.5832483768463135e-08, 1.862645149230957e-08, 2.1420419216156006e-08, 2.421438694000244e-08, 2.7008354663848877e-08, 2.9802322387695312e-08, 3.259629011154175e-08, 3.5390257835388184e-08, 3.818422555923462e-08, 4.0978193283081055e-08, 4.377216100692749e-08, 4.6566128730773926e-08, 4.936009645462036e-08, 5.21540641784668e-08, 5.494803190231323e-08, 5.774199962615967e-08, 6.05359673500061e-08, 6.332993507385254e-08, 6.612390279769897e-08, 6.891787052154541e-08, 7.171183824539185e-08, 7.450580596923828e-08, 7.729977369308472e-08, 8.009374141693115e-08, 8.288770914077759e-08, 8.568167686462402e-08, 8.847564458847046e-08, 9.12696123123169e-08, 9.406358003616333e-08, 9.685754776000977e-08, 9.96515154838562e-08, 1.0244548320770264e-07, 1.0523945093154907e-07, 1.0803341865539551e-07, 1.1082738637924194e-07, 1.1362135410308838e-07, 1.1641532182693481e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 8.0, 8.0, 9.0, 19.0, 16.0, 21.0, 22.0, 16.0, 34.0, 23.0, 39.0, 37.0, 48.0, 41.0, 43.0, 36.0, 49.0, 43.0, 50.0, 47.0, 50.0, 39.0, 41.0, 32.0, 26.0, 34.0, 28.0, 19.0, 15.0, 20.0, 11.0, 13.0, 14.0, 11.0, 11.0, 5.0, 11.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.9375, -3.81298828125, -3.6884765625, -3.56396484375, -3.439453125, -3.31494140625, -3.1904296875, -3.06591796875, -2.94140625, -2.81689453125, -2.6923828125, -2.56787109375, -2.443359375, -2.31884765625, -2.1943359375, -2.06982421875, -1.9453125, -1.82080078125, -1.6962890625, -1.57177734375, -1.447265625, -1.32275390625, -1.1982421875, -1.07373046875, -0.94921875, -0.82470703125, -0.7001953125, -0.57568359375, -0.451171875, -0.32666015625, -0.2021484375, -0.07763671875, 0.046875, 0.17138671875, 0.2958984375, 0.42041015625, 0.544921875, 0.66943359375, 0.7939453125, 0.91845703125, 1.04296875, 1.16748046875, 1.2919921875, 1.41650390625, 1.541015625, 1.66552734375, 1.7900390625, 1.91455078125, 2.0390625, 2.16357421875, 2.2880859375, 2.41259765625, 2.537109375, 2.66162109375, 2.7861328125, 2.91064453125, 3.03515625, 3.15966796875, 3.2841796875, 3.40869140625, 3.533203125, 3.65771484375, 3.7822265625, 3.90673828125, 4.03125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 0.0, 9.0, 8.0, 14.0, 29.0, 33.0, 62.0, 82.0, 106.0, 181.0, 306.0, 530.0, 844.0, 1457.0, 2428.0, 4069.0, 6887.0, 12559.0, 22621.0, 42413.0, 81115.0, 173816.0, 334426.0, 182509.0, 84458.0, 43596.0, 23404.0, 12897.0, 7334.0, 4106.0, 2456.0, 1492.0, 823.0, 544.0, 356.0, 208.0, 123.0, 92.0, 57.0, 37.0, 27.0, 11.0, 12.0, 5.0, 9.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0390625, -3.91094970703125, -3.7828369140625, -3.65472412109375, -3.526611328125, -3.39849853515625, -3.2703857421875, -3.14227294921875, -3.01416015625, -2.88604736328125, -2.7579345703125, -2.62982177734375, -2.501708984375, -2.37359619140625, -2.2454833984375, -2.11737060546875, -1.9892578125, -1.86114501953125, -1.7330322265625, -1.60491943359375, -1.476806640625, -1.34869384765625, -1.2205810546875, -1.09246826171875, -0.96435546875, -0.83624267578125, -0.7081298828125, -0.58001708984375, -0.451904296875, -0.32379150390625, -0.1956787109375, -0.06756591796875, 0.060546875, 0.18865966796875, 0.3167724609375, 0.44488525390625, 0.572998046875, 0.70111083984375, 0.8292236328125, 0.95733642578125, 1.08544921875, 1.21356201171875, 1.3416748046875, 1.46978759765625, 1.597900390625, 1.72601318359375, 1.8541259765625, 1.98223876953125, 2.1103515625, 2.23846435546875, 2.3665771484375, 2.49468994140625, 2.622802734375, 2.75091552734375, 2.8790283203125, 3.00714111328125, 3.13525390625, 3.26336669921875, 3.3914794921875, 3.51959228515625, 3.647705078125, 3.77581787109375, 3.9039306640625, 4.03204345703125, 4.16015625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 4.0, 11.0, 7.0, 7.0, 12.0, 17.0, 29.0, 13.0, 18.0, 30.0, 38.0, 30.0, 32.0, 57.0, 80.0, 94.0, 166.0, 1384.0, 406.0, 157.0, 102.0, 62.0, 48.0, 46.0, 30.0, 39.0, 29.0, 28.0, 21.0, 13.0, 13.0, 9.0, 11.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9296875, -11.518310546875, -11.10693359375, -10.695556640625, -10.2841796875, -9.872802734375, -9.46142578125, -9.050048828125, -8.638671875, -8.227294921875, -7.81591796875, -7.404541015625, -6.9931640625, -6.581787109375, -6.17041015625, -5.759033203125, -5.34765625, -4.936279296875, -4.52490234375, -4.113525390625, -3.7021484375, -3.290771484375, -2.87939453125, -2.468017578125, -2.056640625, -1.645263671875, -1.23388671875, -0.822509765625, -0.4111328125, 0.000244140625, 0.41162109375, 0.822998046875, 1.234375, 1.645751953125, 2.05712890625, 2.468505859375, 2.8798828125, 3.291259765625, 3.70263671875, 4.114013671875, 4.525390625, 4.936767578125, 5.34814453125, 5.759521484375, 6.1708984375, 6.582275390625, 6.99365234375, 7.405029296875, 7.81640625, 8.227783203125, 8.63916015625, 9.050537109375, 9.4619140625, 9.873291015625, 10.28466796875, 10.696044921875, 11.107421875, 11.518798828125, 11.93017578125, 12.341552734375, 12.7529296875, 13.164306640625, 13.57568359375, 13.987060546875, 14.3984375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 5.0, 6.0, 8.0, 10.0, 24.0, 29.0, 57.0, 103.0, 135.0, 293.0, 629.0, 2098.0, 14035.0, 217587.0, 2790941.0, 108166.0, 8829.0, 1554.0, 511.0, 261.0, 143.0, 96.0, 58.0, 41.0, 32.0, 13.0, 16.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6484375, -15.1160888671875, -14.583740234375, -14.0513916015625, -13.51904296875, -12.9866943359375, -12.454345703125, -11.9219970703125, -11.3896484375, -10.8572998046875, -10.324951171875, -9.7926025390625, -9.26025390625, -8.7279052734375, -8.195556640625, -7.6632080078125, -7.130859375, -6.5985107421875, -6.066162109375, -5.5338134765625, -5.00146484375, -4.4691162109375, -3.936767578125, -3.4044189453125, -2.8720703125, -2.3397216796875, -1.807373046875, -1.2750244140625, -0.74267578125, -0.2103271484375, 0.322021484375, 0.8543701171875, 1.38671875, 1.9190673828125, 2.451416015625, 2.9837646484375, 3.51611328125, 4.0484619140625, 4.580810546875, 5.1131591796875, 5.6455078125, 6.1778564453125, 6.710205078125, 7.2425537109375, 7.77490234375, 8.3072509765625, 8.839599609375, 9.3719482421875, 9.904296875, 10.4366455078125, 10.968994140625, 11.5013427734375, 12.03369140625, 12.5660400390625, 13.098388671875, 13.6307373046875, 14.1630859375, 14.6954345703125, 15.227783203125, 15.7601318359375, 16.29248046875, 16.8248291015625, 17.357177734375, 17.8895263671875, 18.421875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [2.0, 7.0, 214.0, 579.0, 207.0, 12.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.43085765838623, -8.188886642456055, -4.946916580200195, -1.7049455642700195, 1.5370244979858398, 4.778994560241699, 8.020966529846191, 11.26293659210205, 14.50490665435791, 17.746877670288086, 20.988847732543945, 24.230819702148438, 27.472789764404297, 30.714759826660156, 33.956729888916016, 37.198699951171875, 40.440670013427734, 43.682640075683594, 46.92461013793945, 50.16658020019531, 53.40855407714844, 56.65052032470703, 59.892494201660156, 63.134464263916016, 66.37643432617188, 69.618408203125, 72.8603744506836, 76.10234832763672, 79.34431457519531, 82.58628845214844, 85.82826232910156, 89.07022857666016, 92.31219482421875, 95.55416870117188, 98.79613494873047, 102.0381088256836, 105.28007507324219, 108.52204895019531, 111.76402282714844, 115.00598907470703, 118.24795532226562, 121.48992919921875, 124.73189544677734, 127.97386932373047, 131.21583557128906, 134.4578094482422, 137.6997833251953, 140.94174194335938, 144.1837158203125, 147.42568969726562, 150.66766357421875, 153.9096221923828, 157.15159606933594, 160.39356994628906, 163.6355438232422, 166.87750244140625, 170.11949157714844, 173.36146545410156, 176.6034393310547, 179.84539794921875, 183.08737182617188, 186.329345703125, 189.57131958007812, 192.81329345703125, 196.0552520751953]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 15.0, 7.0, 10.0, 16.0, 8.0, 11.0, 14.0, 17.0, 22.0, 19.0, 30.0, 24.0, 29.0, 39.0, 35.0, 39.0, 47.0, 35.0, 35.0, 50.0, 33.0, 38.0, 52.0, 33.0, 39.0, 21.0, 25.0, 32.0, 34.0, 22.0, 26.0, 24.0, 24.0, 21.0, 10.0, 8.0, 15.0, 3.0, 13.0, 4.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-24.566593170166016, -23.82815170288086, -23.08970832824707, -22.351266860961914, -21.612823486328125, -20.87438201904297, -20.135940551757812, -19.397499084472656, -18.659055709838867, -17.92061424255371, -17.182170867919922, -16.443729400634766, -15.705286979675293, -14.96684455871582, -14.228403091430664, -13.489960670471191, -12.751518249511719, -12.013075828552246, -11.274633407592773, -10.536191940307617, -9.797749519348145, -9.059307098388672, -8.320865631103516, -7.582423210144043, -6.84398078918457, -6.105538368225098, -5.367096424102783, -4.628654479980469, -3.890212059020996, -3.1517698764801025, -2.413327693939209, -1.6748857498168945, -0.9364452362060547, -0.19800305366516113, 0.5404391288757324, 1.278881311416626, 2.0173234939575195, 2.755765676498413, 3.4942078590393066, 4.232649803161621, 4.971092224121094, 5.709534645080566, 6.447976589202881, 7.186418533325195, 7.924860954284668, 8.66330337524414, 9.401744842529297, 10.14018726348877, 10.878629684448242, 11.617072105407715, 12.355514526367188, 13.093955993652344, 13.832398414611816, 14.570840835571289, 15.309282302856445, 16.047725677490234, 16.78616714477539, 17.524608612060547, 18.263051986694336, 19.001493453979492, 19.73993682861328, 20.478378295898438, 21.216819763183594, 21.95526123046875, 22.69370460510254]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 4.0, 7.0, 6.0, 8.0, 9.0, 9.0, 17.0, 18.0, 29.0, 22.0, 25.0, 22.0, 25.0, 45.0, 43.0, 40.0, 31.0, 47.0, 42.0, 38.0, 42.0, 44.0, 41.0, 55.0, 49.0, 32.0, 41.0, 22.0, 25.0, 28.0, 24.0, 20.0, 10.0, 20.0, 9.0, 11.0, 12.0, 6.0, 7.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.78125, -3.65606689453125, -3.5308837890625, -3.40570068359375, -3.280517578125, -3.15533447265625, -3.0301513671875, -2.90496826171875, -2.77978515625, -2.65460205078125, -2.5294189453125, -2.40423583984375, -2.279052734375, -2.15386962890625, -2.0286865234375, -1.90350341796875, -1.7783203125, -1.65313720703125, -1.5279541015625, -1.40277099609375, -1.277587890625, -1.15240478515625, -1.0272216796875, -0.90203857421875, -0.77685546875, -0.65167236328125, -0.5264892578125, -0.40130615234375, -0.276123046875, -0.15093994140625, -0.0257568359375, 0.09942626953125, 0.224609375, 0.34979248046875, 0.4749755859375, 0.60015869140625, 0.725341796875, 0.85052490234375, 0.9757080078125, 1.10089111328125, 1.22607421875, 1.35125732421875, 1.4764404296875, 1.60162353515625, 1.726806640625, 1.85198974609375, 1.9771728515625, 2.10235595703125, 2.2275390625, 2.35272216796875, 2.4779052734375, 2.60308837890625, 2.728271484375, 2.85345458984375, 2.9786376953125, 3.10382080078125, 3.22900390625, 3.35418701171875, 3.4793701171875, 3.60455322265625, 3.729736328125, 3.85491943359375, 3.9801025390625, 4.10528564453125, 4.23046875]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 8.0, 16.0, 22.0, 39.0, 66.0, 80.0, 153.0, 247.0, 420.0, 908.0, 2038.0, 5166.0, 14582.0, 49167.0, 250323.0, 2231264.0, 1431181.0, 153894.0, 35599.0, 11375.0, 4174.0, 1794.0, 812.0, 412.0, 177.0, 132.0, 75.0, 42.0, 33.0, 22.0, 10.0, 9.0, 8.0, 2.0, 3.0, 2.0, 6.0, 0.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.69921875, -7.41278076171875, -7.1263427734375, -6.83990478515625, -6.553466796875, -6.26702880859375, -5.9805908203125, -5.69415283203125, -5.40771484375, -5.12127685546875, -4.8348388671875, -4.54840087890625, -4.261962890625, -3.97552490234375, -3.6890869140625, -3.40264892578125, -3.1162109375, -2.82977294921875, -2.5433349609375, -2.25689697265625, -1.970458984375, -1.68402099609375, -1.3975830078125, -1.11114501953125, -0.82470703125, -0.53826904296875, -0.2518310546875, 0.03460693359375, 0.321044921875, 0.60748291015625, 0.8939208984375, 1.18035888671875, 1.466796875, 1.75323486328125, 2.0396728515625, 2.32611083984375, 2.612548828125, 2.89898681640625, 3.1854248046875, 3.47186279296875, 3.75830078125, 4.04473876953125, 4.3311767578125, 4.61761474609375, 4.904052734375, 5.19049072265625, 5.4769287109375, 5.76336669921875, 6.0498046875, 6.33624267578125, 6.6226806640625, 6.90911865234375, 7.195556640625, 7.48199462890625, 7.7684326171875, 8.05487060546875, 8.34130859375, 8.62774658203125, 8.9141845703125, 9.20062255859375, 9.487060546875, 9.77349853515625, 10.0599365234375, 10.34637451171875, 10.6328125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 4.0, 11.0, 9.0, 17.0, 26.0, 44.0, 62.0, 73.0, 79.0, 121.0, 207.0, 291.0, 420.0, 599.0, 584.0, 476.0, 291.0, 216.0, 180.0, 95.0, 82.0, 63.0, 38.0, 31.0, 16.0, 12.0, 10.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.03125, -4.8131103515625, -4.594970703125, -4.3768310546875, -4.15869140625, -3.9405517578125, -3.722412109375, -3.5042724609375, -3.2861328125, -3.0679931640625, -2.849853515625, -2.6317138671875, -2.41357421875, -2.1954345703125, -1.977294921875, -1.7591552734375, -1.541015625, -1.3228759765625, -1.104736328125, -0.8865966796875, -0.66845703125, -0.4503173828125, -0.232177734375, -0.0140380859375, 0.2041015625, 0.4222412109375, 0.640380859375, 0.8585205078125, 1.07666015625, 1.2947998046875, 1.512939453125, 1.7310791015625, 1.94921875, 2.1673583984375, 2.385498046875, 2.6036376953125, 2.82177734375, 3.0399169921875, 3.258056640625, 3.4761962890625, 3.6943359375, 3.9124755859375, 4.130615234375, 4.3487548828125, 4.56689453125, 4.7850341796875, 5.003173828125, 5.2213134765625, 5.439453125, 5.6575927734375, 5.875732421875, 6.0938720703125, 6.31201171875, 6.5301513671875, 6.748291015625, 6.9664306640625, 7.1845703125, 7.4027099609375, 7.620849609375, 7.8389892578125, 8.05712890625, 8.2752685546875, 8.493408203125, 8.7115478515625, 8.9296875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 4.0, 6.0, 10.0, 2.0, 11.0, 24.0, 22.0, 32.0, 41.0, 74.0, 104.0, 189.0, 362.0, 735.0, 1680.0, 4177.0, 12526.0, 44357.0, 187567.0, 1187573.0, 2318209.0, 334875.0, 72128.0, 19293.0, 6031.0, 2229.0, 972.0, 438.0, 243.0, 139.0, 63.0, 48.0, 34.0, 34.0, 19.0, 11.0, 10.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.875, -9.5860595703125, -9.297119140625, -9.0081787109375, -8.71923828125, -8.4302978515625, -8.141357421875, -7.8524169921875, -7.5634765625, -7.2745361328125, -6.985595703125, -6.6966552734375, -6.40771484375, -6.1187744140625, -5.829833984375, -5.5408935546875, -5.251953125, -4.9630126953125, -4.674072265625, -4.3851318359375, -4.09619140625, -3.8072509765625, -3.518310546875, -3.2293701171875, -2.9404296875, -2.6514892578125, -2.362548828125, -2.0736083984375, -1.78466796875, -1.4957275390625, -1.206787109375, -0.9178466796875, -0.62890625, -0.3399658203125, -0.051025390625, 0.2379150390625, 0.52685546875, 0.8157958984375, 1.104736328125, 1.3936767578125, 1.6826171875, 1.9715576171875, 2.260498046875, 2.5494384765625, 2.83837890625, 3.1273193359375, 3.416259765625, 3.7052001953125, 3.994140625, 4.2830810546875, 4.572021484375, 4.8609619140625, 5.14990234375, 5.4388427734375, 5.727783203125, 6.0167236328125, 6.3056640625, 6.5946044921875, 6.883544921875, 7.1724853515625, 7.46142578125, 7.7503662109375, 8.039306640625, 8.3282470703125, 8.6171875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 11.0, 22.0, 29.0, 30.0, 63.0, 90.0, 121.0, 115.0, 114.0, 118.0, 103.0, 66.0, 57.0, 25.0, 18.0, 11.0, 6.0, 4.0, 4.0], "bins": [-48.4801139831543, -47.56629180908203, -46.65247344970703, -45.738651275634766, -44.8248291015625, -43.9110107421875, -42.997188568115234, -42.08336639404297, -41.16954803466797, -40.2557258605957, -39.3419075012207, -38.42808532714844, -37.51426315307617, -36.60044479370117, -35.686622619628906, -34.772804260253906, -33.85898208618164, -32.945159912109375, -32.031341552734375, -31.11751937866211, -30.203699111938477, -29.289878845214844, -28.376056671142578, -27.462236404418945, -26.54841423034668, -25.634593963623047, -24.72077178955078, -23.80695152282715, -22.893131256103516, -21.97930908203125, -21.065488815307617, -20.151668548583984, -19.23784637451172, -18.324026107788086, -17.41020393371582, -16.496383666992188, -15.582563400268555, -14.668742179870605, -13.754920959472656, -12.841100692749023, -11.92728042602539, -11.013459205627441, -10.099638938903809, -9.18581771850586, -8.271997451782227, -7.358176231384277, -6.444355487823486, -5.530534744262695, -4.6167144775390625, -3.7028937339782715, -2.7890729904174805, -1.8752520084381104, -0.9614312648773193, -0.04761028289794922, 0.8662104606628418, 1.7800312042236328, 2.693851947784424, 3.607672691345215, 4.521493434906006, 5.435314178466797, 6.349135398864746, 7.262956142425537, 8.176776885986328, 9.090597152709961, 10.00441837310791]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 11.0, 10.0, 9.0, 14.0, 11.0, 25.0, 22.0, 24.0, 27.0, 15.0, 23.0, 32.0, 30.0, 40.0, 44.0, 37.0, 32.0, 26.0, 40.0, 34.0, 48.0, 37.0, 35.0, 32.0, 31.0, 34.0, 44.0, 30.0, 18.0, 32.0, 18.0, 18.0, 23.0, 17.0, 15.0, 6.0, 10.0, 14.0, 4.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-19.134492874145508, -18.515792846679688, -17.897090911865234, -17.278390884399414, -16.659690856933594, -16.04098892211914, -15.42228889465332, -14.803587913513184, -14.184886932373047, -13.56618595123291, -12.947484970092773, -12.328784942626953, -11.710083961486816, -11.09138298034668, -10.47268295288086, -9.853981971740723, -9.235280990600586, -8.61658000946045, -7.997879505157471, -7.379179000854492, -6.7604780197143555, -6.141777038574219, -5.52307653427124, -4.904376029968262, -4.285675048828125, -3.6669743061065674, -3.0482735633850098, -2.429572820663452, -1.8108720779418945, -1.192171335220337, -0.5734705924987793, 0.04522991180419922, 0.6639328002929688, 1.2826335430145264, 1.901334285736084, 2.5200350284576416, 3.138735771179199, 3.757436513900757, 4.3761372566223145, 4.994837760925293, 5.61353874206543, 6.232239723205566, 6.850940227508545, 7.469640731811523, 8.08834171295166, 8.707042694091797, 9.325742721557617, 9.944443702697754, 10.56314468383789, 11.181845664978027, 11.800546646118164, 12.419246673583984, 13.037947654724121, 13.656648635864258, 14.275348663330078, 14.894049644470215, 15.512750625610352, 16.131450653076172, 16.750152587890625, 17.368852615356445, 17.987552642822266, 18.60625457763672, 19.22495460510254, 19.84365463256836, 20.462356567382812]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 9.0, 5.0, 5.0, 6.0, 12.0, 14.0, 12.0, 17.0, 29.0, 29.0, 25.0, 31.0, 31.0, 35.0, 41.0, 48.0, 48.0, 59.0, 39.0, 50.0, 33.0, 52.0, 29.0, 48.0, 28.0, 41.0, 37.0, 35.0, 29.0, 26.0, 19.0, 20.0, 26.0, 9.0, 10.0, 4.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1484375, -4.0076904296875, -3.866943359375, -3.7261962890625, -3.58544921875, -3.4447021484375, -3.303955078125, -3.1632080078125, -3.0224609375, -2.8817138671875, -2.740966796875, -2.6002197265625, -2.45947265625, -2.3187255859375, -2.177978515625, -2.0372314453125, -1.896484375, -1.7557373046875, -1.614990234375, -1.4742431640625, -1.33349609375, -1.1927490234375, -1.052001953125, -0.9112548828125, -0.7705078125, -0.6297607421875, -0.489013671875, -0.3482666015625, -0.20751953125, -0.0667724609375, 0.073974609375, 0.2147216796875, 0.35546875, 0.4962158203125, 0.636962890625, 0.7777099609375, 0.91845703125, 1.0592041015625, 1.199951171875, 1.3406982421875, 1.4814453125, 1.6221923828125, 1.762939453125, 1.9036865234375, 2.04443359375, 2.1851806640625, 2.325927734375, 2.4666748046875, 2.607421875, 2.7481689453125, 2.888916015625, 3.0296630859375, 3.17041015625, 3.3111572265625, 3.451904296875, 3.5926513671875, 3.7333984375, 3.8741455078125, 4.014892578125, 4.1556396484375, 4.29638671875, 4.4371337890625, 4.577880859375, 4.7186279296875, 4.859375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 4.0, 8.0, 10.0, 14.0, 21.0, 16.0, 39.0, 50.0, 70.0, 152.0, 172.0, 262.0, 473.0, 599.0, 1060.0, 1778.0, 2842.0, 4826.0, 8435.0, 14362.0, 24287.0, 42488.0, 75915.0, 154407.0, 334118.0, 182851.0, 85963.0, 47185.0, 27227.0, 15897.0, 9260.0, 5363.0, 3289.0, 1889.0, 1154.0, 737.0, 432.0, 298.0, 192.0, 148.0, 71.0, 49.0, 53.0, 33.0, 22.0, 10.0, 13.0, 6.0, 4.0, 0.0, 2.0, 1.0, 4.0, 3.0], "bins": [-0.02764892578125, -0.026849746704101562, -0.026050567626953125, -0.025251388549804688, -0.02445220947265625, -0.023653030395507812, -0.022853851318359375, -0.022054672241210938, -0.0212554931640625, -0.020456314086914062, -0.019657135009765625, -0.018857955932617188, -0.01805877685546875, -0.017259597778320312, -0.016460418701171875, -0.015661239624023438, -0.014862060546875, -0.014062881469726562, -0.013263702392578125, -0.012464523315429688, -0.01166534423828125, -0.010866165161132812, -0.010066986083984375, -0.009267807006835938, -0.0084686279296875, -0.0076694488525390625, -0.006870269775390625, -0.0060710906982421875, -0.00527191162109375, -0.0044727325439453125, -0.003673553466796875, -0.0028743743896484375, -0.0020751953125, -0.0012760162353515625, -0.000476837158203125, 0.0003223419189453125, 0.00112152099609375, 0.0019207000732421875, 0.002719879150390625, 0.0035190582275390625, 0.0043182373046875, 0.0051174163818359375, 0.005916595458984375, 0.0067157745361328125, 0.00751495361328125, 0.008314132690429688, 0.009113311767578125, 0.009912490844726562, 0.010711669921875, 0.011510848999023438, 0.012310028076171875, 0.013109207153320312, 0.01390838623046875, 0.014707565307617188, 0.015506744384765625, 0.016305923461914062, 0.0171051025390625, 0.017904281616210938, 0.018703460693359375, 0.019502639770507812, 0.02030181884765625, 0.021100997924804688, 0.021900177001953125, 0.022699356079101562, 0.02349853515625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 4.0, 5.0, 5.0, 5.0, 7.0, 14.0, 11.0, 11.0, 11.0, 12.0, 15.0, 31.0, 28.0, 21.0, 29.0, 33.0, 42.0, 47.0, 37.0, 42.0, 37.0, 39.0, 1069.0, 51.0, 54.0, 31.0, 31.0, 38.0, 35.0, 35.0, 23.0, 17.0, 22.0, 16.0, 22.0, 12.0, 9.0, 17.0, 14.0, 14.0, 7.0, 6.0, 1.0, 2.0, 7.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0], "bins": [-2.681640625, -2.601837158203125, -2.52203369140625, -2.442230224609375, -2.3624267578125, -2.282623291015625, -2.20281982421875, -2.123016357421875, -2.043212890625, -1.963409423828125, -1.88360595703125, -1.803802490234375, -1.7239990234375, -1.644195556640625, -1.56439208984375, -1.484588623046875, -1.40478515625, -1.324981689453125, -1.24517822265625, -1.165374755859375, -1.0855712890625, -1.005767822265625, -0.92596435546875, -0.846160888671875, -0.766357421875, -0.686553955078125, -0.60675048828125, -0.526947021484375, -0.4471435546875, -0.367340087890625, -0.28753662109375, -0.207733154296875, -0.1279296875, -0.048126220703125, 0.03167724609375, 0.111480712890625, 0.1912841796875, 0.271087646484375, 0.35089111328125, 0.430694580078125, 0.510498046875, 0.590301513671875, 0.67010498046875, 0.749908447265625, 0.8297119140625, 0.909515380859375, 0.98931884765625, 1.069122314453125, 1.14892578125, 1.228729248046875, 1.30853271484375, 1.388336181640625, 1.4681396484375, 1.547943115234375, 1.62774658203125, 1.707550048828125, 1.787353515625, 1.867156982421875, 1.94696044921875, 2.026763916015625, 2.1065673828125, 2.186370849609375, 2.26617431640625, 2.345977783203125, 2.42578125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 10.0, 5.0, 5.0, 4.0, 9.0, 21.0, 28.0, 51.0, 51.0, 85.0, 96.0, 178.0, 284.0, 369.0, 497.0, 729.0, 1137.0, 1607.0, 2429.0, 3687.0, 5499.0, 8515.0, 12992.0, 21024.0, 33881.0, 58086.0, 106366.0, 254792.0, 1316904.0, 111910.0, 60256.0, 34955.0, 21572.0, 13339.0, 8514.0, 5816.0, 3608.0, 2456.0, 1806.0, 1100.0, 748.0, 523.0, 397.0, 220.0, 152.0, 139.0, 119.0, 64.0, 33.0, 26.0, 11.0, 14.0, 11.0, 8.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.01471710205078125, -0.014227032661437988, -0.013736963272094727, -0.013246893882751465, -0.012756824493408203, -0.012266755104064941, -0.01177668571472168, -0.011286616325378418, -0.010796546936035156, -0.010306477546691895, -0.009816408157348633, -0.009326338768005371, -0.00883626937866211, -0.008346199989318848, -0.007856130599975586, -0.007366061210632324, -0.0068759918212890625, -0.006385922431945801, -0.005895853042602539, -0.005405783653259277, -0.004915714263916016, -0.004425644874572754, -0.003935575485229492, -0.0034455060958862305, -0.0029554367065429688, -0.002465367317199707, -0.0019752979278564453, -0.0014852285385131836, -0.0009951591491699219, -0.0005050897598266602, -1.5020370483398438e-05, 0.0004750490188598633, 0.000965118408203125, 0.0014551877975463867, 0.0019452571868896484, 0.00243532657623291, 0.002925395965576172, 0.0034154653549194336, 0.0039055347442626953, 0.004395604133605957, 0.004885673522949219, 0.0053757429122924805, 0.005865812301635742, 0.006355881690979004, 0.006845951080322266, 0.007336020469665527, 0.007826089859008789, 0.00831615924835205, 0.008806228637695312, 0.009296298027038574, 0.009786367416381836, 0.010276436805725098, 0.01076650619506836, 0.011256575584411621, 0.011746644973754883, 0.012236714363098145, 0.012726783752441406, 0.013216853141784668, 0.01370692253112793, 0.014196991920471191, 0.014687061309814453, 0.015177130699157715, 0.015667200088500977, 0.01615726947784424, 0.0166473388671875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 49.0, 0.0, 0.0, 0.0, 0.0, 204.0, 0.0, 0.0, 0.0, 0.0, 0.0, 478.0, 0.0, 0.0, 0.0, 0.0, 188.0, 0.0, 0.0, 0.0, 0.0, 60.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.46451997756958e-07, -3.3527612686157227e-07, -3.241002559661865e-07, -3.129243850708008e-07, -3.0174851417541504e-07, -2.905726432800293e-07, -2.7939677238464355e-07, -2.682209014892578e-07, -2.5704503059387207e-07, -2.4586915969848633e-07, -2.3469328880310059e-07, -2.2351741790771484e-07, -2.123415470123291e-07, -2.0116567611694336e-07, -1.8998980522155762e-07, -1.7881393432617188e-07, -1.6763806343078613e-07, -1.564621925354004e-07, -1.4528632164001465e-07, -1.341104507446289e-07, -1.2293457984924316e-07, -1.1175870895385742e-07, -1.0058283805847168e-07, -8.940696716308594e-08, -7.82310962677002e-08, -6.705522537231445e-08, -5.587935447692871e-08, -4.470348358154297e-08, -3.3527612686157227e-08, -2.2351741790771484e-08, -1.1175870895385742e-08, 0.0, 1.1175870895385742e-08, 2.2351741790771484e-08, 3.3527612686157227e-08, 4.470348358154297e-08, 5.587935447692871e-08, 6.705522537231445e-08, 7.82310962677002e-08, 8.940696716308594e-08, 1.0058283805847168e-07, 1.1175870895385742e-07, 1.2293457984924316e-07, 1.341104507446289e-07, 1.4528632164001465e-07, 1.564621925354004e-07, 1.6763806343078613e-07, 1.7881393432617188e-07, 1.8998980522155762e-07, 2.0116567611694336e-07, 2.123415470123291e-07, 2.2351741790771484e-07, 2.3469328880310059e-07, 2.4586915969848633e-07, 2.5704503059387207e-07, 2.682209014892578e-07, 2.7939677238464355e-07, 2.905726432800293e-07, 3.0174851417541504e-07, 3.129243850708008e-07, 3.241002559661865e-07, 3.3527612686157227e-07, 3.46451997756958e-07, 3.5762786865234375e-07]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 8.0, 6.0, 2.0, 2.0, 35.0, 27.0, 14.0, 1.0, 53.0, 71.0, 50.0, 128.0, 302.0, 229.0, 1219.0, 895471.0, 149319.0, 765.0, 214.0, 273.0, 97.0, 96.0, 56.0, 30.0, 1.0, 16.0, 32.0, 13.0, 3.0, 2.0, 5.0, 3.0, 8.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.033348083496094e-06, -6.812624633312225e-06, -6.591901183128357e-06, -6.3711777329444885e-06, -6.15045428276062e-06, -5.929730832576752e-06, -5.709007382392883e-06, -5.488283932209015e-06, -5.2675604820251465e-06, -5.046837031841278e-06, -4.82611358165741e-06, -4.605390131473541e-06, -4.384666681289673e-06, -4.1639432311058044e-06, -3.943219780921936e-06, -3.7224963307380676e-06, -3.5017728805541992e-06, -3.281049430370331e-06, -3.0603259801864624e-06, -2.839602530002594e-06, -2.6188790798187256e-06, -2.398155629634857e-06, -2.1774321794509888e-06, -1.9567087292671204e-06, -1.735985279083252e-06, -1.5152618288993835e-06, -1.2945383787155151e-06, -1.0738149285316467e-06, -8.530914783477783e-07, -6.323680281639099e-07, -4.116445779800415e-07, -1.909211277961731e-07, 2.9802322387695312e-08, 2.505257725715637e-07, 4.7124922275543213e-07, 6.919726729393005e-07, 9.126961231231689e-07, 1.1334195733070374e-06, 1.3541430234909058e-06, 1.5748664736747742e-06, 1.7955899238586426e-06, 2.016313374042511e-06, 2.2370368242263794e-06, 2.457760274410248e-06, 2.678483724594116e-06, 2.8992071747779846e-06, 3.119930624961853e-06, 3.3406540751457214e-06, 3.56137752532959e-06, 3.7821009755134583e-06, 4.002824425697327e-06, 4.223547875881195e-06, 4.4442713260650635e-06, 4.664994776248932e-06, 4.8857182264328e-06, 5.106441676616669e-06, 5.327165126800537e-06, 5.5478885769844055e-06, 5.768612027168274e-06, 5.989335477352142e-06, 6.210058927536011e-06, 6.430782377719879e-06, 6.6515058279037476e-06, 6.872229278087616e-06, 7.092952728271484e-06]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 9.0, 40.0, 888.0, 65.0, 14.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3163825087758596e-06, -1.2823385304727708e-06, -1.248294552169682e-06, -1.2142505738665932e-06, -1.1802065955635044e-06, -1.1461626172604156e-06, -1.1121186389573268e-06, -1.0780745469674002e-06, -1.0440305686643114e-06, -1.0099865903612226e-06, -9.759426120581338e-07, -9.41898633755045e-07, -9.078546554519562e-07, -8.738106771488674e-07, -8.397666420023597e-07, -8.057226636992709e-07, -7.71678742239601e-07, -7.376347639365122e-07, -7.035907856334234e-07, -6.695468073303346e-07, -6.355028290272458e-07, -6.014588507241569e-07, -5.674148155776493e-07, -5.333708372745605e-07, -4.993268589714717e-07, -4.6528288066838286e-07, -4.3123890236529405e-07, -3.971948956404958e-07, -3.63150917337407e-07, -3.291069390343182e-07, -2.9506293230951997e-07, -2.6101895400643116e-07, -2.2697508939018007e-07, -1.9293111108709127e-07, -1.5888711857314775e-07, -1.2484312605920422e-07, -9.079914775611542e-08, -5.675516945302661e-08, -2.271117693908309e-08, 1.1332815574860433e-08, 4.537679387794924e-08, 7.94207792864654e-08, 1.1346476469498157e-07, 1.475087572089251e-07, 1.815527355120139e-07, 2.155967138151027e-07, 2.4964072053990094e-07, 2.8368469884298975e-07, 3.1772867714607855e-07, 3.5177265544916736e-07, 3.8581663375225617e-07, 4.198606404770544e-07, 4.539046187801432e-07, 4.879485686615226e-07, 5.219926038080303e-07, 5.560365821111191e-07, 5.900805604142079e-07, 6.241245387172967e-07, 6.581685170203855e-07, 6.922124953234743e-07, 7.26256530469982e-07, 7.603005087730708e-07, 7.943444870761596e-07, 8.283884653792484e-07, 8.624324436823372e-07]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 101.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 813.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 9.0, 5.0, 5.0, 6.0, 12.0, 14.0, 12.0, 17.0, 29.0, 29.0, 25.0, 31.0, 31.0, 35.0, 41.0, 48.0, 48.0, 59.0, 39.0, 50.0, 33.0, 52.0, 29.0, 48.0, 28.0, 41.0, 37.0, 35.0, 29.0, 26.0, 19.0, 20.0, 26.0, 9.0, 10.0, 4.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1484375, -4.0076904296875, -3.866943359375, -3.7261962890625, -3.58544921875, -3.4447021484375, -3.303955078125, -3.1632080078125, -3.0224609375, -2.8817138671875, -2.740966796875, -2.6002197265625, -2.45947265625, -2.3187255859375, -2.177978515625, -2.0372314453125, -1.896484375, -1.7557373046875, -1.614990234375, -1.4742431640625, -1.33349609375, -1.1927490234375, -1.052001953125, -0.9112548828125, -0.7705078125, -0.6297607421875, -0.489013671875, -0.3482666015625, -0.20751953125, -0.0667724609375, 0.073974609375, 0.2147216796875, 0.35546875, 0.4962158203125, 0.636962890625, 0.7777099609375, 0.91845703125, 1.0592041015625, 1.199951171875, 1.3406982421875, 1.4814453125, 1.6221923828125, 1.762939453125, 1.9036865234375, 2.04443359375, 2.1851806640625, 2.325927734375, 2.4666748046875, 2.607421875, 2.7481689453125, 2.888916015625, 3.0296630859375, 3.17041015625, 3.3111572265625, 3.451904296875, 3.5926513671875, 3.7333984375, 3.8741455078125, 4.014892578125, 4.1556396484375, 4.29638671875, 4.4371337890625, 4.577880859375, 4.7186279296875, 4.859375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 7.0, 10.0, 13.0, 9.0, 22.0, 24.0, 43.0, 67.0, 99.0, 155.0, 230.0, 371.0, 670.0, 1113.0, 1836.0, 3270.0, 5642.0, 10505.0, 19370.0, 35581.0, 65358.0, 126624.0, 306979.0, 242079.0, 104726.0, 56128.0, 30368.0, 16526.0, 8890.0, 4939.0, 2865.0, 1568.0, 939.0, 554.0, 335.0, 223.0, 145.0, 77.0, 66.0, 34.0, 30.0, 17.0, 17.0, 12.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.32421875, -4.18853759765625, -4.0528564453125, -3.91717529296875, -3.781494140625, -3.64581298828125, -3.5101318359375, -3.37445068359375, -3.23876953125, -3.10308837890625, -2.9674072265625, -2.83172607421875, -2.696044921875, -2.56036376953125, -2.4246826171875, -2.28900146484375, -2.1533203125, -2.01763916015625, -1.8819580078125, -1.74627685546875, -1.610595703125, -1.47491455078125, -1.3392333984375, -1.20355224609375, -1.06787109375, -0.93218994140625, -0.7965087890625, -0.66082763671875, -0.525146484375, -0.38946533203125, -0.2537841796875, -0.11810302734375, 0.017578125, 0.15325927734375, 0.2889404296875, 0.42462158203125, 0.560302734375, 0.69598388671875, 0.8316650390625, 0.96734619140625, 1.10302734375, 1.23870849609375, 1.3743896484375, 1.51007080078125, 1.645751953125, 1.78143310546875, 1.9171142578125, 2.05279541015625, 2.1884765625, 2.32415771484375, 2.4598388671875, 2.59552001953125, 2.731201171875, 2.86688232421875, 3.0025634765625, 3.13824462890625, 3.27392578125, 3.40960693359375, 3.5452880859375, 3.68096923828125, 3.816650390625, 3.95233154296875, 4.0880126953125, 4.22369384765625, 4.359375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 2.0, 7.0, 4.0, 8.0, 5.0, 18.0, 16.0, 16.0, 17.0, 22.0, 16.0, 38.0, 27.0, 45.0, 41.0, 44.0, 77.0, 114.0, 197.0, 1497.0, 262.0, 158.0, 74.0, 65.0, 40.0, 41.0, 45.0, 26.0, 17.0, 18.0, 18.0, 12.0, 15.0, 17.0, 7.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.03125, -11.6842041015625, -11.337158203125, -10.9901123046875, -10.64306640625, -10.2960205078125, -9.948974609375, -9.6019287109375, -9.2548828125, -8.9078369140625, -8.560791015625, -8.2137451171875, -7.86669921875, -7.5196533203125, -7.172607421875, -6.8255615234375, -6.478515625, -6.1314697265625, -5.784423828125, -5.4373779296875, -5.09033203125, -4.7432861328125, -4.396240234375, -4.0491943359375, -3.7021484375, -3.3551025390625, -3.008056640625, -2.6610107421875, -2.31396484375, -1.9669189453125, -1.619873046875, -1.2728271484375, -0.92578125, -0.5787353515625, -0.231689453125, 0.1153564453125, 0.46240234375, 0.8094482421875, 1.156494140625, 1.5035400390625, 1.8505859375, 2.1976318359375, 2.544677734375, 2.8917236328125, 3.23876953125, 3.5858154296875, 3.932861328125, 4.2799072265625, 4.626953125, 4.9739990234375, 5.321044921875, 5.6680908203125, 6.01513671875, 6.3621826171875, 6.709228515625, 7.0562744140625, 7.4033203125, 7.7503662109375, 8.097412109375, 8.4444580078125, 8.79150390625, 9.1385498046875, 9.485595703125, 9.8326416015625, 10.1796875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 7.0, 8.0, 8.0, 11.0, 8.0, 18.0, 21.0, 38.0, 39.0, 64.0, 67.0, 93.0, 135.0, 203.0, 372.0, 866.0, 3503.0, 24868.0, 307248.0, 2647200.0, 142961.0, 14082.0, 2219.0, 666.0, 298.0, 193.0, 116.0, 96.0, 78.0, 48.0, 33.0, 31.0, 25.0, 22.0, 19.0, 17.0, 8.0, 8.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-14.03125, -13.5977783203125, -13.164306640625, -12.7308349609375, -12.29736328125, -11.8638916015625, -11.430419921875, -10.9969482421875, -10.5634765625, -10.1300048828125, -9.696533203125, -9.2630615234375, -8.82958984375, -8.3961181640625, -7.962646484375, -7.5291748046875, -7.095703125, -6.6622314453125, -6.228759765625, -5.7952880859375, -5.36181640625, -4.9283447265625, -4.494873046875, -4.0614013671875, -3.6279296875, -3.1944580078125, -2.760986328125, -2.3275146484375, -1.89404296875, -1.4605712890625, -1.027099609375, -0.5936279296875, -0.16015625, 0.2733154296875, 0.706787109375, 1.1402587890625, 1.57373046875, 2.0072021484375, 2.440673828125, 2.8741455078125, 3.3076171875, 3.7410888671875, 4.174560546875, 4.6080322265625, 5.04150390625, 5.4749755859375, 5.908447265625, 6.3419189453125, 6.775390625, 7.2088623046875, 7.642333984375, 8.0758056640625, 8.50927734375, 8.9427490234375, 9.376220703125, 9.8096923828125, 10.2431640625, 10.6766357421875, 11.110107421875, 11.5435791015625, 11.97705078125, 12.4105224609375, 12.843994140625, 13.2774658203125, 13.7109375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 7.0, 42.0, 319.0, 486.0, 151.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.276069641113281, -9.38602352142334, -6.495977401733398, -3.605931282043457, -0.7158851623535156, 2.174160957336426, 5.064207077026367, 7.954254150390625, 10.84429931640625, 13.734345436096191, 16.624391555786133, 19.51443862915039, 22.404483795166016, 25.29452896118164, 28.1845760345459, 31.074623107910156, 33.96466827392578, 36.854713439941406, 39.74475860595703, 42.63480758666992, 45.52485275268555, 48.41489791870117, 51.30494689941406, 54.19499206542969, 57.08503723144531, 59.97508239746094, 62.86512756347656, 65.75517272949219, 68.64521789550781, 71.53527069091797, 74.4253158569336, 77.31536102294922, 80.20539855957031, 83.09544372558594, 85.98548889160156, 88.87553405761719, 91.76557922363281, 94.65563201904297, 97.5456771850586, 100.43572235107422, 103.32576751708984, 106.21581268310547, 109.1058578491211, 111.99590301513672, 114.88595581054688, 117.7760009765625, 120.66604614257812, 123.55609130859375, 126.44613647460938, 129.336181640625, 132.22622680664062, 135.11627197265625, 138.00631713867188, 140.8963623046875, 143.78640747070312, 146.67645263671875, 149.56649780273438, 152.45654296875, 155.34658813476562, 158.23663330078125, 161.12667846679688, 164.0167236328125, 166.90676879882812, 169.79681396484375, 172.68687438964844]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 2.0, 4.0, 10.0, 6.0, 9.0, 15.0, 9.0, 12.0, 15.0, 17.0, 20.0, 26.0, 25.0, 30.0, 34.0, 24.0, 37.0, 33.0, 35.0, 39.0, 39.0, 48.0, 44.0, 40.0, 38.0, 39.0, 31.0, 27.0, 28.0, 40.0, 23.0, 36.0, 27.0, 28.0, 13.0, 22.0, 13.0, 13.0, 13.0, 8.0, 4.0, 8.0, 3.0, 1.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.122787475585938, -18.476417541503906, -17.830047607421875, -17.183677673339844, -16.537307739257812, -15.890938758850098, -15.244569778442383, -14.598199844360352, -13.95182991027832, -13.305459976196289, -12.659090042114258, -12.012721061706543, -11.366351127624512, -10.71998119354248, -10.073612213134766, -9.427242279052734, -8.780872344970703, -8.134502410888672, -7.488132953643799, -6.841763496398926, -6.1953935623168945, -5.549023628234863, -4.90265417098999, -4.256284713745117, -3.609914779663086, -2.963545083999634, -2.3171753883361816, -1.6708056926727295, -1.0244359970092773, -0.3780663013458252, 0.26830339431762695, 0.9146728515625, 1.5610427856445312, 2.2074124813079834, 2.8537821769714355, 3.5001518726348877, 4.14652156829834, 4.792891502380371, 5.439260959625244, 6.085630416870117, 6.732000350952148, 7.37837028503418, 8.024740219116211, 8.671109199523926, 9.317479133605957, 9.963849067687988, 10.610218048095703, 11.256587982177734, 11.902957916259766, 12.549327850341797, 13.195697784423828, 13.842066764831543, 14.488436698913574, 15.134806632995605, 15.78117561340332, 16.42754554748535, 17.073915481567383, 17.720285415649414, 18.366655349731445, 19.013025283813477, 19.659393310546875, 20.305763244628906, 20.952133178710938, 21.59850311279297, 22.244873046875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 8.0, 8.0, 9.0, 10.0, 14.0, 17.0, 27.0, 16.0, 20.0, 35.0, 27.0, 36.0, 59.0, 42.0, 45.0, 37.0, 52.0, 43.0, 48.0, 43.0, 44.0, 45.0, 47.0, 38.0, 27.0, 34.0, 33.0, 19.0, 23.0, 25.0, 13.0, 12.0, 15.0, 5.0, 9.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.171875, -4.02685546875, -3.8818359375, -3.73681640625, -3.591796875, -3.44677734375, -3.3017578125, -3.15673828125, -3.01171875, -2.86669921875, -2.7216796875, -2.57666015625, -2.431640625, -2.28662109375, -2.1416015625, -1.99658203125, -1.8515625, -1.70654296875, -1.5615234375, -1.41650390625, -1.271484375, -1.12646484375, -0.9814453125, -0.83642578125, -0.69140625, -0.54638671875, -0.4013671875, -0.25634765625, -0.111328125, 0.03369140625, 0.1787109375, 0.32373046875, 0.46875, 0.61376953125, 0.7587890625, 0.90380859375, 1.048828125, 1.19384765625, 1.3388671875, 1.48388671875, 1.62890625, 1.77392578125, 1.9189453125, 2.06396484375, 2.208984375, 2.35400390625, 2.4990234375, 2.64404296875, 2.7890625, 2.93408203125, 3.0791015625, 3.22412109375, 3.369140625, 3.51416015625, 3.6591796875, 3.80419921875, 3.94921875, 4.09423828125, 4.2392578125, 4.38427734375, 4.529296875, 4.67431640625, 4.8193359375, 4.96435546875, 5.109375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 8.0, 12.0, 12.0, 19.0, 21.0, 28.0, 41.0, 49.0, 79.0, 90.0, 131.0, 229.0, 361.0, 558.0, 6080.0, 4179324.0, 5643.0, 534.0, 328.0, 219.0, 126.0, 93.0, 80.0, 51.0, 42.0, 32.0, 18.0, 20.0, 10.0, 14.0, 8.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.3125, -64.8642578125, -62.416015625, -59.9677734375, -57.51953125, -55.0712890625, -52.623046875, -50.1748046875, -47.7265625, -45.2783203125, -42.830078125, -40.3818359375, -37.93359375, -35.4853515625, -33.037109375, -30.5888671875, -28.140625, -25.6923828125, -23.244140625, -20.7958984375, -18.34765625, -15.8994140625, -13.451171875, -11.0029296875, -8.5546875, -6.1064453125, -3.658203125, -1.2099609375, 1.23828125, 3.6865234375, 6.134765625, 8.5830078125, 11.03125, 13.4794921875, 15.927734375, 18.3759765625, 20.82421875, 23.2724609375, 25.720703125, 28.1689453125, 30.6171875, 33.0654296875, 35.513671875, 37.9619140625, 40.41015625, 42.8583984375, 45.306640625, 47.7548828125, 50.203125, 52.6513671875, 55.099609375, 57.5478515625, 59.99609375, 62.4443359375, 64.892578125, 67.3408203125, 69.7890625, 72.2373046875, 74.685546875, 77.1337890625, 79.58203125, 82.0302734375, 84.478515625, 86.9267578125, 89.375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 4.0, 5.0, 9.0, 13.0, 17.0, 19.0, 22.0, 34.0, 37.0, 50.0, 77.0, 87.0, 105.0, 159.0, 245.0, 330.0, 473.0, 607.0, 553.0, 352.0, 214.0, 162.0, 126.0, 90.0, 57.0, 54.0, 34.0, 24.0, 24.0, 19.0, 11.0, 14.0, 11.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.26953125, -5.08502197265625, -4.9005126953125, -4.71600341796875, -4.531494140625, -4.34698486328125, -4.1624755859375, -3.97796630859375, -3.79345703125, -3.60894775390625, -3.4244384765625, -3.23992919921875, -3.055419921875, -2.87091064453125, -2.6864013671875, -2.50189208984375, -2.3173828125, -2.13287353515625, -1.9483642578125, -1.76385498046875, -1.579345703125, -1.39483642578125, -1.2103271484375, -1.02581787109375, -0.84130859375, -0.65679931640625, -0.4722900390625, -0.28778076171875, -0.103271484375, 0.08123779296875, 0.2657470703125, 0.45025634765625, 0.634765625, 0.81927490234375, 1.0037841796875, 1.18829345703125, 1.372802734375, 1.55731201171875, 1.7418212890625, 1.92633056640625, 2.11083984375, 2.29534912109375, 2.4798583984375, 2.66436767578125, 2.848876953125, 3.03338623046875, 3.2178955078125, 3.40240478515625, 3.5869140625, 3.77142333984375, 3.9559326171875, 4.14044189453125, 4.324951171875, 4.50946044921875, 4.6939697265625, 4.87847900390625, 5.06298828125, 5.24749755859375, 5.4320068359375, 5.61651611328125, 5.801025390625, 5.98553466796875, 6.1700439453125, 6.35455322265625, 6.5390625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 5.0, 5.0, 11.0, 7.0, 12.0, 13.0, 8.0, 15.0, 24.0, 27.0, 26.0, 44.0, 39.0, 55.0, 117.0, 258.0, 925.0, 11272.0, 487914.0, 3638439.0, 51561.0, 2545.0, 451.0, 162.0, 73.0, 62.0, 44.0, 36.0, 30.0, 17.0, 15.0, 14.0, 14.0, 11.0, 8.0, 12.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.421875, -29.604736328125, -28.78759765625, -27.970458984375, -27.1533203125, -26.336181640625, -25.51904296875, -24.701904296875, -23.884765625, -23.067626953125, -22.25048828125, -21.433349609375, -20.6162109375, -19.799072265625, -18.98193359375, -18.164794921875, -17.34765625, -16.530517578125, -15.71337890625, -14.896240234375, -14.0791015625, -13.261962890625, -12.44482421875, -11.627685546875, -10.810546875, -9.993408203125, -9.17626953125, -8.359130859375, -7.5419921875, -6.724853515625, -5.90771484375, -5.090576171875, -4.2734375, -3.456298828125, -2.63916015625, -1.822021484375, -1.0048828125, -0.187744140625, 0.62939453125, 1.446533203125, 2.263671875, 3.080810546875, 3.89794921875, 4.715087890625, 5.5322265625, 6.349365234375, 7.16650390625, 7.983642578125, 8.80078125, 9.617919921875, 10.43505859375, 11.252197265625, 12.0693359375, 12.886474609375, 13.70361328125, 14.520751953125, 15.337890625, 16.155029296875, 16.97216796875, 17.789306640625, 18.6064453125, 19.423583984375, 20.24072265625, 21.057861328125, 21.875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 11.0, 114.0, 447.0, 343.0, 94.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.72113037109375, -27.287437438964844, -23.853742599487305, -20.420047760009766, -16.98635482788086, -13.552661895751953, -10.118967056274414, -6.685272216796875, -3.2515792846679688, 0.1821146011352539, 3.6158084869384766, 7.049502372741699, 10.483196258544922, 13.916889190673828, 17.350584030151367, 20.784278869628906, 24.217971801757812, 27.65166473388672, 31.085359573364258, 34.5190544128418, 37.9527473449707, 41.38644027709961, 44.82013702392578, 48.25382995605469, 51.687522888183594, 55.1212158203125, 58.554908752441406, 61.98860549926758, 65.42230224609375, 68.85598754882812, 72.28968811035156, 75.72338104248047, 79.15707397460938, 82.59076690673828, 86.02445983886719, 89.4581527709961, 92.891845703125, 96.32554626464844, 99.75923919677734, 103.19293212890625, 106.62662506103516, 110.06031799316406, 113.49401092529297, 116.92770385742188, 120.36140441894531, 123.79508972167969, 127.22879028320312, 130.6624755859375, 134.09617614746094, 137.52987670898438, 140.96356201171875, 144.3972625732422, 147.83094787597656, 151.2646484375, 154.69833374023438, 158.1320343017578, 161.56573486328125, 164.9994354248047, 168.43312072753906, 171.8668212890625, 175.30050659179688, 178.7342071533203, 182.1678924560547, 185.60159301757812, 189.0352783203125]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 2.0, 3.0, 7.0, 13.0, 11.0, 15.0, 19.0, 17.0, 20.0, 17.0, 32.0, 40.0, 29.0, 48.0, 35.0, 45.0, 41.0, 32.0, 38.0, 56.0, 43.0, 36.0, 49.0, 48.0, 32.0, 35.0, 23.0, 27.0, 32.0, 29.0, 22.0, 21.0, 16.0, 16.0, 6.0, 16.0, 8.0, 5.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.727737426757812, -20.0755615234375, -19.423385620117188, -18.771209716796875, -18.119033813476562, -17.46685791015625, -16.814682006835938, -16.162506103515625, -15.510330200195312, -14.858154296875, -14.205978393554688, -13.553802490234375, -12.901626586914062, -12.24945068359375, -11.597274780273438, -10.945098876953125, -10.292922973632812, -9.6407470703125, -8.988571166992188, -8.336395263671875, -7.6842193603515625, -7.03204345703125, -6.3798675537109375, -5.727691650390625, -5.0755157470703125, -4.42333984375, -3.7711639404296875, -3.118988037109375, -2.4668121337890625, -1.81463623046875, -1.1624603271484375, -0.510284423828125, 0.1418895721435547, 0.7940654754638672, 1.4462413787841797, 2.098417282104492, 2.7505931854248047, 3.402769088745117, 4.05494499206543, 4.707120895385742, 5.359296798706055, 6.011472702026367, 6.66364860534668, 7.315824508666992, 7.968000411987305, 8.620176315307617, 9.27235221862793, 9.924528121948242, 10.576704025268555, 11.228879928588867, 11.88105583190918, 12.533231735229492, 13.185407638549805, 13.837583541870117, 14.48975944519043, 15.141935348510742, 15.794111251831055, 16.446287155151367, 17.09846305847168, 17.750638961791992, 18.402814865112305, 19.054990768432617, 19.70716667175293, 20.359342575073242, 21.011518478393555]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 7.0, 4.0, 7.0, 9.0, 15.0, 13.0, 11.0, 24.0, 20.0, 25.0, 32.0, 29.0, 24.0, 30.0, 43.0, 40.0, 56.0, 51.0, 58.0, 41.0, 49.0, 56.0, 35.0, 47.0, 33.0, 37.0, 29.0, 31.0, 25.0, 28.0, 20.0, 17.0, 25.0, 10.0, 6.0, 6.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.30596923828125, -4.1627197265625, -4.01947021484375, -3.876220703125, -3.73297119140625, -3.5897216796875, -3.44647216796875, -3.30322265625, -3.15997314453125, -3.0167236328125, -2.87347412109375, -2.730224609375, -2.58697509765625, -2.4437255859375, -2.30047607421875, -2.1572265625, -2.01397705078125, -1.8707275390625, -1.72747802734375, -1.584228515625, -1.44097900390625, -1.2977294921875, -1.15447998046875, -1.01123046875, -0.86798095703125, -0.7247314453125, -0.58148193359375, -0.438232421875, -0.29498291015625, -0.1517333984375, -0.00848388671875, 0.134765625, 0.27801513671875, 0.4212646484375, 0.56451416015625, 0.707763671875, 0.85101318359375, 0.9942626953125, 1.13751220703125, 1.28076171875, 1.42401123046875, 1.5672607421875, 1.71051025390625, 1.853759765625, 1.99700927734375, 2.1402587890625, 2.28350830078125, 2.4267578125, 2.57000732421875, 2.7132568359375, 2.85650634765625, 2.999755859375, 3.14300537109375, 3.2862548828125, 3.42950439453125, 3.57275390625, 3.71600341796875, 3.8592529296875, 4.00250244140625, 4.145751953125, 4.28900146484375, 4.4322509765625, 4.57550048828125, 4.71875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 9.0, 2.0, 11.0, 13.0, 25.0, 42.0, 42.0, 70.0, 107.0, 176.0, 250.0, 425.0, 666.0, 1018.0, 1805.0, 3108.0, 5240.0, 8930.0, 15730.0, 27060.0, 47339.0, 92936.0, 244275.0, 344691.0, 120125.0, 57798.0, 32042.0, 18570.0, 10673.0, 6211.0, 3529.0, 2168.0, 1309.0, 783.0, 499.0, 321.0, 210.0, 116.0, 80.0, 48.0, 39.0, 20.0, 22.0, 7.0, 11.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029083251953125, -0.028149843215942383, -0.027216434478759766, -0.02628302574157715, -0.02534961700439453, -0.024416208267211914, -0.023482799530029297, -0.02254939079284668, -0.021615982055664062, -0.020682573318481445, -0.019749164581298828, -0.01881575584411621, -0.017882347106933594, -0.016948938369750977, -0.01601552963256836, -0.015082120895385742, -0.014148712158203125, -0.013215303421020508, -0.01228189468383789, -0.011348485946655273, -0.010415077209472656, -0.009481668472290039, -0.008548259735107422, -0.007614850997924805, -0.0066814422607421875, -0.00574803352355957, -0.004814624786376953, -0.003881216049194336, -0.0029478073120117188, -0.0020143985748291016, -0.0010809898376464844, -0.0001475811004638672, 0.00078582763671875, 0.0017192363739013672, 0.0026526451110839844, 0.0035860538482666016, 0.004519462585449219, 0.005452871322631836, 0.006386280059814453, 0.00731968879699707, 0.008253097534179688, 0.009186506271362305, 0.010119915008544922, 0.011053323745727539, 0.011986732482910156, 0.012920141220092773, 0.01385354995727539, 0.014786958694458008, 0.015720367431640625, 0.016653776168823242, 0.01758718490600586, 0.018520593643188477, 0.019454002380371094, 0.02038741111755371, 0.021320819854736328, 0.022254228591918945, 0.023187637329101562, 0.02412104606628418, 0.025054454803466797, 0.025987863540649414, 0.02692127227783203, 0.02785468101501465, 0.028788089752197266, 0.029721498489379883, 0.0306549072265625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 13.0, 14.0, 11.0, 12.0, 12.0, 15.0, 15.0, 15.0, 14.0, 24.0, 31.0, 16.0, 30.0, 28.0, 36.0, 22.0, 42.0, 41.0, 34.0, 28.0, 1075.0, 29.0, 35.0, 45.0, 42.0, 38.0, 29.0, 25.0, 33.0, 29.0, 20.0, 18.0, 25.0, 17.0, 13.0, 18.0, 15.0, 8.0, 12.0, 7.0, 9.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.453125, -2.375396728515625, -2.29766845703125, -2.219940185546875, -2.1422119140625, -2.064483642578125, -1.98675537109375, -1.909027099609375, -1.831298828125, -1.753570556640625, -1.67584228515625, -1.598114013671875, -1.5203857421875, -1.442657470703125, -1.36492919921875, -1.287200927734375, -1.20947265625, -1.131744384765625, -1.05401611328125, -0.976287841796875, -0.8985595703125, -0.820831298828125, -0.74310302734375, -0.665374755859375, -0.587646484375, -0.509918212890625, -0.43218994140625, -0.354461669921875, -0.2767333984375, -0.199005126953125, -0.12127685546875, -0.043548583984375, 0.0341796875, 0.111907958984375, 0.18963623046875, 0.267364501953125, 0.3450927734375, 0.422821044921875, 0.50054931640625, 0.578277587890625, 0.656005859375, 0.733734130859375, 0.81146240234375, 0.889190673828125, 0.9669189453125, 1.044647216796875, 1.12237548828125, 1.200103759765625, 1.27783203125, 1.355560302734375, 1.43328857421875, 1.511016845703125, 1.5887451171875, 1.666473388671875, 1.74420166015625, 1.821929931640625, 1.899658203125, 1.977386474609375, 2.05511474609375, 2.132843017578125, 2.2105712890625, 2.288299560546875, 2.36602783203125, 2.443756103515625, 2.521484375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 7.0, 9.0, 24.0, 44.0, 43.0, 78.0, 126.0, 166.0, 249.0, 350.0, 542.0, 864.0, 1233.0, 1739.0, 2597.0, 3975.0, 5844.0, 8817.0, 13572.0, 20499.0, 31746.0, 50160.0, 85867.0, 173841.0, 1339521.0, 147214.0, 76879.0, 45936.0, 29106.0, 18932.0, 12415.0, 8157.0, 5528.0, 3621.0, 2484.0, 1632.0, 1116.0, 767.0, 495.0, 291.0, 190.0, 134.0, 109.0, 77.0, 47.0, 34.0, 14.0, 15.0, 9.0, 5.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.0153961181640625, -0.014920949935913086, -0.014445781707763672, -0.013970613479614258, -0.013495445251464844, -0.01302027702331543, -0.012545108795166016, -0.012069940567016602, -0.011594772338867188, -0.011119604110717773, -0.01064443588256836, -0.010169267654418945, -0.009694099426269531, -0.009218931198120117, -0.008743762969970703, -0.008268594741821289, -0.007793426513671875, -0.007318258285522461, -0.006843090057373047, -0.006367921829223633, -0.005892753601074219, -0.005417585372924805, -0.004942417144775391, -0.0044672489166259766, -0.0039920806884765625, -0.0035169124603271484, -0.0030417442321777344, -0.0025665760040283203, -0.0020914077758789062, -0.0016162395477294922, -0.0011410713195800781, -0.0006659030914306641, -0.00019073486328125, 0.00028443336486816406, 0.0007596015930175781, 0.0012347698211669922, 0.0017099380493164062, 0.0021851062774658203, 0.0026602745056152344, 0.0031354427337646484, 0.0036106109619140625, 0.0040857791900634766, 0.004560947418212891, 0.005036115646362305, 0.005511283874511719, 0.005986452102661133, 0.006461620330810547, 0.006936788558959961, 0.007411956787109375, 0.007887125015258789, 0.008362293243408203, 0.008837461471557617, 0.009312629699707031, 0.009787797927856445, 0.01026296615600586, 0.010738134384155273, 0.011213302612304688, 0.011688470840454102, 0.012163639068603516, 0.01263880729675293, 0.013113975524902344, 0.013589143753051758, 0.014064311981201172, 0.014539480209350586, 0.0150146484375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 200.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 467.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 193.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-07, -2.300366759300232e-07, -2.2165477275848389e-07, -2.1327286958694458e-07, -2.0489096641540527e-07, -1.9650906324386597e-07, -1.8812716007232666e-07, -1.7974525690078735e-07, -1.7136335372924805e-07, -1.6298145055770874e-07, -1.5459954738616943e-07, -1.4621764421463013e-07, -1.3783574104309082e-07, -1.2945383787155151e-07, -1.210719347000122e-07, -1.126900315284729e-07, -1.043081283569336e-07, -9.592622518539429e-08, -8.754432201385498e-08, -7.916241884231567e-08, -7.078051567077637e-08, -6.239861249923706e-08, -5.4016709327697754e-08, -4.563480615615845e-08, -3.725290298461914e-08, -2.8870999813079834e-08, -2.0489096641540527e-08, -1.210719347000122e-08, -3.725290298461914e-09, 4.6566128730773926e-09, 1.30385160446167e-08, 2.1420419216156006e-08, 2.9802322387695312e-08, 3.818422555923462e-08, 4.6566128730773926e-08, 5.494803190231323e-08, 6.332993507385254e-08, 7.171183824539185e-08, 8.009374141693115e-08, 8.847564458847046e-08, 9.685754776000977e-08, 1.0523945093154907e-07, 1.1362135410308838e-07, 1.2200325727462769e-07, 1.30385160446167e-07, 1.387670636177063e-07, 1.471489667892456e-07, 1.555308699607849e-07, 1.6391277313232422e-07, 1.7229467630386353e-07, 1.8067657947540283e-07, 1.8905848264694214e-07, 1.9744038581848145e-07, 2.0582228899002075e-07, 2.1420419216156006e-07, 2.2258609533309937e-07, 2.3096799850463867e-07, 2.39349901676178e-07, 2.477318048477173e-07, 2.561137080192566e-07, 2.644956111907959e-07, 2.728775143623352e-07, 2.812594175338745e-07, 2.896413207054138e-07, 2.980232238769531e-07]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 3.0, 9.0, 5.0, 4.0, 0.0, 0.0, 6.0, 28.0, 28.0, 3.0, 12.0, 5.0, 33.0, 18.0, 58.0, 96.0, 32.0, 119.0, 212.0, 172.0, 459.0, 3369.0, 145920.0, 893308.0, 3341.0, 464.0, 123.0, 196.0, 167.0, 50.0, 78.0, 74.0, 30.0, 40.0, 7.0, 9.0, 6.0, 17.0, 35.0, 4.0, 6.0, 2.0, 0.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.781650543212891e-06, -5.616806447505951e-06, -5.451962351799011e-06, -5.2871182560920715e-06, -5.122274160385132e-06, -4.957430064678192e-06, -4.7925859689712524e-06, -4.627741873264313e-06, -4.462897777557373e-06, -4.298053681850433e-06, -4.133209586143494e-06, -3.968365490436554e-06, -3.8035213947296143e-06, -3.6386772990226746e-06, -3.473833203315735e-06, -3.308989107608795e-06, -3.1441450119018555e-06, -2.9793009161949158e-06, -2.814456820487976e-06, -2.6496127247810364e-06, -2.4847686290740967e-06, -2.319924533367157e-06, -2.1550804376602173e-06, -1.9902363419532776e-06, -1.8253922462463379e-06, -1.6605481505393982e-06, -1.4957040548324585e-06, -1.3308599591255188e-06, -1.166015863418579e-06, -1.0011717677116394e-06, -8.363276720046997e-07, -6.7148357629776e-07, -5.066394805908203e-07, -3.417953848838806e-07, -1.7695128917694092e-07, -1.210719347000122e-08, 1.5273690223693848e-07, 3.175809979438782e-07, 4.824250936508179e-07, 6.472691893577576e-07, 8.121132850646973e-07, 9.76957380771637e-07, 1.1418014764785767e-06, 1.3066455721855164e-06, 1.471489667892456e-06, 1.6363337635993958e-06, 1.8011778593063354e-06, 1.966021955013275e-06, 2.130866050720215e-06, 2.2957101464271545e-06, 2.4605542421340942e-06, 2.625398337841034e-06, 2.7902424335479736e-06, 2.9550865292549133e-06, 3.119930624961853e-06, 3.2847747206687927e-06, 3.4496188163757324e-06, 3.614462912082672e-06, 3.779307007789612e-06, 3.9441511034965515e-06, 4.108995199203491e-06, 4.273839294910431e-06, 4.438683390617371e-06, 4.60352748632431e-06, 4.76837158203125e-06]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 8.0, 10.0, 18.0, 15.0, 13.0, 26.0, 756.0, 25.0, 26.0, 22.0, 26.0, 13.0, 10.0, 6.0, 6.0, 3.0, 9.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6370029243262252e-07, -1.5685598953041335e-07, -1.500117008390589e-07, -1.4316739793684974e-07, -1.363231092454953e-07, -1.2947880634328612e-07, -1.2263450344107696e-07, -1.1579021474972251e-07, -1.089459189529407e-07, -1.021016231561589e-07, -9.525732735937709e-08, -8.841303156259528e-08, -8.156872866038611e-08, -7.472443996903166e-08, -6.78801370668225e-08, -6.103584127004069e-08, -5.4191545473258884e-08, -4.734724967647708e-08, -4.050295387969527e-08, -3.365865453019978e-08, -2.6814358733417976e-08, -1.9970062936636168e-08, -1.3125763587140682e-08, -6.2814677903588745e-09, 5.62828006422933e-10, 7.40712469138316e-09, 1.4251421376343387e-08, 2.1095718949482034e-08, 2.794001474626384e-08, 3.478431054304565e-08, 4.1628609892541135e-08, 4.847290568932294e-08, 5.531720148610475e-08, 6.216149728288656e-08, 6.900579307966836e-08, 7.585009598187753e-08, 8.269438467323198e-08, 8.953868757544114e-08, 9.638298337222295e-08, 1.0322727916900476e-07, 1.1007157496578657e-07, 1.1691587076256837e-07, 1.2376017366477754e-07, 1.30604462356132e-07, 1.3744876525834115e-07, 1.442930539496956e-07, 1.5113735685190477e-07, 1.5798164554325922e-07, 1.6482594844546838e-07, 1.7167025134767755e-07, 1.78514540039032e-07, 1.8535884294124116e-07, 1.9220313163259561e-07, 1.9904743453480478e-07, 2.0589172322615923e-07, 2.127360261283684e-07, 2.1958032903057756e-07, 2.2642463193278672e-07, 2.3326892062414117e-07, 2.4011322352635034e-07, 2.469575122177048e-07, 2.5380180090905924e-07, 2.606461180221231e-07, 2.6749040671347757e-07, 2.74334695404832e-07]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 127.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 736.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 129.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1920928955078125e-07, -1.1455267667770386e-07, -1.0989606380462646e-07, -1.0523945093154907e-07, -1.0058283805847168e-07, -9.592622518539429e-08, -9.12696123123169e-08, -8.66129994392395e-08, -8.195638656616211e-08, -7.729977369308472e-08, -7.264316082000732e-08, -6.798654794692993e-08, -6.332993507385254e-08, -5.8673322200775146e-08, -5.4016709327697754e-08, -4.936009645462036e-08, -4.470348358154297e-08, -4.0046870708465576e-08, -3.5390257835388184e-08, -3.073364496231079e-08, -2.60770320892334e-08, -2.1420419216156006e-08, -1.6763806343078613e-08, -1.210719347000122e-08, -7.450580596923828e-09, -2.7939677238464355e-09, 1.862645149230957e-09, 6.51925802230835e-09, 1.1175870895385742e-08, 1.5832483768463135e-08, 2.0489096641540527e-08, 2.514570951461792e-08, 2.9802322387695312e-08, 3.4458935260772705e-08, 3.91155481338501e-08, 4.377216100692749e-08, 4.842877388000488e-08, 5.3085386753082275e-08, 5.774199962615967e-08, 6.239861249923706e-08, 6.705522537231445e-08, 7.171183824539185e-08, 7.636845111846924e-08, 8.102506399154663e-08, 8.568167686462402e-08, 9.033828973770142e-08, 9.499490261077881e-08, 9.96515154838562e-08, 1.043081283569336e-07, 1.0896474123001099e-07, 1.1362135410308838e-07, 1.1827796697616577e-07, 1.2293457984924316e-07, 1.2759119272232056e-07, 1.3224780559539795e-07, 1.3690441846847534e-07, 1.4156103134155273e-07, 1.4621764421463013e-07, 1.5087425708770752e-07, 1.555308699607849e-07, 1.601874828338623e-07, 1.648440957069397e-07, 1.695007085800171e-07, 1.7415732145309448e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 7.0, 4.0, 7.0, 9.0, 15.0, 13.0, 11.0, 24.0, 20.0, 25.0, 32.0, 29.0, 24.0, 30.0, 43.0, 40.0, 56.0, 51.0, 58.0, 41.0, 49.0, 56.0, 35.0, 47.0, 33.0, 37.0, 29.0, 31.0, 25.0, 28.0, 20.0, 17.0, 25.0, 10.0, 6.0, 6.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.30596923828125, -4.1627197265625, -4.01947021484375, -3.876220703125, -3.73297119140625, -3.5897216796875, -3.44647216796875, -3.30322265625, -3.15997314453125, -3.0167236328125, -2.87347412109375, -2.730224609375, -2.58697509765625, -2.4437255859375, -2.30047607421875, -2.1572265625, -2.01397705078125, -1.8707275390625, -1.72747802734375, -1.584228515625, -1.44097900390625, -1.2977294921875, -1.15447998046875, -1.01123046875, -0.86798095703125, -0.7247314453125, -0.58148193359375, -0.438232421875, -0.29498291015625, -0.1517333984375, -0.00848388671875, 0.134765625, 0.27801513671875, 0.4212646484375, 0.56451416015625, 0.707763671875, 0.85101318359375, 0.9942626953125, 1.13751220703125, 1.28076171875, 1.42401123046875, 1.5672607421875, 1.71051025390625, 1.853759765625, 1.99700927734375, 2.1402587890625, 2.28350830078125, 2.4267578125, 2.57000732421875, 2.7132568359375, 2.85650634765625, 2.999755859375, 3.14300537109375, 3.2862548828125, 3.42950439453125, 3.57275390625, 3.71600341796875, 3.8592529296875, 4.00250244140625, 4.145751953125, 4.28900146484375, 4.4322509765625, 4.57550048828125, 4.71875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 13.0, 8.0, 15.0, 19.0, 25.0, 48.0, 57.0, 81.0, 129.0, 193.0, 289.0, 363.0, 564.0, 823.0, 1272.0, 2126.0, 3418.0, 6139.0, 11013.0, 21808.0, 45896.0, 110402.0, 324522.0, 318895.0, 107943.0, 44931.0, 21308.0, 10836.0, 5923.0, 3444.0, 2078.0, 1395.0, 802.0, 563.0, 411.0, 248.0, 188.0, 98.0, 85.0, 50.0, 40.0, 28.0, 16.0, 12.0, 8.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-5.22265625, -5.05938720703125, -4.8961181640625, -4.73284912109375, -4.569580078125, -4.40631103515625, -4.2430419921875, -4.07977294921875, -3.91650390625, -3.75323486328125, -3.5899658203125, -3.42669677734375, -3.263427734375, -3.10015869140625, -2.9368896484375, -2.77362060546875, -2.6103515625, -2.44708251953125, -2.2838134765625, -2.12054443359375, -1.957275390625, -1.79400634765625, -1.6307373046875, -1.46746826171875, -1.30419921875, -1.14093017578125, -0.9776611328125, -0.81439208984375, -0.651123046875, -0.48785400390625, -0.3245849609375, -0.16131591796875, 0.001953125, 0.16522216796875, 0.3284912109375, 0.49176025390625, 0.655029296875, 0.81829833984375, 0.9815673828125, 1.14483642578125, 1.30810546875, 1.47137451171875, 1.6346435546875, 1.79791259765625, 1.961181640625, 2.12445068359375, 2.2877197265625, 2.45098876953125, 2.6142578125, 2.77752685546875, 2.9407958984375, 3.10406494140625, 3.267333984375, 3.43060302734375, 3.5938720703125, 3.75714111328125, 3.92041015625, 4.08367919921875, 4.2469482421875, 4.41021728515625, 4.573486328125, 4.73675537109375, 4.9000244140625, 5.06329345703125, 5.2265625]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 5.0, 12.0, 14.0, 14.0, 21.0, 27.0, 26.0, 41.0, 40.0, 52.0, 69.0, 78.0, 130.0, 290.0, 1539.0, 207.0, 109.0, 69.0, 56.0, 44.0, 41.0, 31.0, 28.0, 22.0, 22.0, 16.0, 9.0, 13.0, 3.0, 3.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.8046875, -13.41357421875, -13.0224609375, -12.63134765625, -12.240234375, -11.84912109375, -11.4580078125, -11.06689453125, -10.67578125, -10.28466796875, -9.8935546875, -9.50244140625, -9.111328125, -8.72021484375, -8.3291015625, -7.93798828125, -7.546875, -7.15576171875, -6.7646484375, -6.37353515625, -5.982421875, -5.59130859375, -5.2001953125, -4.80908203125, -4.41796875, -4.02685546875, -3.6357421875, -3.24462890625, -2.853515625, -2.46240234375, -2.0712890625, -1.68017578125, -1.2890625, -0.89794921875, -0.5068359375, -0.11572265625, 0.275390625, 0.66650390625, 1.0576171875, 1.44873046875, 1.83984375, 2.23095703125, 2.6220703125, 3.01318359375, 3.404296875, 3.79541015625, 4.1865234375, 4.57763671875, 4.96875, 5.35986328125, 5.7509765625, 6.14208984375, 6.533203125, 6.92431640625, 7.3154296875, 7.70654296875, 8.09765625, 8.48876953125, 8.8798828125, 9.27099609375, 9.662109375, 10.05322265625, 10.4443359375, 10.83544921875, 11.2265625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 9.0, 7.0, 7.0, 18.0, 23.0, 35.0, 75.0, 110.0, 174.0, 333.0, 934.0, 12484.0, 3113947.0, 15693.0, 996.0, 386.0, 168.0, 104.0, 62.0, 38.0, 27.0, 12.0, 12.0, 9.0, 8.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.8125, -42.54345703125, -41.2744140625, -40.00537109375, -38.736328125, -37.46728515625, -36.1982421875, -34.92919921875, -33.66015625, -32.39111328125, -31.1220703125, -29.85302734375, -28.583984375, -27.31494140625, -26.0458984375, -24.77685546875, -23.5078125, -22.23876953125, -20.9697265625, -19.70068359375, -18.431640625, -17.16259765625, -15.8935546875, -14.62451171875, -13.35546875, -12.08642578125, -10.8173828125, -9.54833984375, -8.279296875, -7.01025390625, -5.7412109375, -4.47216796875, -3.203125, -1.93408203125, -0.6650390625, 0.60400390625, 1.873046875, 3.14208984375, 4.4111328125, 5.68017578125, 6.94921875, 8.21826171875, 9.4873046875, 10.75634765625, 12.025390625, 13.29443359375, 14.5634765625, 15.83251953125, 17.1015625, 18.37060546875, 19.6396484375, 20.90869140625, 22.177734375, 23.44677734375, 24.7158203125, 25.98486328125, 27.25390625, 28.52294921875, 29.7919921875, 31.06103515625, 32.330078125, 33.59912109375, 34.8681640625, 36.13720703125, 37.40625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 49.0, 281.0, 427.0, 204.0, 39.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.09678268432617, -43.83516311645508, -41.57353973388672, -39.311920166015625, -37.05030059814453, -34.78867721557617, -32.52705764770508, -30.26543617248535, -28.003814697265625, -25.7421932220459, -23.480571746826172, -21.218952178955078, -18.95733070373535, -16.695709228515625, -14.434088706970215, -12.172468185424805, -9.910846710205078, -7.64922571182251, -5.387604713439941, -3.125983715057373, -0.8643627166748047, 1.3972587585449219, 3.658879280090332, 5.920499801635742, 8.182121276855469, 10.443742752075195, 12.705363273620605, 14.966983795166016, 17.228605270385742, 19.49022674560547, 21.751846313476562, 24.01346778869629, 26.27508544921875, 28.536706924438477, 30.798328399658203, 33.0599479675293, 35.321571350097656, 37.58319091796875, 39.844810485839844, 42.10643005371094, 44.3680534362793, 46.62967300415039, 48.89129638671875, 51.152915954589844, 53.41453552246094, 55.6761589050293, 57.93777847290039, 60.19940185546875, 62.461021423339844, 64.72264099121094, 66.98426055908203, 69.24588775634766, 71.50750732421875, 73.76912689208984, 76.03074645996094, 78.29236602783203, 80.55398559570312, 82.81560516357422, 85.07722473144531, 87.33885192871094, 89.60047149658203, 91.86209106445312, 94.12371063232422, 96.38533020019531, 98.64695739746094]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 5.0, 13.0, 10.0, 6.0, 7.0, 11.0, 14.0, 21.0, 18.0, 21.0, 26.0, 30.0, 26.0, 33.0, 27.0, 33.0, 35.0, 33.0, 45.0, 44.0, 39.0, 40.0, 37.0, 49.0, 25.0, 42.0, 37.0, 28.0, 33.0, 31.0, 23.0, 25.0, 18.0, 26.0, 12.0, 11.0, 19.0, 12.0, 6.0, 8.0, 4.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.42755889892578, -23.595754623413086, -22.763952255249023, -21.932147979736328, -21.100343704223633, -20.268539428710938, -19.436737060546875, -18.60493278503418, -17.773128509521484, -16.94132423400879, -16.109521865844727, -15.277717590332031, -14.445913314819336, -13.614109992980957, -12.782306671142578, -11.950502395629883, -11.11870002746582, -10.286896705627441, -9.455092430114746, -8.623289108276367, -7.79148530960083, -6.959681510925293, -6.127878189086914, -5.296074390411377, -4.46427059173584, -3.6324667930603027, -2.8006632328033447, -1.9688596725463867, -1.1370558738708496, -0.3052520751953125, 0.5265512466430664, 1.3583550453186035, 2.1901588439941406, 3.0219626426696777, 3.8537662029266357, 4.685569763183594, 5.517373561859131, 6.349177360534668, 7.180980682373047, 8.012784957885742, 8.844588279724121, 9.6763916015625, 10.508195877075195, 11.339999198913574, 12.171802520751953, 13.003606796264648, 13.835410118103027, 14.667213439941406, 15.499017715454102, 16.330821990966797, 17.16262435913086, 17.994428634643555, 18.82623291015625, 19.658035278320312, 20.489839553833008, 21.321643829345703, 22.153446197509766, 22.98525047302246, 23.817052841186523, 24.64885711669922, 25.480661392211914, 26.31246566772461, 27.144268035888672, 27.976072311401367, 28.807876586914062]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 7.0, 5.0, 11.0, 14.0, 9.0, 12.0, 15.0, 19.0, 26.0, 19.0, 27.0, 33.0, 34.0, 37.0, 41.0, 41.0, 49.0, 35.0, 64.0, 45.0, 53.0, 62.0, 36.0, 39.0, 33.0, 42.0, 31.0, 30.0, 21.0, 21.0, 22.0, 10.0, 16.0, 11.0, 12.0, 6.0, 7.0, 3.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.14453125, -4.000732421875, -3.85693359375, -3.713134765625, -3.5693359375, -3.425537109375, -3.28173828125, -3.137939453125, -2.994140625, -2.850341796875, -2.70654296875, -2.562744140625, -2.4189453125, -2.275146484375, -2.13134765625, -1.987548828125, -1.84375, -1.699951171875, -1.55615234375, -1.412353515625, -1.2685546875, -1.124755859375, -0.98095703125, -0.837158203125, -0.693359375, -0.549560546875, -0.40576171875, -0.261962890625, -0.1181640625, 0.025634765625, 0.16943359375, 0.313232421875, 0.45703125, 0.600830078125, 0.74462890625, 0.888427734375, 1.0322265625, 1.176025390625, 1.31982421875, 1.463623046875, 1.607421875, 1.751220703125, 1.89501953125, 2.038818359375, 2.1826171875, 2.326416015625, 2.47021484375, 2.614013671875, 2.7578125, 2.901611328125, 3.04541015625, 3.189208984375, 3.3330078125, 3.476806640625, 3.62060546875, 3.764404296875, 3.908203125, 4.052001953125, 4.19580078125, 4.339599609375, 4.4833984375, 4.627197265625, 4.77099609375, 4.914794921875, 5.05859375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 2.0, 9.0, 14.0, 15.0, 21.0, 28.0, 41.0, 53.0, 63.0, 95.0, 144.0, 209.0, 374.0, 636.0, 1074.0, 2201.0, 4731.0, 12942.0, 52142.0, 429107.0, 2463962.0, 1074655.0, 116463.0, 21732.0, 7087.0, 2996.0, 1362.0, 774.0, 455.0, 284.0, 187.0, 118.0, 69.0, 55.0, 48.0, 33.0, 20.0, 19.0, 14.0, 14.0, 6.0, 5.0, 10.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.703125, -7.44384765625, -7.1845703125, -6.92529296875, -6.666015625, -6.40673828125, -6.1474609375, -5.88818359375, -5.62890625, -5.36962890625, -5.1103515625, -4.85107421875, -4.591796875, -4.33251953125, -4.0732421875, -3.81396484375, -3.5546875, -3.29541015625, -3.0361328125, -2.77685546875, -2.517578125, -2.25830078125, -1.9990234375, -1.73974609375, -1.48046875, -1.22119140625, -0.9619140625, -0.70263671875, -0.443359375, -0.18408203125, 0.0751953125, 0.33447265625, 0.59375, 0.85302734375, 1.1123046875, 1.37158203125, 1.630859375, 1.89013671875, 2.1494140625, 2.40869140625, 2.66796875, 2.92724609375, 3.1865234375, 3.44580078125, 3.705078125, 3.96435546875, 4.2236328125, 4.48291015625, 4.7421875, 5.00146484375, 5.2607421875, 5.52001953125, 5.779296875, 6.03857421875, 6.2978515625, 6.55712890625, 6.81640625, 7.07568359375, 7.3349609375, 7.59423828125, 7.853515625, 8.11279296875, 8.3720703125, 8.63134765625, 8.890625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 7.0, 2.0, 5.0, 11.0, 12.0, 13.0, 19.0, 18.0, 32.0, 43.0, 37.0, 64.0, 81.0, 79.0, 128.0, 170.0, 191.0, 254.0, 309.0, 413.0, 417.0, 385.0, 317.0, 230.0, 155.0, 155.0, 96.0, 92.0, 67.0, 50.0, 42.0, 44.0, 37.0, 22.0, 13.0, 18.0, 14.0, 8.0, 9.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.11737060546875, -4.9534912109375, -4.78961181640625, -4.625732421875, -4.46185302734375, -4.2979736328125, -4.13409423828125, -3.97021484375, -3.80633544921875, -3.6424560546875, -3.47857666015625, -3.314697265625, -3.15081787109375, -2.9869384765625, -2.82305908203125, -2.6591796875, -2.49530029296875, -2.3314208984375, -2.16754150390625, -2.003662109375, -1.83978271484375, -1.6759033203125, -1.51202392578125, -1.34814453125, -1.18426513671875, -1.0203857421875, -0.85650634765625, -0.692626953125, -0.52874755859375, -0.3648681640625, -0.20098876953125, -0.037109375, 0.12677001953125, 0.2906494140625, 0.45452880859375, 0.618408203125, 0.78228759765625, 0.9461669921875, 1.11004638671875, 1.27392578125, 1.43780517578125, 1.6016845703125, 1.76556396484375, 1.929443359375, 2.09332275390625, 2.2572021484375, 2.42108154296875, 2.5849609375, 2.74884033203125, 2.9127197265625, 3.07659912109375, 3.240478515625, 3.40435791015625, 3.5682373046875, 3.73211669921875, 3.89599609375, 4.05987548828125, 4.2237548828125, 4.38763427734375, 4.551513671875, 4.71539306640625, 4.8792724609375, 5.04315185546875, 5.20703125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 10.0, 18.0, 16.0, 36.0, 47.0, 70.0, 109.0, 146.0, 221.0, 360.0, 629.0, 1133.0, 2626.0, 7608.0, 34143.0, 221676.0, 2034447.0, 1662905.0, 186803.0, 29618.0, 6825.0, 2275.0, 984.0, 585.0, 337.0, 207.0, 125.0, 95.0, 67.0, 42.0, 20.0, 21.0, 16.0, 13.0, 11.0, 8.0, 4.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.33984375, -7.05706787109375, -6.7742919921875, -6.49151611328125, -6.208740234375, -5.92596435546875, -5.6431884765625, -5.36041259765625, -5.07763671875, -4.79486083984375, -4.5120849609375, -4.22930908203125, -3.946533203125, -3.66375732421875, -3.3809814453125, -3.09820556640625, -2.8154296875, -2.53265380859375, -2.2498779296875, -1.96710205078125, -1.684326171875, -1.40155029296875, -1.1187744140625, -0.83599853515625, -0.55322265625, -0.27044677734375, 0.0123291015625, 0.29510498046875, 0.577880859375, 0.86065673828125, 1.1434326171875, 1.42620849609375, 1.708984375, 1.99176025390625, 2.2745361328125, 2.55731201171875, 2.840087890625, 3.12286376953125, 3.4056396484375, 3.68841552734375, 3.97119140625, 4.25396728515625, 4.5367431640625, 4.81951904296875, 5.102294921875, 5.38507080078125, 5.6678466796875, 5.95062255859375, 6.2333984375, 6.51617431640625, 6.7989501953125, 7.08172607421875, 7.364501953125, 7.64727783203125, 7.9300537109375, 8.21282958984375, 8.49560546875, 8.77838134765625, 9.0611572265625, 9.34393310546875, 9.626708984375, 9.90948486328125, 10.1922607421875, 10.47503662109375, 10.7578125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 43.0, 409.0, 498.0, 61.0, 2.0, 1.0, 2.0], "bins": [-292.6775207519531, -287.7196044921875, -282.76165771484375, -277.8037414550781, -272.8457946777344, -267.88787841796875, -262.929931640625, -257.9720153808594, -253.01406860351562, -248.05613708496094, -243.09820556640625, -238.14027404785156, -233.18234252929688, -228.2244110107422, -223.2664794921875, -218.30856323242188, -213.3506317138672, -208.3927001953125, -203.4347686767578, -198.47683715820312, -193.51890563964844, -188.56097412109375, -183.60304260253906, -178.64511108398438, -173.68719482421875, -168.72926330566406, -163.77133178710938, -158.8134002685547, -153.85546875, -148.8975372314453, -143.93960571289062, -138.981689453125, -134.02374267578125, -129.06581115722656, -124.10787963867188, -119.14994812011719, -114.1920166015625, -109.23408508300781, -104.27616119384766, -99.31822967529297, -94.36029052734375, -89.40235900878906, -84.44442749023438, -79.48649597167969, -74.528564453125, -69.57063293457031, -64.61270904541016, -59.65477752685547, -54.69684600830078, -49.738914489746094, -44.780982971191406, -39.823055267333984, -34.8651237487793, -29.90719223022461, -24.949262619018555, -19.9913330078125, -15.033403396606445, -10.075472831726074, -5.117542266845703, -0.15961170196533203, 4.798318862915039, 9.756250381469727, 14.714179992675781, 19.672109603881836, 24.630041122436523]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 5.0, 5.0, 7.0, 8.0, 14.0, 14.0, 20.0, 19.0, 21.0, 15.0, 27.0, 25.0, 28.0, 35.0, 39.0, 48.0, 64.0, 35.0, 35.0, 47.0, 48.0, 49.0, 46.0, 42.0, 47.0, 34.0, 31.0, 29.0, 27.0, 20.0, 31.0, 17.0, 19.0, 17.0, 16.0, 13.0, 7.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.451316833496094, -28.645355224609375, -27.839391708374023, -27.033430099487305, -26.227468490600586, -25.421504974365234, -24.615543365478516, -23.809581756591797, -23.003620147705078, -22.19765853881836, -21.391695022583008, -20.58573341369629, -19.77977180480957, -18.97380828857422, -18.1678466796875, -17.36188507080078, -16.555923461914062, -15.749960899353027, -14.943999290466309, -14.138036727905273, -13.332075119018555, -12.52611255645752, -11.720149993896484, -10.914188385009766, -10.108224868774414, -9.302262306213379, -8.49630069732666, -7.690338134765625, -6.884376525878906, -6.078413963317871, -5.272451877593994, -4.466489791870117, -3.6605281829833984, -2.8545660972595215, -2.0486040115356445, -1.2426416873931885, -0.4366796016693115, 0.36928272247314453, 1.1752448081970215, 1.9812068939208984, 2.7871689796447754, 3.5931310653686523, 4.399093151092529, 5.205055236816406, 6.011017799377441, 6.816979885101318, 7.622941970825195, 8.428903579711914, 9.23486614227295, 10.040828704833984, 10.846790313720703, 11.652752876281738, 12.458714485168457, 13.264677047729492, 14.070638656616211, 14.876601219177246, 15.682563781738281, 16.488525390625, 17.29448890686035, 18.10045051574707, 18.90641212463379, 19.71237564086914, 20.51833724975586, 21.324298858642578, 22.130260467529297]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 4.0, 7.0, 5.0, 5.0, 13.0, 8.0, 6.0, 15.0, 17.0, 18.0, 21.0, 15.0, 20.0, 27.0, 31.0, 28.0, 32.0, 34.0, 40.0, 31.0, 43.0, 47.0, 48.0, 50.0, 35.0, 37.0, 43.0, 40.0, 35.0, 27.0, 44.0, 18.0, 23.0, 21.0, 21.0, 25.0, 18.0, 7.0, 14.0, 5.0, 9.0, 4.0, 4.0, 7.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.396484375, -3.292022705078125, -3.18756103515625, -3.083099365234375, -2.9786376953125, -2.874176025390625, -2.76971435546875, -2.665252685546875, -2.560791015625, -2.456329345703125, -2.35186767578125, -2.247406005859375, -2.1429443359375, -2.038482666015625, -1.93402099609375, -1.829559326171875, -1.72509765625, -1.620635986328125, -1.51617431640625, -1.411712646484375, -1.3072509765625, -1.202789306640625, -1.09832763671875, -0.993865966796875, -0.889404296875, -0.784942626953125, -0.68048095703125, -0.576019287109375, -0.4715576171875, -0.367095947265625, -0.26263427734375, -0.158172607421875, -0.0537109375, 0.050750732421875, 0.15521240234375, 0.259674072265625, 0.3641357421875, 0.468597412109375, 0.57305908203125, 0.677520751953125, 0.781982421875, 0.886444091796875, 0.99090576171875, 1.095367431640625, 1.1998291015625, 1.304290771484375, 1.40875244140625, 1.513214111328125, 1.61767578125, 1.722137451171875, 1.82659912109375, 1.931060791015625, 2.0355224609375, 2.139984130859375, 2.24444580078125, 2.348907470703125, 2.453369140625, 2.557830810546875, 2.66229248046875, 2.766754150390625, 2.8712158203125, 2.975677490234375, 3.08013916015625, 3.184600830078125, 3.2890625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 12.0, 14.0, 19.0, 27.0, 42.0, 62.0, 85.0, 116.0, 185.0, 243.0, 362.0, 591.0, 816.0, 1223.0, 1803.0, 2725.0, 4216.0, 6717.0, 10286.0, 16616.0, 26882.0, 45928.0, 81924.0, 168388.0, 337297.0, 152923.0, 76635.0, 43126.0, 25343.0, 15656.0, 9800.0, 6378.0, 3998.0, 2671.0, 1747.0, 1200.0, 812.0, 494.0, 381.0, 234.0, 177.0, 118.0, 92.0, 62.0, 37.0, 29.0, 16.0, 19.0, 12.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0198974609375, -0.019264698028564453, -0.018631935119628906, -0.01799917221069336, -0.017366409301757812, -0.016733646392822266, -0.01610088348388672, -0.015468120574951172, -0.014835357666015625, -0.014202594757080078, -0.013569831848144531, -0.012937068939208984, -0.012304306030273438, -0.01167154312133789, -0.011038780212402344, -0.010406017303466797, -0.00977325439453125, -0.009140491485595703, -0.008507728576660156, -0.00787496566772461, -0.0072422027587890625, -0.006609439849853516, -0.005976676940917969, -0.005343914031982422, -0.004711151123046875, -0.004078388214111328, -0.0034456253051757812, -0.0028128623962402344, -0.0021800994873046875, -0.0015473365783691406, -0.0009145736694335938, -0.0002818107604980469, 0.0003509521484375, 0.0009837150573730469, 0.0016164779663085938, 0.0022492408752441406, 0.0028820037841796875, 0.0035147666931152344, 0.004147529602050781, 0.004780292510986328, 0.005413055419921875, 0.006045818328857422, 0.006678581237792969, 0.007311344146728516, 0.007944107055664062, 0.00857686996459961, 0.009209632873535156, 0.009842395782470703, 0.01047515869140625, 0.011107921600341797, 0.011740684509277344, 0.01237344741821289, 0.013006210327148438, 0.013638973236083984, 0.014271736145019531, 0.014904499053955078, 0.015537261962890625, 0.016170024871826172, 0.01680278778076172, 0.017435550689697266, 0.018068313598632812, 0.01870107650756836, 0.019333839416503906, 0.019966602325439453, 0.020599365234375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 8.0, 4.0, 8.0, 8.0, 6.0, 10.0, 18.0, 22.0, 22.0, 20.0, 31.0, 30.0, 37.0, 46.0, 59.0, 46.0, 58.0, 40.0, 1076.0, 46.0, 74.0, 46.0, 50.0, 39.0, 43.0, 23.0, 27.0, 32.0, 24.0, 26.0, 12.0, 13.0, 8.0, 5.0, 5.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.525390625, -2.4327392578125, -2.340087890625, -2.2474365234375, -2.15478515625, -2.0621337890625, -1.969482421875, -1.8768310546875, -1.7841796875, -1.6915283203125, -1.598876953125, -1.5062255859375, -1.41357421875, -1.3209228515625, -1.228271484375, -1.1356201171875, -1.04296875, -0.9503173828125, -0.857666015625, -0.7650146484375, -0.67236328125, -0.5797119140625, -0.487060546875, -0.3944091796875, -0.3017578125, -0.2091064453125, -0.116455078125, -0.0238037109375, 0.06884765625, 0.1614990234375, 0.254150390625, 0.3468017578125, 0.439453125, 0.5321044921875, 0.624755859375, 0.7174072265625, 0.81005859375, 0.9027099609375, 0.995361328125, 1.0880126953125, 1.1806640625, 1.2733154296875, 1.365966796875, 1.4586181640625, 1.55126953125, 1.6439208984375, 1.736572265625, 1.8292236328125, 1.921875, 2.0145263671875, 2.107177734375, 2.1998291015625, 2.29248046875, 2.3851318359375, 2.477783203125, 2.5704345703125, 2.6630859375, 2.7557373046875, 2.848388671875, 2.9410400390625, 3.03369140625, 3.1263427734375, 3.218994140625, 3.3116455078125, 3.404296875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 11.0, 12.0, 26.0, 31.0, 34.0, 72.0, 131.0, 187.0, 310.0, 559.0, 966.0, 1505.0, 2819.0, 4884.0, 9078.0, 16585.0, 31771.0, 63134.0, 143129.0, 1435359.0, 214457.0, 84159.0, 40976.0, 21011.0, 11405.0, 6330.0, 3413.0, 1958.0, 1134.0, 640.0, 428.0, 254.0, 103.0, 80.0, 63.0, 46.0, 23.0, 12.0, 4.0, 11.0, 8.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.020538330078125, -0.019928693771362305, -0.01931905746459961, -0.018709421157836914, -0.01809978485107422, -0.017490148544311523, -0.016880512237548828, -0.016270875930786133, -0.015661239624023438, -0.015051603317260742, -0.014441967010498047, -0.013832330703735352, -0.013222694396972656, -0.012613058090209961, -0.012003421783447266, -0.01139378547668457, -0.010784149169921875, -0.01017451286315918, -0.009564876556396484, -0.008955240249633789, -0.008345603942871094, -0.0077359676361083984, -0.007126331329345703, -0.006516695022583008, -0.0059070587158203125, -0.005297422409057617, -0.004687786102294922, -0.0040781497955322266, -0.0034685134887695312, -0.002858877182006836, -0.0022492408752441406, -0.0016396045684814453, -0.00102996826171875, -0.0004203319549560547, 0.00018930435180664062, 0.0007989406585693359, 0.0014085769653320312, 0.0020182132720947266, 0.002627849578857422, 0.003237485885620117, 0.0038471221923828125, 0.004456758499145508, 0.005066394805908203, 0.0056760311126708984, 0.006285667419433594, 0.006895303726196289, 0.007504940032958984, 0.00811457633972168, 0.008724212646484375, 0.00933384895324707, 0.009943485260009766, 0.010553121566772461, 0.011162757873535156, 0.011772394180297852, 0.012382030487060547, 0.012991666793823242, 0.013601303100585938, 0.014210939407348633, 0.014820575714111328, 0.015430212020874023, 0.01603984832763672, 0.016649484634399414, 0.01725912094116211, 0.017868757247924805, 0.0184783935546875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.0, 0.0, 0.0, 0.0, 0.0, 0.0, 217.0, 0.0, 0.0, 0.0, 0.0, 404.0, 0.0, 0.0, 0.0, 0.0, 0.0, 229.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.0, 0.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.473833203315735e-07, -3.371387720108032e-07, -3.2689422369003296e-07, -3.166496753692627e-07, -3.0640512704849243e-07, -2.9616057872772217e-07, -2.859160304069519e-07, -2.7567148208618164e-07, -2.654269337654114e-07, -2.551823854446411e-07, -2.4493783712387085e-07, -2.3469328880310059e-07, -2.2444874048233032e-07, -2.1420419216156006e-07, -2.039596438407898e-07, -1.9371509552001953e-07, -1.8347054719924927e-07, -1.73225998878479e-07, -1.6298145055770874e-07, -1.5273690223693848e-07, -1.424923539161682e-07, -1.3224780559539795e-07, -1.2200325727462769e-07, -1.1175870895385742e-07, -1.0151416063308716e-07, -9.12696123123169e-08, -8.102506399154663e-08, -7.078051567077637e-08, -6.05359673500061e-08, -5.029141902923584e-08, -4.0046870708465576e-08, -2.9802322387695312e-08, -1.955777406692505e-08, -9.313225746154785e-09, 9.313225746154785e-10, 1.1175870895385742e-08, 2.1420419216156006e-08, 3.166496753692627e-08, 4.190951585769653e-08, 5.21540641784668e-08, 6.239861249923706e-08, 7.264316082000732e-08, 8.288770914077759e-08, 9.313225746154785e-08, 1.0337680578231812e-07, 1.1362135410308838e-07, 1.2386590242385864e-07, 1.341104507446289e-07, 1.4435499906539917e-07, 1.5459954738616943e-07, 1.648440957069397e-07, 1.7508864402770996e-07, 1.8533319234848022e-07, 1.955777406692505e-07, 2.0582228899002075e-07, 2.1606683731079102e-07, 2.2631138563156128e-07, 2.3655593395233154e-07, 2.468004822731018e-07, 2.5704503059387207e-07, 2.6728957891464233e-07, 2.775341272354126e-07, 2.8777867555618286e-07, 2.980232238769531e-07]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 9.0, 10.0, 1.0, 0.0, 6.0, 28.0, 34.0, 17.0, 8.0, 61.0, 21.0, 114.0, 74.0, 135.0, 289.0, 160.0, 577.0, 16222.0, 1012800.0, 16565.0, 542.0, 188.0, 223.0, 126.0, 93.0, 92.0, 39.0, 21.0, 10.0, 6.0, 14.0, 35.0, 3.0, 1.0, 3.0, 6.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.602836608886719e-06, -5.398876965045929e-06, -5.194917321205139e-06, -4.990957677364349e-06, -4.7869980335235596e-06, -4.58303838968277e-06, -4.37907874584198e-06, -4.17511910200119e-06, -3.9711594581604e-06, -3.7671998143196106e-06, -3.563240170478821e-06, -3.359280526638031e-06, -3.155320882797241e-06, -2.9513612389564514e-06, -2.7474015951156616e-06, -2.543441951274872e-06, -2.339482307434082e-06, -2.1355226635932922e-06, -1.9315630197525024e-06, -1.7276033759117126e-06, -1.5236437320709229e-06, -1.319684088230133e-06, -1.1157244443893433e-06, -9.117648005485535e-07, -7.078051567077637e-07, -5.038455128669739e-07, -2.998858690261841e-07, -9.592622518539429e-08, 1.0803341865539551e-07, 3.119930624961853e-07, 5.159527063369751e-07, 7.199123501777649e-07, 9.238719940185547e-07, 1.1278316378593445e-06, 1.3317912817001343e-06, 1.535750925540924e-06, 1.7397105693817139e-06, 1.9436702132225037e-06, 2.1476298570632935e-06, 2.3515895009040833e-06, 2.555549144744873e-06, 2.759508788585663e-06, 2.9634684324264526e-06, 3.1674280762672424e-06, 3.3713877201080322e-06, 3.575347363948822e-06, 3.779307007789612e-06, 3.983266651630402e-06, 4.187226295471191e-06, 4.391185939311981e-06, 4.595145583152771e-06, 4.799105226993561e-06, 5.003064870834351e-06, 5.20702451467514e-06, 5.41098415851593e-06, 5.61494380235672e-06, 5.81890344619751e-06, 6.0228630900382996e-06, 6.226822733879089e-06, 6.430782377719879e-06, 6.634742021560669e-06, 6.838701665401459e-06, 7.0426613092422485e-06, 7.246620953083038e-06, 7.450580596923828e-06]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 9.0, 7.0, 9.0, 15.0, 18.0, 20.0, 17.0, 21.0, 21.0, 712.0, 19.0, 12.0, 16.0, 18.0, 20.0, 18.0, 11.0, 5.0, 5.0, 0.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3966374012852611e-07, -1.359658341471004e-07, -1.3226792816567468e-07, -1.2857003639510367e-07, -1.2487213041367795e-07, -1.2117422443225223e-07, -1.1747631845082651e-07, -1.1377841246940079e-07, -1.1008050648797507e-07, -1.0638260050654935e-07, -1.0268470163055099e-07, -9.898679564912527e-08, -9.528888966769955e-08, -9.159099079170119e-08, -8.789308481027547e-08, -8.419517882884975e-08, -8.049727995285139e-08, -7.679937397142567e-08, -7.31014750954273e-08, -6.940356911400158e-08, -6.570566313257586e-08, -6.200775715115014e-08, -5.830985827515178e-08, -5.461195229372606e-08, -5.091404986501402e-08, -4.721614743630198e-08, -4.351824145487626e-08, -3.982033902616422e-08, -3.612243659745218e-08, -3.242453061602646e-08, -2.8726628187314418e-08, -2.5028723982245538e-08, -2.1330819777176657e-08, -1.7632915572107777e-08, -1.3935012255217316e-08, -1.0237108938326855e-08, -6.539204733257975e-09, -2.8413005281890946e-09, 8.566019005229464e-10, 4.554506105591827e-09, 8.252410310660707e-09, 1.1950314515729588e-08, 1.5648218720798468e-08, 1.934612114951051e-08, 2.304402535457939e-08, 2.674192955964827e-08, 3.043983198836031e-08, 3.413773441707235e-08, 3.783564039849807e-08, 4.153354282721011e-08, 4.523144880863583e-08, 4.8929351237347873e-08, 5.262725721877359e-08, 5.6325159647485634e-08, 6.002306207619768e-08, 6.37209680576234e-08, 6.741886693362176e-08, 7.111677291504748e-08, 7.481467179104584e-08, 7.851257777247156e-08, 8.221048375389728e-08, 8.590838262989564e-08, 8.960628861132136e-08, 9.330419459274708e-08, 9.70021005741728e-08]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 160.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 701.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 140.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 19.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 4.0, 7.0, 5.0, 5.0, 13.0, 8.0, 6.0, 15.0, 17.0, 18.0, 21.0, 15.0, 20.0, 27.0, 31.0, 28.0, 32.0, 34.0, 40.0, 31.0, 43.0, 47.0, 48.0, 50.0, 35.0, 37.0, 43.0, 40.0, 35.0, 27.0, 44.0, 18.0, 23.0, 21.0, 21.0, 25.0, 18.0, 7.0, 14.0, 5.0, 9.0, 4.0, 4.0, 7.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.396484375, -3.292022705078125, -3.18756103515625, -3.083099365234375, -2.9786376953125, -2.874176025390625, -2.76971435546875, -2.665252685546875, -2.560791015625, -2.456329345703125, -2.35186767578125, -2.247406005859375, -2.1429443359375, -2.038482666015625, -1.93402099609375, -1.829559326171875, -1.72509765625, -1.620635986328125, -1.51617431640625, -1.411712646484375, -1.3072509765625, -1.202789306640625, -1.09832763671875, -0.993865966796875, -0.889404296875, -0.784942626953125, -0.68048095703125, -0.576019287109375, -0.4715576171875, -0.367095947265625, -0.26263427734375, -0.158172607421875, -0.0537109375, 0.050750732421875, 0.15521240234375, 0.259674072265625, 0.3641357421875, 0.468597412109375, 0.57305908203125, 0.677520751953125, 0.781982421875, 0.886444091796875, 0.99090576171875, 1.095367431640625, 1.1998291015625, 1.304290771484375, 1.40875244140625, 1.513214111328125, 1.61767578125, 1.722137451171875, 1.82659912109375, 1.931060791015625, 2.0355224609375, 2.139984130859375, 2.24444580078125, 2.348907470703125, 2.453369140625, 2.557830810546875, 2.66229248046875, 2.766754150390625, 2.8712158203125, 2.975677490234375, 3.08013916015625, 3.184600830078125, 3.2890625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 8.0, 11.0, 12.0, 20.0, 31.0, 29.0, 58.0, 73.0, 103.0, 148.0, 212.0, 312.0, 432.0, 678.0, 1140.0, 1780.0, 3288.0, 7013.0, 17314.0, 52078.0, 207796.0, 538560.0, 149254.0, 40761.0, 14192.0, 5894.0, 2844.0, 1595.0, 944.0, 588.0, 423.0, 265.0, 226.0, 137.0, 85.0, 77.0, 43.0, 31.0, 35.0, 14.0, 12.0, 7.0, 10.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.96875, -5.77862548828125, -5.5885009765625, -5.39837646484375, -5.208251953125, -5.01812744140625, -4.8280029296875, -4.63787841796875, -4.44775390625, -4.25762939453125, -4.0675048828125, -3.87738037109375, -3.687255859375, -3.49713134765625, -3.3070068359375, -3.11688232421875, -2.9267578125, -2.73663330078125, -2.5465087890625, -2.35638427734375, -2.166259765625, -1.97613525390625, -1.7860107421875, -1.59588623046875, -1.40576171875, -1.21563720703125, -1.0255126953125, -0.83538818359375, -0.645263671875, -0.45513916015625, -0.2650146484375, -0.07489013671875, 0.115234375, 0.30535888671875, 0.4954833984375, 0.68560791015625, 0.875732421875, 1.06585693359375, 1.2559814453125, 1.44610595703125, 1.63623046875, 1.82635498046875, 2.0164794921875, 2.20660400390625, 2.396728515625, 2.58685302734375, 2.7769775390625, 2.96710205078125, 3.1572265625, 3.34735107421875, 3.5374755859375, 3.72760009765625, 3.917724609375, 4.10784912109375, 4.2979736328125, 4.48809814453125, 4.67822265625, 4.86834716796875, 5.0584716796875, 5.24859619140625, 5.438720703125, 5.62884521484375, 5.8189697265625, 6.00909423828125, 6.19921875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 11.0, 5.0, 3.0, 10.0, 15.0, 11.0, 11.0, 16.0, 23.0, 33.0, 46.0, 32.0, 41.0, 52.0, 58.0, 100.0, 246.0, 1563.0, 269.0, 141.0, 58.0, 50.0, 45.0, 23.0, 32.0, 31.0, 34.0, 19.0, 17.0, 14.0, 14.0, 10.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3984375, -11.0867919921875, -10.775146484375, -10.4635009765625, -10.15185546875, -9.8402099609375, -9.528564453125, -9.2169189453125, -8.9052734375, -8.5936279296875, -8.281982421875, -7.9703369140625, -7.65869140625, -7.3470458984375, -7.035400390625, -6.7237548828125, -6.412109375, -6.1004638671875, -5.788818359375, -5.4771728515625, -5.16552734375, -4.8538818359375, -4.542236328125, -4.2305908203125, -3.9189453125, -3.6072998046875, -3.295654296875, -2.9840087890625, -2.67236328125, -2.3607177734375, -2.049072265625, -1.7374267578125, -1.42578125, -1.1141357421875, -0.802490234375, -0.4908447265625, -0.17919921875, 0.1324462890625, 0.444091796875, 0.7557373046875, 1.0673828125, 1.3790283203125, 1.690673828125, 2.0023193359375, 2.31396484375, 2.6256103515625, 2.937255859375, 3.2489013671875, 3.560546875, 3.8721923828125, 4.183837890625, 4.4954833984375, 4.80712890625, 5.1187744140625, 5.430419921875, 5.7420654296875, 6.0537109375, 6.3653564453125, 6.677001953125, 6.9886474609375, 7.30029296875, 7.6119384765625, 7.923583984375, 8.2352294921875, 8.546875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 4.0, 10.0, 5.0, 4.0, 16.0, 12.0, 13.0, 25.0, 38.0, 40.0, 59.0, 78.0, 120.0, 165.0, 304.0, 508.0, 971.0, 5699.0, 2750349.0, 381818.0, 3302.0, 864.0, 441.0, 231.0, 179.0, 103.0, 86.0, 49.0, 57.0, 30.0, 23.0, 18.0, 19.0, 10.0, 9.0, 9.0, 7.0, 5.0, 4.0, 3.0, 1.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.71875, -19.059326171875, -18.39990234375, -17.740478515625, -17.0810546875, -16.421630859375, -15.76220703125, -15.102783203125, -14.443359375, -13.783935546875, -13.12451171875, -12.465087890625, -11.8056640625, -11.146240234375, -10.48681640625, -9.827392578125, -9.16796875, -8.508544921875, -7.84912109375, -7.189697265625, -6.5302734375, -5.870849609375, -5.21142578125, -4.552001953125, -3.892578125, -3.233154296875, -2.57373046875, -1.914306640625, -1.2548828125, -0.595458984375, 0.06396484375, 0.723388671875, 1.3828125, 2.042236328125, 2.70166015625, 3.361083984375, 4.0205078125, 4.679931640625, 5.33935546875, 5.998779296875, 6.658203125, 7.317626953125, 7.97705078125, 8.636474609375, 9.2958984375, 9.955322265625, 10.61474609375, 11.274169921875, 11.93359375, 12.593017578125, 13.25244140625, 13.911865234375, 14.5712890625, 15.230712890625, 15.89013671875, 16.549560546875, 17.208984375, 17.868408203125, 18.52783203125, 19.187255859375, 19.8466796875, 20.506103515625, 21.16552734375, 21.824951171875, 22.484375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 9.0, 145.0, 646.0, 201.0, 16.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.77757263183594, -66.21517944335938, -62.652793884277344, -59.09040069580078, -55.528011322021484, -51.96562194824219, -48.403228759765625, -44.84083938598633, -41.27845001220703, -37.716060638427734, -34.15367126464844, -30.591278076171875, -27.028888702392578, -23.46649932861328, -19.90410804748535, -16.341716766357422, -12.779327392578125, -9.216937065124512, -5.654546737670898, -2.092156410217285, 1.4702339172363281, 5.032623291015625, 8.595014572143555, 12.157405853271484, 15.719795227050781, 19.282184600830078, 22.844575881958008, 26.406967163085938, 29.969356536865234, 33.53174591064453, 37.094139099121094, 40.65652847290039, 44.21891784667969, 47.781307220458984, 51.34369659423828, 54.906089782714844, 58.46847915649414, 62.03086853027344, 65.59326171875, 69.15565490722656, 72.7180404663086, 76.28043365478516, 79.84281921386719, 83.40521240234375, 86.96760559082031, 90.52999114990234, 94.0923843383789, 97.65476989746094, 101.2171630859375, 104.77955627441406, 108.3419418334961, 111.90433502197266, 115.46672058105469, 119.02911376953125, 122.59150695800781, 126.15390014648438, 129.71627807617188, 133.27867126464844, 136.841064453125, 140.4034423828125, 143.96583557128906, 147.52822875976562, 151.0906219482422, 154.65301513671875, 158.2154083251953]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 5.0, 6.0, 10.0, 7.0, 9.0, 17.0, 18.0, 22.0, 23.0, 28.0, 26.0, 25.0, 36.0, 28.0, 26.0, 43.0, 30.0, 39.0, 37.0, 44.0, 39.0, 45.0, 53.0, 36.0, 29.0, 31.0, 41.0, 25.0, 28.0, 31.0, 25.0, 24.0, 20.0, 18.0, 19.0, 8.0, 12.0, 11.0, 7.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.22344970703125, -20.473140716552734, -19.72283172607422, -18.972524642944336, -18.22221565246582, -17.471906661987305, -16.721599578857422, -15.971290588378906, -15.22098159790039, -14.470672607421875, -13.720364570617676, -12.970056533813477, -12.219747543334961, -11.469438552856445, -10.719130516052246, -9.968822479248047, -9.218513488769531, -8.468204498291016, -7.717896461486816, -6.967587947845459, -6.217279434204102, -5.466970920562744, -4.716662406921387, -3.9663538932800293, -3.216045379638672, -2.4657368659973145, -1.715428352355957, -0.9651198387145996, -0.2148113250732422, 0.5354971885681152, 1.2858057022094727, 2.03611421585083, 2.7864227294921875, 3.536731243133545, 4.287039756774902, 5.03734827041626, 5.787656784057617, 6.537965297698975, 7.288273811340332, 8.038581848144531, 8.788890838623047, 9.539199829101562, 10.289507865905762, 11.039815902709961, 11.790124893188477, 12.540433883666992, 13.290741920471191, 14.04104995727539, 14.791358947753906, 15.541667938232422, 16.291976928710938, 17.04228401184082, 17.792593002319336, 18.54290199279785, 19.293209075927734, 20.04351806640625, 20.793827056884766, 21.54413604736328, 22.294445037841797, 23.04475212097168, 23.795061111450195, 24.54537010192871, 25.295677185058594, 26.04598617553711, 26.796295166015625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 5.0, 5.0, 11.0, 14.0, 12.0, 8.0, 17.0, 16.0, 18.0, 27.0, 21.0, 30.0, 28.0, 25.0, 33.0, 38.0, 48.0, 42.0, 39.0, 37.0, 46.0, 47.0, 51.0, 38.0, 39.0, 31.0, 35.0, 30.0, 35.0, 24.0, 19.0, 24.0, 21.0, 16.0, 9.0, 22.0, 10.0, 7.0, 9.0, 2.0, 3.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.556640625, -3.446624755859375, -3.33660888671875, -3.226593017578125, -3.1165771484375, -3.006561279296875, -2.89654541015625, -2.786529541015625, -2.676513671875, -2.566497802734375, -2.45648193359375, -2.346466064453125, -2.2364501953125, -2.126434326171875, -2.01641845703125, -1.906402587890625, -1.79638671875, -1.686370849609375, -1.57635498046875, -1.466339111328125, -1.3563232421875, -1.246307373046875, -1.13629150390625, -1.026275634765625, -0.916259765625, -0.806243896484375, -0.69622802734375, -0.586212158203125, -0.4761962890625, -0.366180419921875, -0.25616455078125, -0.146148681640625, -0.0361328125, 0.073883056640625, 0.18389892578125, 0.293914794921875, 0.4039306640625, 0.513946533203125, 0.62396240234375, 0.733978271484375, 0.843994140625, 0.954010009765625, 1.06402587890625, 1.174041748046875, 1.2840576171875, 1.394073486328125, 1.50408935546875, 1.614105224609375, 1.72412109375, 1.834136962890625, 1.94415283203125, 2.054168701171875, 2.1641845703125, 2.274200439453125, 2.38421630859375, 2.494232177734375, 2.604248046875, 2.714263916015625, 2.82427978515625, 2.934295654296875, 3.0443115234375, 3.154327392578125, 3.26434326171875, 3.374359130859375, 3.484375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 12.0, 19.0, 8.0, 30.0, 43.0, 50.0, 63.0, 102.0, 155.0, 204.0, 279.0, 434.0, 602.0, 1015.0, 1408.0, 2341.0, 3624.0, 6061.0, 10235.0, 20663.0, 62738.0, 324182.0, 1309965.0, 1762358.0, 527646.0, 101484.0, 26915.0, 12470.0, 6968.0, 4256.0, 2694.0, 1699.0, 1138.0, 776.0, 537.0, 334.0, 236.0, 154.0, 113.0, 81.0, 69.0, 39.0, 20.0, 17.0, 11.0, 8.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-5.01953125, -4.87255859375, -4.7255859375, -4.57861328125, -4.431640625, -4.28466796875, -4.1376953125, -3.99072265625, -3.84375, -3.69677734375, -3.5498046875, -3.40283203125, -3.255859375, -3.10888671875, -2.9619140625, -2.81494140625, -2.66796875, -2.52099609375, -2.3740234375, -2.22705078125, -2.080078125, -1.93310546875, -1.7861328125, -1.63916015625, -1.4921875, -1.34521484375, -1.1982421875, -1.05126953125, -0.904296875, -0.75732421875, -0.6103515625, -0.46337890625, -0.31640625, -0.16943359375, -0.0224609375, 0.12451171875, 0.271484375, 0.41845703125, 0.5654296875, 0.71240234375, 0.859375, 1.00634765625, 1.1533203125, 1.30029296875, 1.447265625, 1.59423828125, 1.7412109375, 1.88818359375, 2.03515625, 2.18212890625, 2.3291015625, 2.47607421875, 2.623046875, 2.77001953125, 2.9169921875, 3.06396484375, 3.2109375, 3.35791015625, 3.5048828125, 3.65185546875, 3.798828125, 3.94580078125, 4.0927734375, 4.23974609375, 4.38671875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 2.0, 6.0, 7.0, 10.0, 21.0, 13.0, 26.0, 44.0, 54.0, 84.0, 90.0, 140.0, 170.0, 200.0, 290.0, 386.0, 436.0, 467.0, 382.0, 303.0, 210.0, 167.0, 133.0, 112.0, 69.0, 59.0, 51.0, 47.0, 27.0, 18.0, 12.0, 4.0, 7.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.32421875, -4.1754150390625, -4.026611328125, -3.8778076171875, -3.72900390625, -3.5802001953125, -3.431396484375, -3.2825927734375, -3.1337890625, -2.9849853515625, -2.836181640625, -2.6873779296875, -2.53857421875, -2.3897705078125, -2.240966796875, -2.0921630859375, -1.943359375, -1.7945556640625, -1.645751953125, -1.4969482421875, -1.34814453125, -1.1993408203125, -1.050537109375, -0.9017333984375, -0.7529296875, -0.6041259765625, -0.455322265625, -0.3065185546875, -0.15771484375, -0.0089111328125, 0.139892578125, 0.2886962890625, 0.4375, 0.5863037109375, 0.735107421875, 0.8839111328125, 1.03271484375, 1.1815185546875, 1.330322265625, 1.4791259765625, 1.6279296875, 1.7767333984375, 1.925537109375, 2.0743408203125, 2.22314453125, 2.3719482421875, 2.520751953125, 2.6695556640625, 2.818359375, 2.9671630859375, 3.115966796875, 3.2647705078125, 3.41357421875, 3.5623779296875, 3.711181640625, 3.8599853515625, 4.0087890625, 4.1575927734375, 4.306396484375, 4.4552001953125, 4.60400390625, 4.7528076171875, 4.901611328125, 5.0504150390625, 5.19921875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 3.0, 11.0, 8.0, 20.0, 19.0, 25.0, 51.0, 69.0, 94.0, 135.0, 227.0, 338.0, 576.0, 1358.0, 3852.0, 17046.0, 196039.0, 3015026.0, 896771.0, 51004.0, 7327.0, 2136.0, 866.0, 462.0, 271.0, 175.0, 109.0, 60.0, 44.0, 51.0, 25.0, 17.0, 17.0, 6.0, 11.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.5, -9.22662353515625, -8.9532470703125, -8.67987060546875, -8.406494140625, -8.13311767578125, -7.8597412109375, -7.58636474609375, -7.31298828125, -7.03961181640625, -6.7662353515625, -6.49285888671875, -6.219482421875, -5.94610595703125, -5.6727294921875, -5.39935302734375, -5.1259765625, -4.85260009765625, -4.5792236328125, -4.30584716796875, -4.032470703125, -3.75909423828125, -3.4857177734375, -3.21234130859375, -2.93896484375, -2.66558837890625, -2.3922119140625, -2.11883544921875, -1.845458984375, -1.57208251953125, -1.2987060546875, -1.02532958984375, -0.751953125, -0.47857666015625, -0.2052001953125, 0.06817626953125, 0.341552734375, 0.61492919921875, 0.8883056640625, 1.16168212890625, 1.43505859375, 1.70843505859375, 1.9818115234375, 2.25518798828125, 2.528564453125, 2.80194091796875, 3.0753173828125, 3.34869384765625, 3.6220703125, 3.89544677734375, 4.1688232421875, 4.44219970703125, 4.715576171875, 4.98895263671875, 5.2623291015625, 5.53570556640625, 5.80908203125, 6.08245849609375, 6.3558349609375, 6.62921142578125, 6.902587890625, 7.17596435546875, 7.4493408203125, 7.72271728515625, 7.99609375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 14.0, 39.0, 89.0, 209.0, 240.0, 221.0, 114.0, 47.0, 27.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-68.41825103759766, -66.94837188720703, -65.47850036621094, -64.00862121582031, -62.53874588012695, -61.068870544433594, -59.59899139404297, -58.12911605834961, -56.65924072265625, -55.18936538696289, -53.71949005126953, -52.249610900878906, -50.77973556518555, -49.30986022949219, -47.83998107910156, -46.3701057434082, -44.900230407714844, -43.430355072021484, -41.960479736328125, -40.4906005859375, -39.02072525024414, -37.55084991455078, -36.080970764160156, -34.6110954284668, -33.14122009277344, -31.671344757080078, -30.201467514038086, -28.731590270996094, -27.261714935302734, -25.791839599609375, -24.321962356567383, -22.85208511352539, -21.382213592529297, -19.912338256835938, -18.442461013793945, -16.972583770751953, -15.502708435058594, -14.032832145690918, -12.562955856323242, -11.093079566955566, -9.62320327758789, -8.153326988220215, -6.683450698852539, -5.213574409484863, -3.7436981201171875, -2.2738218307495117, -0.8039455413818359, 0.6659307479858398, 2.1358070373535156, 3.6056833267211914, 5.075559616088867, 6.545435905456543, 8.015312194824219, 9.485188484191895, 10.95506477355957, 12.424941062927246, 13.894817352294922, 15.364693641662598, 16.834569931030273, 18.304447174072266, 19.774322509765625, 21.244197845458984, 22.714075088500977, 24.18395233154297, 25.653827667236328]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 8.0, 4.0, 6.0, 18.0, 14.0, 19.0, 36.0, 25.0, 27.0, 28.0, 30.0, 48.0, 34.0, 39.0, 30.0, 50.0, 45.0, 42.0, 42.0, 39.0, 42.0, 35.0, 39.0, 39.0, 32.0, 30.0, 27.0, 27.0, 23.0, 21.0, 17.0, 17.0, 18.0, 4.0, 7.0, 8.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.364112854003906, -18.760364532470703, -18.156618118286133, -17.55286979675293, -16.94912338256836, -16.345375061035156, -15.74162769317627, -15.137880325317383, -14.53413200378418, -13.930384635925293, -13.326637268066406, -12.722888946533203, -12.119141578674316, -11.51539421081543, -10.911646842956543, -10.307899475097656, -9.70415210723877, -9.100404739379883, -8.496657371520996, -7.892909526824951, -7.289161682128906, -6.6854143142700195, -6.081666946411133, -5.477919101715088, -4.874171733856201, -4.2704243659973145, -3.6666765213012695, -3.062929153442383, -2.459181547164917, -1.8554339408874512, -1.2516865730285645, -0.6479387283325195, -0.04419136047363281, 0.5595561861991882, 1.1633037328720093, 1.7670512199401855, 2.3707988262176514, 2.974546432495117, 3.578293800354004, 4.182041645050049, 4.7857890129089355, 5.389536380767822, 5.993284225463867, 6.597031593322754, 7.200778961181641, 7.8045268058776855, 8.408273696899414, 9.012022018432617, 9.615769386291504, 10.21951675415039, 10.823264122009277, 11.427011489868164, 12.030759811401367, 12.634507179260254, 13.23825454711914, 13.842002868652344, 14.445749282836914, 15.0494966506958, 15.653244018554688, 16.25699234008789, 16.86073875427246, 17.464487075805664, 18.068233489990234, 18.671981811523438, 19.27573013305664]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 4.0, 2.0, 12.0, 9.0, 17.0, 19.0, 11.0, 22.0, 23.0, 16.0, 28.0, 28.0, 32.0, 28.0, 37.0, 42.0, 29.0, 40.0, 36.0, 52.0, 36.0, 32.0, 45.0, 38.0, 34.0, 29.0, 39.0, 35.0, 20.0, 22.0, 27.0, 19.0, 24.0, 17.0, 19.0, 11.0, 17.0, 8.0, 8.0, 5.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 4.0, 4.0, 1.0], "bins": [-3.029296875, -2.941070556640625, -2.85284423828125, -2.764617919921875, -2.6763916015625, -2.588165283203125, -2.49993896484375, -2.411712646484375, -2.323486328125, -2.235260009765625, -2.14703369140625, -2.058807373046875, -1.9705810546875, -1.882354736328125, -1.79412841796875, -1.705902099609375, -1.61767578125, -1.529449462890625, -1.44122314453125, -1.352996826171875, -1.2647705078125, -1.176544189453125, -1.08831787109375, -1.000091552734375, -0.911865234375, -0.823638916015625, -0.73541259765625, -0.647186279296875, -0.5589599609375, -0.470733642578125, -0.38250732421875, -0.294281005859375, -0.2060546875, -0.117828369140625, -0.02960205078125, 0.058624267578125, 0.1468505859375, 0.235076904296875, 0.32330322265625, 0.411529541015625, 0.499755859375, 0.587982177734375, 0.67620849609375, 0.764434814453125, 0.8526611328125, 0.940887451171875, 1.02911376953125, 1.117340087890625, 1.20556640625, 1.293792724609375, 1.38201904296875, 1.470245361328125, 1.5584716796875, 1.646697998046875, 1.73492431640625, 1.823150634765625, 1.911376953125, 1.999603271484375, 2.08782958984375, 2.176055908203125, 2.2642822265625, 2.352508544921875, 2.44073486328125, 2.528961181640625, 2.6171875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 6.0, 9.0, 11.0, 13.0, 19.0, 33.0, 33.0, 52.0, 80.0, 119.0, 162.0, 226.0, 308.0, 429.0, 642.0, 892.0, 1370.0, 2018.0, 2982.0, 4198.0, 6332.0, 9563.0, 14720.0, 22831.0, 36483.0, 61853.0, 112841.0, 268656.0, 241313.0, 104588.0, 57631.0, 34511.0, 21469.0, 14150.0, 9182.0, 5935.0, 4000.0, 2704.0, 2002.0, 1246.0, 885.0, 580.0, 477.0, 266.0, 213.0, 159.0, 113.0, 82.0, 57.0, 40.0, 31.0, 23.0, 11.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0175933837890625, -0.017024755477905273, -0.016456127166748047, -0.01588749885559082, -0.015318870544433594, -0.014750242233276367, -0.01418161392211914, -0.013612985610961914, -0.013044357299804688, -0.012475728988647461, -0.011907100677490234, -0.011338472366333008, -0.010769844055175781, -0.010201215744018555, -0.009632587432861328, -0.009063959121704102, -0.008495330810546875, -0.007926702499389648, -0.007358074188232422, -0.006789445877075195, -0.006220817565917969, -0.005652189254760742, -0.005083560943603516, -0.004514932632446289, -0.0039463043212890625, -0.003377676010131836, -0.0028090476989746094, -0.002240419387817383, -0.0016717910766601562, -0.0011031627655029297, -0.0005345344543457031, 3.409385681152344e-05, 0.00060272216796875, 0.0011713504791259766, 0.0017399787902832031, 0.0023086071014404297, 0.0028772354125976562, 0.003445863723754883, 0.004014492034912109, 0.004583120346069336, 0.0051517486572265625, 0.005720376968383789, 0.006289005279541016, 0.006857633590698242, 0.007426261901855469, 0.007994890213012695, 0.008563518524169922, 0.009132146835327148, 0.009700775146484375, 0.010269403457641602, 0.010838031768798828, 0.011406660079956055, 0.011975288391113281, 0.012543916702270508, 0.013112545013427734, 0.013681173324584961, 0.014249801635742188, 0.014818429946899414, 0.01538705825805664, 0.015955686569213867, 0.016524314880371094, 0.01709294319152832, 0.017661571502685547, 0.018230199813842773, 0.018798828125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 5.0, 13.0, 8.0, 14.0, 15.0, 16.0, 15.0, 39.0, 35.0, 24.0, 29.0, 33.0, 25.0, 37.0, 40.0, 47.0, 36.0, 40.0, 1063.0, 46.0, 32.0, 39.0, 38.0, 39.0, 30.0, 29.0, 33.0, 29.0, 25.0, 20.0, 23.0, 22.0, 17.0, 7.0, 15.0, 9.0, 10.0, 6.0, 4.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.12890625, -2.06378173828125, -1.9986572265625, -1.93353271484375, -1.868408203125, -1.80328369140625, -1.7381591796875, -1.67303466796875, -1.60791015625, -1.54278564453125, -1.4776611328125, -1.41253662109375, -1.347412109375, -1.28228759765625, -1.2171630859375, -1.15203857421875, -1.0869140625, -1.02178955078125, -0.9566650390625, -0.89154052734375, -0.826416015625, -0.76129150390625, -0.6961669921875, -0.63104248046875, -0.56591796875, -0.50079345703125, -0.4356689453125, -0.37054443359375, -0.305419921875, -0.24029541015625, -0.1751708984375, -0.11004638671875, -0.044921875, 0.02020263671875, 0.0853271484375, 0.15045166015625, 0.215576171875, 0.28070068359375, 0.3458251953125, 0.41094970703125, 0.47607421875, 0.54119873046875, 0.6063232421875, 0.67144775390625, 0.736572265625, 0.80169677734375, 0.8668212890625, 0.93194580078125, 0.9970703125, 1.06219482421875, 1.1273193359375, 1.19244384765625, 1.257568359375, 1.32269287109375, 1.3878173828125, 1.45294189453125, 1.51806640625, 1.58319091796875, 1.6483154296875, 1.71343994140625, 1.778564453125, 1.84368896484375, 1.9088134765625, 1.97393798828125, 2.0390625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 3.0, 9.0, 11.0, 18.0, 32.0, 36.0, 53.0, 71.0, 132.0, 161.0, 261.0, 370.0, 599.0, 872.0, 1283.0, 2029.0, 3183.0, 4787.0, 7816.0, 11923.0, 19465.0, 31159.0, 50667.0, 84919.0, 171766.0, 1351274.0, 150326.0, 78786.0, 46948.0, 28839.0, 17881.0, 11363.0, 7018.0, 4582.0, 2882.0, 1858.0, 1284.0, 785.0, 534.0, 384.0, 234.0, 156.0, 101.0, 92.0, 63.0, 39.0, 30.0, 22.0, 11.0, 5.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.012054443359375, -0.011670827865600586, -0.011287212371826172, -0.010903596878051758, -0.010519981384277344, -0.01013636589050293, -0.009752750396728516, -0.009369134902954102, -0.008985519409179688, -0.008601903915405273, -0.00821828842163086, -0.007834672927856445, -0.007451057434082031, -0.007067441940307617, -0.006683826446533203, -0.006300210952758789, -0.005916595458984375, -0.005532979965209961, -0.005149364471435547, -0.004765748977661133, -0.004382133483886719, -0.003998517990112305, -0.0036149024963378906, -0.0032312870025634766, -0.0028476715087890625, -0.0024640560150146484, -0.0020804405212402344, -0.0016968250274658203, -0.0013132095336914062, -0.0009295940399169922, -0.0005459785461425781, -0.00016236305236816406, 0.00022125244140625, 0.0006048679351806641, 0.0009884834289550781, 0.0013720989227294922, 0.0017557144165039062, 0.0021393299102783203, 0.0025229454040527344, 0.0029065608978271484, 0.0032901763916015625, 0.0036737918853759766, 0.004057407379150391, 0.004441022872924805, 0.004824638366699219, 0.005208253860473633, 0.005591869354248047, 0.005975484848022461, 0.006359100341796875, 0.006742715835571289, 0.007126331329345703, 0.007509946823120117, 0.007893562316894531, 0.008277177810668945, 0.00866079330444336, 0.009044408798217773, 0.009428024291992188, 0.009811639785766602, 0.010195255279541016, 0.01057887077331543, 0.010962486267089844, 0.011346101760864258, 0.011729717254638672, 0.012113332748413086, 0.0124969482421875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.0, 0.0, 0.0, 0.0, 0.0, 0.0, 166.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 528.0, 0.0, 0.0, 0.0, 0.0, 0.0, 178.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.980232238769531e-07, -2.8870999813079834e-07, -2.7939677238464355e-07, -2.7008354663848877e-07, -2.60770320892334e-07, -2.514570951461792e-07, -2.421438694000244e-07, -2.3283064365386963e-07, -2.2351741790771484e-07, -2.1420419216156006e-07, -2.0489096641540527e-07, -1.955777406692505e-07, -1.862645149230957e-07, -1.7695128917694092e-07, -1.6763806343078613e-07, -1.5832483768463135e-07, -1.4901161193847656e-07, -1.3969838619232178e-07, -1.30385160446167e-07, -1.210719347000122e-07, -1.1175870895385742e-07, -1.0244548320770264e-07, -9.313225746154785e-08, -8.381903171539307e-08, -7.450580596923828e-08, -6.51925802230835e-08, -5.587935447692871e-08, -4.6566128730773926e-08, -3.725290298461914e-08, -2.7939677238464355e-08, -1.862645149230957e-08, -9.313225746154785e-09, 0.0, 9.313225746154785e-09, 1.862645149230957e-08, 2.7939677238464355e-08, 3.725290298461914e-08, 4.6566128730773926e-08, 5.587935447692871e-08, 6.51925802230835e-08, 7.450580596923828e-08, 8.381903171539307e-08, 9.313225746154785e-08, 1.0244548320770264e-07, 1.1175870895385742e-07, 1.210719347000122e-07, 1.30385160446167e-07, 1.3969838619232178e-07, 1.4901161193847656e-07, 1.5832483768463135e-07, 1.6763806343078613e-07, 1.7695128917694092e-07, 1.862645149230957e-07, 1.955777406692505e-07, 2.0489096641540527e-07, 2.1420419216156006e-07, 2.2351741790771484e-07, 2.3283064365386963e-07, 2.421438694000244e-07, 2.514570951461792e-07, 2.60770320892334e-07, 2.7008354663848877e-07, 2.7939677238464355e-07, 2.8870999813079834e-07, 2.980232238769531e-07]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 4.0, 4.0, 9.0, 6.0, 6.0, 22.0, 29.0, 40.0, 19.0, 7.0, 40.0, 92.0, 201.0, 182.0, 47.0, 411.0, 640.0, 123459.0, 920055.0, 2043.0, 446.0, 107.0, 90.0, 240.0, 114.0, 58.0, 7.0, 13.0, 36.0, 20.0, 18.0, 15.0, 7.0, 8.0, 8.0, 4.0, 7.0, 9.0, 5.0, 6.0, 1.0, 0.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7220458984375e-06, -5.544163286685944e-06, -5.366280674934387e-06, -5.188398063182831e-06, -5.010515451431274e-06, -4.832632839679718e-06, -4.654750227928162e-06, -4.476867616176605e-06, -4.298985004425049e-06, -4.1211023926734924e-06, -3.943219780921936e-06, -3.7653371691703796e-06, -3.5874545574188232e-06, -3.409571945667267e-06, -3.2316893339157104e-06, -3.053806722164154e-06, -2.8759241104125977e-06, -2.6980414986610413e-06, -2.520158886909485e-06, -2.3422762751579285e-06, -2.164393663406372e-06, -1.9865110516548157e-06, -1.8086284399032593e-06, -1.6307458281517029e-06, -1.4528632164001465e-06, -1.27498060464859e-06, -1.0970979928970337e-06, -9.192153811454773e-07, -7.413327693939209e-07, -5.634501576423645e-07, -3.855675458908081e-07, -2.076849341392517e-07, -2.9802322387695312e-08, 1.4808028936386108e-07, 3.259629011154175e-07, 5.038455128669739e-07, 6.817281246185303e-07, 8.596107363700867e-07, 1.037493348121643e-06, 1.2153759598731995e-06, 1.3932585716247559e-06, 1.5711411833763123e-06, 1.7490237951278687e-06, 1.926906406879425e-06, 2.1047890186309814e-06, 2.282671630382538e-06, 2.4605542421340942e-06, 2.6384368538856506e-06, 2.816319465637207e-06, 2.9942020773887634e-06, 3.17208468914032e-06, 3.3499673008918762e-06, 3.5278499126434326e-06, 3.705732524394989e-06, 3.883615136146545e-06, 4.061497747898102e-06, 4.239380359649658e-06, 4.417262971401215e-06, 4.595145583152771e-06, 4.773028194904327e-06, 4.950910806655884e-06, 5.12879341840744e-06, 5.306676030158997e-06, 5.484558641910553e-06, 5.662441253662109e-06]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 3.0, 5.0, 4.0, 7.0, 7.0, 9.0, 6.0, 7.0, 4.0, 4.0, 9.0, 5.0, 864.0, 7.0, 7.0, 9.0, 10.0, 2.0, 4.0, 3.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.1453262516170071e-07, -1.1141437994410808e-07, -1.0829613472651545e-07, -1.0517788950892282e-07, -1.0205964429133019e-07, -9.894139907373756e-08, -9.582315385614493e-08, -9.27049086385523e-08, -8.958666342095967e-08, -8.646841820336704e-08, -8.335017298577441e-08, -8.023192776818178e-08, -7.711368255058915e-08, -7.399543733299652e-08, -7.087719211540389e-08, -6.775894689781126e-08, -6.464070878564598e-08, -6.152246356805335e-08, -5.8404218350460724e-08, -5.5285973132868094e-08, -5.2167727915275464e-08, -4.9049482697682834e-08, -4.593124103280388e-08, -4.281299581521125e-08, -3.969475059761862e-08, -3.657650538002599e-08, -3.345826016243336e-08, -3.034001849755441e-08, -2.722177150360494e-08, -2.410352628601231e-08, -2.098528284477652e-08, -1.786703762718389e-08, -1.4748785304163903e-08, -1.1630540086571273e-08, -8.512295757157062e-09, -5.394051427742852e-09, -2.275806210150222e-09, 8.424390074424082e-10, 3.960682448678199e-09, 7.078927666270829e-09, 1.0197172883863459e-08, 1.3315418101456089e-08, 1.643366331904872e-08, 1.955190676028451e-08, 2.267015197787714e-08, 2.578839719546977e-08, 2.890664063670556e-08, 3.202488585429819e-08, 3.514313107189082e-08, 3.826137628948345e-08, 4.137962150707608e-08, 4.449786672466871e-08, 4.761611194226134e-08, 5.073435715985397e-08, 5.385259882473292e-08, 5.697084404232555e-08, 6.008909281263186e-08, 6.320733803022449e-08, 6.632558324781712e-08, 6.944382846540975e-08, 7.256207368300238e-08, 7.568031890059501e-08, 7.879856411818764e-08, 8.191680933578027e-08, 8.503504744794554e-08]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 861.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 4.0, 2.0, 12.0, 9.0, 17.0, 19.0, 11.0, 22.0, 23.0, 16.0, 28.0, 28.0, 32.0, 28.0, 37.0, 42.0, 29.0, 40.0, 36.0, 52.0, 36.0, 32.0, 45.0, 38.0, 34.0, 29.0, 39.0, 35.0, 20.0, 22.0, 27.0, 19.0, 24.0, 17.0, 19.0, 11.0, 17.0, 8.0, 8.0, 5.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 4.0, 4.0, 1.0], "bins": [-3.029296875, -2.941070556640625, -2.85284423828125, -2.764617919921875, -2.6763916015625, -2.588165283203125, -2.49993896484375, -2.411712646484375, -2.323486328125, -2.235260009765625, -2.14703369140625, -2.058807373046875, -1.9705810546875, -1.882354736328125, -1.79412841796875, -1.705902099609375, -1.61767578125, -1.529449462890625, -1.44122314453125, -1.352996826171875, -1.2647705078125, -1.176544189453125, -1.08831787109375, -1.000091552734375, -0.911865234375, -0.823638916015625, -0.73541259765625, -0.647186279296875, -0.5589599609375, -0.470733642578125, -0.38250732421875, -0.294281005859375, -0.2060546875, -0.117828369140625, -0.02960205078125, 0.058624267578125, 0.1468505859375, 0.235076904296875, 0.32330322265625, 0.411529541015625, 0.499755859375, 0.587982177734375, 0.67620849609375, 0.764434814453125, 0.8526611328125, 0.940887451171875, 1.02911376953125, 1.117340087890625, 1.20556640625, 1.293792724609375, 1.38201904296875, 1.470245361328125, 1.5584716796875, 1.646697998046875, 1.73492431640625, 1.823150634765625, 1.911376953125, 1.999603271484375, 2.08782958984375, 2.176055908203125, 2.2642822265625, 2.352508544921875, 2.44073486328125, 2.528961181640625, 2.6171875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 5.0, 12.0, 8.0, 11.0, 20.0, 19.0, 24.0, 37.0, 37.0, 51.0, 84.0, 121.0, 149.0, 231.0, 351.0, 605.0, 1070.0, 2217.0, 5289.0, 16021.0, 66148.0, 328596.0, 474613.0, 114100.0, 24934.0, 7513.0, 2866.0, 1409.0, 724.0, 378.0, 251.0, 163.0, 117.0, 76.0, 62.0, 38.0, 43.0, 32.0, 27.0, 18.0, 13.0, 17.0, 16.0, 7.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0], "bins": [-4.55078125, -4.41357421875, -4.2763671875, -4.13916015625, -4.001953125, -3.86474609375, -3.7275390625, -3.59033203125, -3.453125, -3.31591796875, -3.1787109375, -3.04150390625, -2.904296875, -2.76708984375, -2.6298828125, -2.49267578125, -2.35546875, -2.21826171875, -2.0810546875, -1.94384765625, -1.806640625, -1.66943359375, -1.5322265625, -1.39501953125, -1.2578125, -1.12060546875, -0.9833984375, -0.84619140625, -0.708984375, -0.57177734375, -0.4345703125, -0.29736328125, -0.16015625, -0.02294921875, 0.1142578125, 0.25146484375, 0.388671875, 0.52587890625, 0.6630859375, 0.80029296875, 0.9375, 1.07470703125, 1.2119140625, 1.34912109375, 1.486328125, 1.62353515625, 1.7607421875, 1.89794921875, 2.03515625, 2.17236328125, 2.3095703125, 2.44677734375, 2.583984375, 2.72119140625, 2.8583984375, 2.99560546875, 3.1328125, 3.27001953125, 3.4072265625, 3.54443359375, 3.681640625, 3.81884765625, 3.9560546875, 4.09326171875, 4.23046875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 3.0, 9.0, 18.0, 19.0, 19.0, 21.0, 31.0, 30.0, 49.0, 56.0, 62.0, 56.0, 126.0, 389.0, 1583.0, 168.0, 80.0, 67.0, 49.0, 49.0, 40.0, 32.0, 28.0, 15.0, 11.0, 18.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7109375, -7.392333984375, -7.07373046875, -6.755126953125, -6.4365234375, -6.117919921875, -5.79931640625, -5.480712890625, -5.162109375, -4.843505859375, -4.52490234375, -4.206298828125, -3.8876953125, -3.569091796875, -3.25048828125, -2.931884765625, -2.61328125, -2.294677734375, -1.97607421875, -1.657470703125, -1.3388671875, -1.020263671875, -0.70166015625, -0.383056640625, -0.064453125, 0.254150390625, 0.57275390625, 0.891357421875, 1.2099609375, 1.528564453125, 1.84716796875, 2.165771484375, 2.484375, 2.802978515625, 3.12158203125, 3.440185546875, 3.7587890625, 4.077392578125, 4.39599609375, 4.714599609375, 5.033203125, 5.351806640625, 5.67041015625, 5.989013671875, 6.3076171875, 6.626220703125, 6.94482421875, 7.263427734375, 7.58203125, 7.900634765625, 8.21923828125, 8.537841796875, 8.8564453125, 9.175048828125, 9.49365234375, 9.812255859375, 10.130859375, 10.449462890625, 10.76806640625, 11.086669921875, 11.4052734375, 11.723876953125, 12.04248046875, 12.361083984375, 12.6796875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 6.0, 6.0, 13.0, 12.0, 15.0, 17.0, 54.0, 68.0, 126.0, 219.0, 393.0, 1004.0, 32904.0, 3106531.0, 2945.0, 642.0, 311.0, 154.0, 100.0, 57.0, 28.0, 21.0, 18.0, 11.0, 12.0, 17.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-30.0625, -29.297119140625, -28.53173828125, -27.766357421875, -27.0009765625, -26.235595703125, -25.47021484375, -24.704833984375, -23.939453125, -23.174072265625, -22.40869140625, -21.643310546875, -20.8779296875, -20.112548828125, -19.34716796875, -18.581787109375, -17.81640625, -17.051025390625, -16.28564453125, -15.520263671875, -14.7548828125, -13.989501953125, -13.22412109375, -12.458740234375, -11.693359375, -10.927978515625, -10.16259765625, -9.397216796875, -8.6318359375, -7.866455078125, -7.10107421875, -6.335693359375, -5.5703125, -4.804931640625, -4.03955078125, -3.274169921875, -2.5087890625, -1.743408203125, -0.97802734375, -0.212646484375, 0.552734375, 1.318115234375, 2.08349609375, 2.848876953125, 3.6142578125, 4.379638671875, 5.14501953125, 5.910400390625, 6.67578125, 7.441162109375, 8.20654296875, 8.971923828125, 9.7373046875, 10.502685546875, 11.26806640625, 12.033447265625, 12.798828125, 13.564208984375, 14.32958984375, 15.094970703125, 15.8603515625, 16.625732421875, 17.39111328125, 18.156494140625, 18.921875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 31.0, 436.0, 487.0, 57.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.99073314666748, -6.779177188873291, -4.567621231079102, -2.356065273284912, -0.14450931549072266, 2.0670461654663086, 4.278602600097656, 6.490159034729004, 8.701714515686035, 10.913270950317383, 13.124826431274414, 15.336381912231445, 17.54793930053711, 19.75949478149414, 21.971050262451172, 24.182605743408203, 26.394161224365234, 28.605716705322266, 30.817272186279297, 33.02882766723633, 35.240386962890625, 37.451942443847656, 39.66349792480469, 41.87505340576172, 44.08660888671875, 46.29816436767578, 48.50971984863281, 50.721275329589844, 52.932830810546875, 55.144386291503906, 57.3559455871582, 59.567501068115234, 61.779052734375, 63.99060821533203, 66.20216369628906, 68.4137191772461, 70.62527465820312, 72.83683013916016, 75.04838562011719, 77.25994873046875, 79.47149658203125, 81.68305206298828, 83.89460754394531, 86.10616302490234, 88.31771850585938, 90.5292739868164, 92.74082946777344, 94.952392578125, 97.16394805908203, 99.37550354003906, 101.5870590209961, 103.79861450195312, 106.01016998291016, 108.22172546386719, 110.43328094482422, 112.64483642578125, 114.85639953613281, 117.06795501708984, 119.27951049804688, 121.4910659790039, 123.70262145996094, 125.91417694091797, 128.125732421875, 130.33729553222656, 132.54884338378906]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 3.0, 4.0, 5.0, 6.0, 3.0, 10.0, 14.0, 15.0, 16.0, 12.0, 18.0, 15.0, 20.0, 26.0, 29.0, 40.0, 28.0, 30.0, 27.0, 34.0, 37.0, 45.0, 36.0, 39.0, 43.0, 23.0, 31.0, 36.0, 41.0, 28.0, 39.0, 29.0, 26.0, 25.0, 29.0, 18.0, 18.0, 17.0, 17.0, 16.0, 16.0, 13.0, 6.0, 6.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-15.852767944335938, -15.32209587097168, -14.791422843933105, -14.260750770568848, -13.73007869720459, -13.199405670166016, -12.668733596801758, -12.1380615234375, -11.607389450073242, -11.076717376708984, -10.54604434967041, -10.015372276306152, -9.484700202941895, -8.95402717590332, -8.423355102539062, -7.892683029174805, -7.3620100021362305, -6.8313374519348145, -6.300665378570557, -5.769992828369141, -5.239320755004883, -4.708648204803467, -4.177975654602051, -3.647303342819214, -3.116631031036377, -2.58595871925354, -2.055286407470703, -1.524613857269287, -0.9939415454864502, -0.4632692337036133, 0.06740331649780273, 0.5980756282806396, 1.1287479400634766, 1.6594202518463135, 2.1900925636291504, 2.7207651138305664, 3.2514374256134033, 3.7821097373962402, 4.312782287597656, 4.843454360961914, 5.37412691116333, 5.904799461364746, 6.435471534729004, 6.96614408493042, 7.496816635131836, 8.027488708496094, 8.558160781860352, 9.088833808898926, 9.619505882263184, 10.150177955627441, 10.680850982666016, 11.211523056030273, 11.742195129394531, 12.272867202758789, 12.803540229797363, 13.334212303161621, 13.864885330200195, 14.395557403564453, 14.926230430603027, 15.456902503967285, 15.987574577331543, 16.518247604370117, 17.048919677734375, 17.579591751098633, 18.11026382446289]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 6.0, 3.0, 8.0, 13.0, 2.0, 13.0, 11.0, 10.0, 18.0, 20.0, 25.0, 31.0, 33.0, 30.0, 26.0, 45.0, 31.0, 42.0, 37.0, 33.0, 43.0, 36.0, 48.0, 35.0, 39.0, 35.0, 52.0, 33.0, 27.0, 20.0, 28.0, 26.0, 17.0, 23.0, 13.0, 17.0, 20.0, 11.0, 9.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.12109375, -3.0208740234375, -2.920654296875, -2.8204345703125, -2.72021484375, -2.6199951171875, -2.519775390625, -2.4195556640625, -2.3193359375, -2.2191162109375, -2.118896484375, -2.0186767578125, -1.91845703125, -1.8182373046875, -1.718017578125, -1.6177978515625, -1.517578125, -1.4173583984375, -1.317138671875, -1.2169189453125, -1.11669921875, -1.0164794921875, -0.916259765625, -0.8160400390625, -0.7158203125, -0.6156005859375, -0.515380859375, -0.4151611328125, -0.31494140625, -0.2147216796875, -0.114501953125, -0.0142822265625, 0.0859375, 0.1861572265625, 0.286376953125, 0.3865966796875, 0.48681640625, 0.5870361328125, 0.687255859375, 0.7874755859375, 0.8876953125, 0.9879150390625, 1.088134765625, 1.1883544921875, 1.28857421875, 1.3887939453125, 1.489013671875, 1.5892333984375, 1.689453125, 1.7896728515625, 1.889892578125, 1.9901123046875, 2.09033203125, 2.1905517578125, 2.290771484375, 2.3909912109375, 2.4912109375, 2.5914306640625, 2.691650390625, 2.7918701171875, 2.89208984375, 2.9923095703125, 3.092529296875, 3.1927490234375, 3.29296875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 6.0, 11.0, 15.0, 17.0, 26.0, 27.0, 43.0, 51.0, 62.0, 88.0, 100.0, 164.0, 184.0, 237.0, 329.0, 480.0, 685.0, 1162.0, 2996.0, 14661.0, 156810.0, 2905548.0, 1047370.0, 51463.0, 6827.0, 1808.0, 871.0, 587.0, 381.0, 295.0, 250.0, 167.0, 135.0, 91.0, 67.0, 67.0, 49.0, 32.0, 31.0, 18.0, 22.0, 14.0, 9.0, 7.0, 3.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.765625, -15.2696533203125, -14.773681640625, -14.2777099609375, -13.78173828125, -13.2857666015625, -12.789794921875, -12.2938232421875, -11.7978515625, -11.3018798828125, -10.805908203125, -10.3099365234375, -9.81396484375, -9.3179931640625, -8.822021484375, -8.3260498046875, -7.830078125, -7.3341064453125, -6.838134765625, -6.3421630859375, -5.84619140625, -5.3502197265625, -4.854248046875, -4.3582763671875, -3.8623046875, -3.3663330078125, -2.870361328125, -2.3743896484375, -1.87841796875, -1.3824462890625, -0.886474609375, -0.3905029296875, 0.10546875, 0.6014404296875, 1.097412109375, 1.5933837890625, 2.08935546875, 2.5853271484375, 3.081298828125, 3.5772705078125, 4.0732421875, 4.5692138671875, 5.065185546875, 5.5611572265625, 6.05712890625, 6.5531005859375, 7.049072265625, 7.5450439453125, 8.041015625, 8.5369873046875, 9.032958984375, 9.5289306640625, 10.02490234375, 10.5208740234375, 11.016845703125, 11.5128173828125, 12.0087890625, 12.5047607421875, 13.000732421875, 13.4967041015625, 13.99267578125, 14.4886474609375, 14.984619140625, 15.4805908203125, 15.9765625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 8.0, 8.0, 27.0, 39.0, 52.0, 72.0, 100.0, 148.0, 217.0, 280.0, 425.0, 529.0, 618.0, 463.0, 356.0, 215.0, 160.0, 113.0, 78.0, 51.0, 38.0, 19.0, 21.0, 7.0, 13.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.296875, -6.0355224609375, -5.774169921875, -5.5128173828125, -5.25146484375, -4.9901123046875, -4.728759765625, -4.4674072265625, -4.2060546875, -3.9447021484375, -3.683349609375, -3.4219970703125, -3.16064453125, -2.8992919921875, -2.637939453125, -2.3765869140625, -2.115234375, -1.8538818359375, -1.592529296875, -1.3311767578125, -1.06982421875, -0.8084716796875, -0.547119140625, -0.2857666015625, -0.0244140625, 0.2369384765625, 0.498291015625, 0.7596435546875, 1.02099609375, 1.2823486328125, 1.543701171875, 1.8050537109375, 2.06640625, 2.3277587890625, 2.589111328125, 2.8504638671875, 3.11181640625, 3.3731689453125, 3.634521484375, 3.8958740234375, 4.1572265625, 4.4185791015625, 4.679931640625, 4.9412841796875, 5.20263671875, 5.4639892578125, 5.725341796875, 5.9866943359375, 6.248046875, 6.5093994140625, 6.770751953125, 7.0321044921875, 7.29345703125, 7.5548095703125, 7.816162109375, 8.0775146484375, 8.3388671875, 8.6002197265625, 8.861572265625, 9.1229248046875, 9.38427734375, 9.6456298828125, 9.906982421875, 10.1683349609375, 10.4296875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 8.0, 12.0, 20.0, 25.0, 26.0, 45.0, 40.0, 51.0, 109.0, 157.0, 315.0, 592.0, 1681.0, 6035.0, 31417.0, 239177.0, 2276049.0, 1463771.0, 146692.0, 21119.0, 4436.0, 1252.0, 487.0, 240.0, 142.0, 115.0, 65.0, 55.0, 35.0, 33.0, 22.0, 14.0, 13.0, 9.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.190673828125, -7.89697265625, -7.603271484375, -7.3095703125, -7.015869140625, -6.72216796875, -6.428466796875, -6.134765625, -5.841064453125, -5.54736328125, -5.253662109375, -4.9599609375, -4.666259765625, -4.37255859375, -4.078857421875, -3.78515625, -3.491455078125, -3.19775390625, -2.904052734375, -2.6103515625, -2.316650390625, -2.02294921875, -1.729248046875, -1.435546875, -1.141845703125, -0.84814453125, -0.554443359375, -0.2607421875, 0.032958984375, 0.32666015625, 0.620361328125, 0.9140625, 1.207763671875, 1.50146484375, 1.795166015625, 2.0888671875, 2.382568359375, 2.67626953125, 2.969970703125, 3.263671875, 3.557373046875, 3.85107421875, 4.144775390625, 4.4384765625, 4.732177734375, 5.02587890625, 5.319580078125, 5.61328125, 5.906982421875, 6.20068359375, 6.494384765625, 6.7880859375, 7.081787109375, 7.37548828125, 7.669189453125, 7.962890625, 8.256591796875, 8.55029296875, 8.843994140625, 9.1376953125, 9.431396484375, 9.72509765625, 10.018798828125, 10.3125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 8.0, 17.0, 19.0, 29.0, 29.0, 43.0, 49.0, 73.0, 65.0, 46.0, 88.0, 79.0, 71.0, 66.0, 61.0, 57.0, 53.0, 30.0, 29.0, 21.0, 21.0, 6.0, 5.0, 4.0, 3.0, 6.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.623638153076172, -30.243188858032227, -28.86273956298828, -27.48229217529297, -26.101842880249023, -24.721393585205078, -23.340946197509766, -21.96049690246582, -20.580047607421875, -19.19959831237793, -17.819149017333984, -16.438701629638672, -15.058252334594727, -13.677803039550781, -12.297354698181152, -10.916906356811523, -9.536457061767578, -8.156007766723633, -6.775559425354004, -5.395110607147217, -4.01466178894043, -2.6342129707336426, -1.2537641525268555, 0.12668418884277344, 1.5071334838867188, 2.887582302093506, 4.268031120300293, 5.64847993850708, 7.028928756713867, 8.409378051757812, 9.789826393127441, 11.17027473449707, 12.550724029541016, 13.931173324584961, 15.31162166595459, 16.69207000732422, 18.072519302368164, 19.45296859741211, 20.833415985107422, 22.213865280151367, 23.594314575195312, 24.974763870239258, 26.355213165283203, 27.735660552978516, 29.11610984802246, 30.496559143066406, 31.87700653076172, 33.25745391845703, 34.63790512084961, 36.01835250854492, 37.3988037109375, 38.77925109863281, 40.159698486328125, 41.5401496887207, 42.920597076416016, 44.301048278808594, 45.681495666503906, 47.06194305419922, 48.4423942565918, 49.82284164428711, 51.20329284667969, 52.583740234375, 53.96418762207031, 55.344635009765625, 56.7250862121582]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 7.0, 8.0, 11.0, 13.0, 14.0, 7.0, 13.0, 16.0, 18.0, 17.0, 23.0, 29.0, 28.0, 29.0, 43.0, 44.0, 46.0, 44.0, 37.0, 43.0, 42.0, 38.0, 36.0, 35.0, 42.0, 39.0, 29.0, 34.0, 26.0, 27.0, 23.0, 16.0, 17.0, 15.0, 10.0, 12.0, 11.0, 16.0, 14.0, 8.0, 5.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-30.3070011138916, -29.419960021972656, -28.53291893005371, -27.645877838134766, -26.75883674621582, -25.871795654296875, -24.984756469726562, -24.097713470458984, -23.210674285888672, -22.323633193969727, -21.43659210205078, -20.549551010131836, -19.66250991821289, -18.775468826293945, -17.888427734375, -17.001388549804688, -16.11434555053711, -15.227304458618164, -14.340263366699219, -13.453222274780273, -12.566181182861328, -11.679140090942383, -10.792099952697754, -9.905058860778809, -9.018017768859863, -8.130976676940918, -7.243935585021973, -6.3568949699401855, -5.46985387802124, -4.582812786102295, -3.695772171020508, -2.8087310791015625, -1.9216880798339844, -1.0346471071243286, -0.14760613441467285, 0.7394347190856934, 1.6264758110046387, 2.513516902923584, 3.400557518005371, 4.287598609924316, 5.174639701843262, 6.061680793762207, 6.948721885681152, 7.8357625007629395, 8.722803115844727, 9.609844207763672, 10.496885299682617, 11.383926391601562, 12.270967483520508, 13.158008575439453, 14.045049667358398, 14.932090759277344, 15.819131851196289, 16.706172943115234, 17.593212127685547, 18.480255126953125, 19.367294311523438, 20.254335403442383, 21.141376495361328, 22.028417587280273, 22.91545867919922, 23.802499771118164, 24.68954086303711, 25.576580047607422, 26.463623046875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 9.0, 11.0, 10.0, 15.0, 14.0, 13.0, 11.0, 19.0, 20.0, 23.0, 34.0, 37.0, 34.0, 51.0, 43.0, 48.0, 37.0, 49.0, 45.0, 46.0, 45.0, 43.0, 45.0, 35.0, 30.0, 29.0, 25.0, 25.0, 18.0, 23.0, 14.0, 11.0, 16.0, 13.0, 11.0, 9.0, 12.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-60.21875, -58.46728515625, -56.7158203125, -54.96435546875, -53.212890625, -51.46142578125, -49.7099609375, -47.95849609375, -46.20703125, -44.45556640625, -42.7041015625, -40.95263671875, -39.201171875, -37.44970703125, -35.6982421875, -33.94677734375, -32.1953125, -30.44384765625, -28.6923828125, -26.94091796875, -25.189453125, -23.43798828125, -21.6865234375, -19.93505859375, -18.18359375, -16.43212890625, -14.6806640625, -12.92919921875, -11.177734375, -9.42626953125, -7.6748046875, -5.92333984375, -4.171875, -2.42041015625, -0.6689453125, 1.08251953125, 2.833984375, 4.58544921875, 6.3369140625, 8.08837890625, 9.83984375, 11.59130859375, 13.3427734375, 15.09423828125, 16.845703125, 18.59716796875, 20.3486328125, 22.10009765625, 23.8515625, 25.60302734375, 27.3544921875, 29.10595703125, 30.857421875, 32.60888671875, 34.3603515625, 36.11181640625, 37.86328125, 39.61474609375, 41.3662109375, 43.11767578125, 44.869140625, 46.62060546875, 48.3720703125, 50.12353515625, 51.875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 12.0, 6.0, 13.0, 15.0, 18.0, 31.0, 55.0, 105.0, 153.0, 209.0, 280.0, 474.0, 685.0, 1058.0, 1589.0, 2379.0, 3564.0, 5329.0, 7980.0, 12144.0, 18246.0, 28914.0, 47594.0, 84932.0, 185914.0, 337393.0, 132043.0, 67286.0, 39374.0, 24134.0, 15655.0, 10247.0, 6907.0, 4601.0, 3135.0, 2008.0, 1347.0, 906.0, 620.0, 420.0, 265.0, 172.0, 111.0, 69.0, 52.0, 46.0, 31.0, 17.0, 8.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.418212890625, -0.4056587219238281, -0.39310455322265625, -0.3805503845214844, -0.3679962158203125, -0.3554420471191406, -0.34288787841796875, -0.3303337097167969, -0.317779541015625, -0.3052253723144531, -0.29267120361328125, -0.2801170349121094, -0.2675628662109375, -0.2550086975097656, -0.24245452880859375, -0.22990036010742188, -0.21734619140625, -0.20479202270507812, -0.19223785400390625, -0.17968368530273438, -0.1671295166015625, -0.15457534790039062, -0.14202117919921875, -0.12946701049804688, -0.116912841796875, -0.10435867309570312, -0.09180450439453125, -0.07925033569335938, -0.0666961669921875, -0.054141998291015625, -0.04158782958984375, -0.029033660888671875, -0.0164794921875, -0.003925323486328125, 0.00862884521484375, 0.021183013916015625, 0.0337371826171875, 0.046291351318359375, 0.05884552001953125, 0.07139968872070312, 0.083953857421875, 0.09650802612304688, 0.10906219482421875, 0.12161636352539062, 0.1341705322265625, 0.14672470092773438, 0.15927886962890625, 0.17183303833007812, 0.18438720703125, 0.19694137573242188, 0.20949554443359375, 0.22204971313476562, 0.2346038818359375, 0.24715805053710938, 0.25971221923828125, 0.2722663879394531, 0.284820556640625, 0.2973747253417969, 0.30992889404296875, 0.3224830627441406, 0.3350372314453125, 0.3475914001464844, 0.36014556884765625, 0.3726997375488281, 0.38525390625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 11.0, 5.0, 12.0, 14.0, 17.0, 17.0, 17.0, 20.0, 21.0, 26.0, 40.0, 25.0, 33.0, 28.0, 38.0, 39.0, 40.0, 27.0, 48.0, 1060.0, 39.0, 37.0, 44.0, 43.0, 44.0, 41.0, 25.0, 22.0, 27.0, 26.0, 20.0, 17.0, 20.0, 19.0, 8.0, 11.0, 10.0, 7.0, 1.0, 4.0, 4.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-36.03125, -34.976318359375, -33.92138671875, -32.866455078125, -31.8115234375, -30.756591796875, -29.70166015625, -28.646728515625, -27.591796875, -26.536865234375, -25.48193359375, -24.427001953125, -23.3720703125, -22.317138671875, -21.26220703125, -20.207275390625, -19.15234375, -18.097412109375, -17.04248046875, -15.987548828125, -14.9326171875, -13.877685546875, -12.82275390625, -11.767822265625, -10.712890625, -9.657958984375, -8.60302734375, -7.548095703125, -6.4931640625, -5.438232421875, -4.38330078125, -3.328369140625, -2.2734375, -1.218505859375, -0.16357421875, 0.891357421875, 1.9462890625, 3.001220703125, 4.05615234375, 5.111083984375, 6.166015625, 7.220947265625, 8.27587890625, 9.330810546875, 10.3857421875, 11.440673828125, 12.49560546875, 13.550537109375, 14.60546875, 15.660400390625, 16.71533203125, 17.770263671875, 18.8251953125, 19.880126953125, 20.93505859375, 21.989990234375, 23.044921875, 24.099853515625, 25.15478515625, 26.209716796875, 27.2646484375, 28.319580078125, 29.37451171875, 30.429443359375, 31.484375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 14.0, 10.0, 16.0, 24.0, 33.0, 50.0, 69.0, 137.0, 167.0, 221.0, 388.0, 600.0, 897.0, 1187.0, 1995.0, 3051.0, 4543.0, 7172.0, 11436.0, 17735.0, 28453.0, 47114.0, 81255.0, 161640.0, 1353225.0, 165386.0, 83171.0, 47526.0, 29407.0, 18021.0, 11282.0, 7386.0, 4677.0, 3035.0, 1975.0, 1297.0, 838.0, 538.0, 361.0, 283.0, 183.0, 95.0, 81.0, 56.0, 54.0, 20.0, 11.0, 6.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1943359375, -0.18796730041503906, -0.18159866333007812, -0.1752300262451172, -0.16886138916015625, -0.1624927520751953, -0.15612411499023438, -0.14975547790527344, -0.1433868408203125, -0.13701820373535156, -0.13064956665039062, -0.12428092956542969, -0.11791229248046875, -0.11154365539550781, -0.10517501831054688, -0.09880638122558594, -0.092437744140625, -0.08606910705566406, -0.07970046997070312, -0.07333183288574219, -0.06696319580078125, -0.06059455871582031, -0.054225921630859375, -0.04785728454589844, -0.0414886474609375, -0.03512001037597656, -0.028751373291015625, -0.022382736206054688, -0.01601409912109375, -0.009645462036132812, -0.003276824951171875, 0.0030918121337890625, 0.00946044921875, 0.015829086303710938, 0.022197723388671875, 0.028566360473632812, 0.03493499755859375, 0.04130363464355469, 0.047672271728515625, 0.05404090881347656, 0.0604095458984375, 0.06677818298339844, 0.07314682006835938, 0.07951545715332031, 0.08588409423828125, 0.09225273132324219, 0.09862136840820312, 0.10499000549316406, 0.111358642578125, 0.11772727966308594, 0.12409591674804688, 0.1304645538330078, 0.13683319091796875, 0.1432018280029297, 0.14957046508789062, 0.15593910217285156, 0.1623077392578125, 0.16867637634277344, 0.17504501342773438, 0.1814136505126953, 0.18778228759765625, 0.1941509246826172, 0.20051956176757812, 0.20688819885253906, 0.2132568359375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 5.0, 7.0, 15.0, 14.0, 12.0, 7.0, 16.0, 29.0, 21.0, 30.0, 52.0, 39.0, 24.0, 32.0, 43.0, 28.0, 41.0, 42.0, 35.0, 54.0, 43.0, 47.0, 37.0, 35.0, 33.0, 28.0, 35.0, 29.0, 23.0, 21.0, 28.0, 17.0, 9.0, 10.0, 14.0, 7.0, 7.0, 5.0, 6.0, 2.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.635883331298828e-06, -3.5138800740242004e-06, -3.3918768167495728e-06, -3.269873559474945e-06, -3.1478703022003174e-06, -3.0258670449256897e-06, -2.903863787651062e-06, -2.7818605303764343e-06, -2.6598572731018066e-06, -2.537854015827179e-06, -2.4158507585525513e-06, -2.2938475012779236e-06, -2.171844244003296e-06, -2.0498409867286682e-06, -1.9278377294540405e-06, -1.8058344721794128e-06, -1.6838312149047852e-06, -1.5618279576301575e-06, -1.4398247003555298e-06, -1.317821443080902e-06, -1.1958181858062744e-06, -1.0738149285316467e-06, -9.51811671257019e-07, -8.298084139823914e-07, -7.078051567077637e-07, -5.85801899433136e-07, -4.637986421585083e-07, -3.417953848838806e-07, -2.1979212760925293e-07, -9.778887033462524e-08, 2.421438694000244e-08, 1.4621764421463013e-07, 2.682209014892578e-07, 3.902241587638855e-07, 5.122274160385132e-07, 6.342306733131409e-07, 7.562339305877686e-07, 8.782371878623962e-07, 1.000240445137024e-06, 1.1222437024116516e-06, 1.2442469596862793e-06, 1.366250216960907e-06, 1.4882534742355347e-06, 1.6102567315101624e-06, 1.73225998878479e-06, 1.8542632460594177e-06, 1.9762665033340454e-06, 2.098269760608673e-06, 2.2202730178833008e-06, 2.3422762751579285e-06, 2.464279532432556e-06, 2.586282789707184e-06, 2.7082860469818115e-06, 2.830289304256439e-06, 2.952292561531067e-06, 3.0742958188056946e-06, 3.1962990760803223e-06, 3.31830233335495e-06, 3.4403055906295776e-06, 3.5623088479042053e-06, 3.684312105178833e-06, 3.8063153624534607e-06, 3.928318619728088e-06, 4.050321877002716e-06, 4.172325134277344e-06]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 7.0, 5.0, 6.0, 2.0, 15.0, 17.0, 32.0, 29.0, 56.0, 86.0, 107.0, 167.0, 241.0, 416.0, 783.0, 1357.0, 2637.0, 5792.0, 13435.0, 36698.0, 79836.0, 159044.0, 236346.0, 231018.0, 149760.0, 73429.0, 31910.0, 13394.0, 5853.0, 2768.0, 1329.0, 709.0, 493.0, 244.0, 159.0, 122.0, 76.0, 58.0, 54.0, 23.0, 16.0, 10.0, 8.0, 2.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7404556274414062e-05, -1.680385321378708e-05, -1.6203150153160095e-05, -1.560244709253311e-05, -1.5001744031906128e-05, -1.4401040971279144e-05, -1.380033791065216e-05, -1.3199634850025177e-05, -1.2598931789398193e-05, -1.199822872877121e-05, -1.1397525668144226e-05, -1.0796822607517242e-05, -1.0196119546890259e-05, -9.595416486263275e-06, -8.994713425636292e-06, -8.394010365009308e-06, -7.793307304382324e-06, -7.1926042437553406e-06, -6.591901183128357e-06, -5.991198122501373e-06, -5.39049506187439e-06, -4.789792001247406e-06, -4.189088940620422e-06, -3.5883858799934387e-06, -2.987682819366455e-06, -2.3869797587394714e-06, -1.7862766981124878e-06, -1.1855736374855042e-06, -5.848705768585205e-07, 1.5832483768463135e-08, 6.165355443954468e-07, 1.2172386050224304e-06, 1.817941665649414e-06, 2.4186447262763977e-06, 3.0193477869033813e-06, 3.620050847530365e-06, 4.220753908157349e-06, 4.821456968784332e-06, 5.422160029411316e-06, 6.0228630900382996e-06, 6.623566150665283e-06, 7.224269211292267e-06, 7.82497227191925e-06, 8.425675332546234e-06, 9.026378393173218e-06, 9.627081453800201e-06, 1.0227784514427185e-05, 1.0828487575054169e-05, 1.1429190635681152e-05, 1.2029893696308136e-05, 1.263059675693512e-05, 1.3231299817562103e-05, 1.3832002878189087e-05, 1.443270593881607e-05, 1.5033408999443054e-05, 1.5634112060070038e-05, 1.623481512069702e-05, 1.6835518181324005e-05, 1.743622124195099e-05, 1.8036924302577972e-05, 1.8637627363204956e-05, 1.923833042383194e-05, 1.9839033484458923e-05, 2.0439736545085907e-05, 2.104043960571289e-05]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 16.0, 19.0, 16.0, 29.0, 26.0, 46.0, 31.0, 40.0, 58.0, 73.0, 77.0, 75.0, 70.0, 63.0, 60.0, 65.0, 47.0, 45.0, 41.0, 24.0, 17.0, 12.0, 17.0, 15.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05051878260565e-06, -3.9237920645973645e-06, -3.7970648918417282e-06, -3.6703379464597674e-06, -3.5436110010778066e-06, -3.416884283069521e-06, -3.2901573376875604e-06, -3.1634303923055995e-06, -3.0367034469236387e-06, -2.909976501541678e-06, -2.783249556159717e-06, -2.656522610777756e-06, -2.529795892769471e-06, -2.4030687200138345e-06, -2.276342002005549e-06, -2.1496150566235883e-06, -2.0228881112416275e-06, -1.8961611658596667e-06, -1.7694342204777058e-06, -1.6427073887825827e-06, -1.5159804434006219e-06, -1.389253498018661e-06, -1.262526666323538e-06, -1.1357997209415771e-06, -1.0090727755596163e-06, -8.823458301776554e-07, -7.556189416391135e-07, -6.288920531005715e-07, -5.021651077186107e-07, -3.7543816233664984e-07, -2.4871127379810787e-07, -1.219843852595659e-07, 4.742560122394934e-09, 1.3146947708264634e-07, 2.5819639404289774e-07, 3.8492331100314914e-07, 5.116502279634005e-07, 6.383771733453614e-07, 7.651040618839033e-07, 8.918309504224453e-07, 1.0185578958044061e-06, 1.145284841186367e-06, 1.2720117865683278e-06, 1.398738618263451e-06, 1.5254655636454117e-06, 1.6521925090273726e-06, 1.7789193407224957e-06, 1.9056462861044565e-06, 2.0323732314864174e-06, 2.159100176868378e-06, 2.285827122250339e-06, 2.4125540676323e-06, 2.5392810130142607e-06, 2.666007731022546e-06, 2.792734676404507e-06, 2.9194616217864677e-06, 3.0461885671684286e-06, 3.1729155125503894e-06, 3.2996424579323502e-06, 3.426369403314311e-06, 3.5530961213225964e-06, 3.6798232940782327e-06, 3.806550012086518e-06, 3.933277184842154e-06, 4.06000390285044e-06]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 8.0, 4.0, 1.0, 9.0, 1.0, 8.0, 12.0, 6.0, 27.0, 13.0, 21.0, 14.0, 18.0, 57.0, 22.0, 44.0, 25.0, 28.0, 59.0, 34.0, 64.0, 24.0, 38.0, 52.0, 25.0, 56.0, 26.0, 62.0, 24.0, 26.0, 38.0, 17.0, 43.0, 13.0, 16.0, 24.0, 9.0, 9.0, 2.0, 4.0, 12.0, 2.0, 6.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6226043701171875e-06, -2.5387853384017944e-06, -2.4549663066864014e-06, -2.3711472749710083e-06, -2.2873282432556152e-06, -2.203509211540222e-06, -2.119690179824829e-06, -2.035871148109436e-06, -1.952052116394043e-06, -1.86823308467865e-06, -1.7844140529632568e-06, -1.7005950212478638e-06, -1.6167759895324707e-06, -1.5329569578170776e-06, -1.4491379261016846e-06, -1.3653188943862915e-06, -1.2814998626708984e-06, -1.1976808309555054e-06, -1.1138617992401123e-06, -1.0300427675247192e-06, -9.462237358093262e-07, -8.624047040939331e-07, -7.7858567237854e-07, -6.94766640663147e-07, -6.109476089477539e-07, -5.271285772323608e-07, -4.4330954551696777e-07, -3.594905138015747e-07, -2.7567148208618164e-07, -1.9185245037078857e-07, -1.0803341865539551e-07, -2.421438694000244e-08, 5.960464477539063e-08, 1.434236764907837e-07, 2.2724270820617676e-07, 3.110617399215698e-07, 3.948807716369629e-07, 4.78699803352356e-07, 5.62518835067749e-07, 6.463378667831421e-07, 7.301568984985352e-07, 8.139759302139282e-07, 8.977949619293213e-07, 9.816139936447144e-07, 1.0654330253601074e-06, 1.1492520570755005e-06, 1.2330710887908936e-06, 1.3168901205062866e-06, 1.4007091522216797e-06, 1.4845281839370728e-06, 1.5683472156524658e-06, 1.6521662473678589e-06, 1.735985279083252e-06, 1.819804310798645e-06, 1.903623342514038e-06, 1.987442374229431e-06, 2.0712614059448242e-06, 2.1550804376602173e-06, 2.2388994693756104e-06, 2.3227185010910034e-06, 2.4065375328063965e-06, 2.4903565645217896e-06, 2.5741755962371826e-06, 2.6579946279525757e-06, 2.7418136596679688e-06]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 9.0, 11.0, 10.0, 15.0, 14.0, 13.0, 11.0, 19.0, 20.0, 23.0, 34.0, 37.0, 34.0, 51.0, 43.0, 48.0, 37.0, 49.0, 45.0, 46.0, 45.0, 43.0, 45.0, 35.0, 30.0, 29.0, 25.0, 25.0, 18.0, 23.0, 14.0, 11.0, 16.0, 13.0, 11.0, 9.0, 12.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-60.21875, -58.46728515625, -56.7158203125, -54.96435546875, -53.212890625, -51.46142578125, -49.7099609375, -47.95849609375, -46.20703125, -44.45556640625, -42.7041015625, -40.95263671875, -39.201171875, -37.44970703125, -35.6982421875, -33.94677734375, -32.1953125, -30.44384765625, -28.6923828125, -26.94091796875, -25.189453125, -23.43798828125, -21.6865234375, -19.93505859375, -18.18359375, -16.43212890625, -14.6806640625, -12.92919921875, -11.177734375, -9.42626953125, -7.6748046875, -5.92333984375, -4.171875, -2.42041015625, -0.6689453125, 1.08251953125, 2.833984375, 4.58544921875, 6.3369140625, 8.08837890625, 9.83984375, 11.59130859375, 13.3427734375, 15.09423828125, 16.845703125, 18.59716796875, 20.3486328125, 22.10009765625, 23.8515625, 25.60302734375, 27.3544921875, 29.10595703125, 30.857421875, 32.60888671875, 34.3603515625, 36.11181640625, 37.86328125, 39.61474609375, 41.3662109375, 43.11767578125, 44.869140625, 46.62060546875, 48.3720703125, 50.12353515625, 51.875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 6.0, 4.0, 10.0, 11.0, 16.0, 15.0, 20.0, 27.0, 34.0, 35.0, 61.0, 89.0, 158.0, 194.0, 372.0, 653.0, 1731.0, 5349.0, 22181.0, 109695.0, 433628.0, 367119.0, 82693.0, 17141.0, 4397.0, 1388.0, 588.0, 303.0, 170.0, 121.0, 71.0, 64.0, 54.0, 20.0, 30.0, 26.0, 18.0, 19.0, 14.0, 9.0, 7.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-9.4140625, -9.136474609375, -8.85888671875, -8.581298828125, -8.3037109375, -8.026123046875, -7.74853515625, -7.470947265625, -7.193359375, -6.915771484375, -6.63818359375, -6.360595703125, -6.0830078125, -5.805419921875, -5.52783203125, -5.250244140625, -4.97265625, -4.695068359375, -4.41748046875, -4.139892578125, -3.8623046875, -3.584716796875, -3.30712890625, -3.029541015625, -2.751953125, -2.474365234375, -2.19677734375, -1.919189453125, -1.6416015625, -1.364013671875, -1.08642578125, -0.808837890625, -0.53125, -0.253662109375, 0.02392578125, 0.301513671875, 0.5791015625, 0.856689453125, 1.13427734375, 1.411865234375, 1.689453125, 1.967041015625, 2.24462890625, 2.522216796875, 2.7998046875, 3.077392578125, 3.35498046875, 3.632568359375, 3.91015625, 4.187744140625, 4.46533203125, 4.742919921875, 5.0205078125, 5.298095703125, 5.57568359375, 5.853271484375, 6.130859375, 6.408447265625, 6.68603515625, 6.963623046875, 7.2412109375, 7.518798828125, 7.79638671875, 8.073974609375, 8.3515625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 8.0, 13.0, 15.0, 28.0, 36.0, 46.0, 63.0, 62.0, 64.0, 91.0, 2142.0, 86.0, 86.0, 74.0, 52.0, 57.0, 33.0, 19.0, 32.0, 12.0, 9.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.875, -149.5517578125, -145.228515625, -140.9052734375, -136.58203125, -132.2587890625, -127.935546875, -123.6123046875, -119.2890625, -114.9658203125, -110.642578125, -106.3193359375, -101.99609375, -97.6728515625, -93.349609375, -89.0263671875, -84.703125, -80.3798828125, -76.056640625, -71.7333984375, -67.41015625, -63.0869140625, -58.763671875, -54.4404296875, -50.1171875, -45.7939453125, -41.470703125, -37.1474609375, -32.82421875, -28.5009765625, -24.177734375, -19.8544921875, -15.53125, -11.2080078125, -6.884765625, -2.5615234375, 1.76171875, 6.0849609375, 10.408203125, 14.7314453125, 19.0546875, 23.3779296875, 27.701171875, 32.0244140625, 36.34765625, 40.6708984375, 44.994140625, 49.3173828125, 53.640625, 57.9638671875, 62.287109375, 66.6103515625, 70.93359375, 75.2568359375, 79.580078125, 83.9033203125, 88.2265625, 92.5498046875, 96.873046875, 101.1962890625, 105.51953125, 109.8427734375, 114.166015625, 118.4892578125, 122.8125]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 16.0, 21.0, 22.0, 34.0, 45.0, 75.0, 112.0, 140.0, 231.0, 328.0, 606.0, 1361.0, 4914.0, 68310.0, 2915417.0, 143219.0, 7353.0, 1562.0, 739.0, 426.0, 248.0, 158.0, 106.0, 78.0, 40.0, 41.0, 23.0, 20.0, 17.0, 13.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.6640625, -14.1849365234375, -13.705810546875, -13.2266845703125, -12.74755859375, -12.2684326171875, -11.789306640625, -11.3101806640625, -10.8310546875, -10.3519287109375, -9.872802734375, -9.3936767578125, -8.91455078125, -8.4354248046875, -7.956298828125, -7.4771728515625, -6.998046875, -6.5189208984375, -6.039794921875, -5.5606689453125, -5.08154296875, -4.6024169921875, -4.123291015625, -3.6441650390625, -3.1650390625, -2.6859130859375, -2.206787109375, -1.7276611328125, -1.24853515625, -0.7694091796875, -0.290283203125, 0.1888427734375, 0.66796875, 1.1470947265625, 1.626220703125, 2.1053466796875, 2.58447265625, 3.0635986328125, 3.542724609375, 4.0218505859375, 4.5009765625, 4.9801025390625, 5.459228515625, 5.9383544921875, 6.41748046875, 6.8966064453125, 7.375732421875, 7.8548583984375, 8.333984375, 8.8131103515625, 9.292236328125, 9.7713623046875, 10.25048828125, 10.7296142578125, 11.208740234375, 11.6878662109375, 12.1669921875, 12.6461181640625, 13.125244140625, 13.6043701171875, 14.08349609375, 14.5626220703125, 15.041748046875, 15.5208740234375, 16.0]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 11.0, 28.0, 96.0, 313.0, 319.0, 148.0, 44.0, 20.0, 7.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.9063720703125, -93.5420150756836, -84.17765808105469, -74.81330108642578, -65.44894409179688, -56.08458709716797, -46.72023010253906, -37.355873107910156, -27.99151611328125, -18.627159118652344, -9.262802124023438, 0.10155487060546875, 9.465911865234375, 18.83026885986328, 28.194625854492188, 37.558982849121094, 46.92333984375, 56.287696838378906, 65.65205383300781, 75.01641082763672, 84.38076782226562, 93.74512481689453, 103.10948181152344, 112.47383880615234, 121.83819580078125, 131.20254516601562, 140.56690979003906, 149.9312744140625, 159.29562377929688, 168.65997314453125, 178.0243377685547, 187.38870239257812, 196.7530517578125, 206.11740112304688, 215.4817657470703, 224.84613037109375, 234.21047973632812, 243.5748291015625, 252.93919372558594, 262.3035583496094, 271.66790771484375, 281.0322570800781, 290.3966064453125, 299.760986328125, 309.1253356933594, 318.48968505859375, 327.85406494140625, 337.2184143066406, 346.582763671875, 355.9471130371094, 365.31146240234375, 374.67584228515625, 384.0401916503906, 393.404541015625, 402.7689208984375, 412.1332702636719, 421.49761962890625, 430.8619689941406, 440.226318359375, 449.5906982421875, 458.9550476074219, 468.31939697265625, 477.68377685546875, 487.0481262207031, 496.4124755859375]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 2.0, 4.0, 10.0, 7.0, 11.0, 10.0, 18.0, 11.0, 20.0, 28.0, 15.0, 36.0, 40.0, 38.0, 41.0, 41.0, 46.0, 45.0, 53.0, 43.0, 57.0, 50.0, 44.0, 41.0, 42.0, 28.0, 39.0, 20.0, 28.0, 26.0, 19.0, 20.0, 15.0, 8.0, 13.0, 11.0, 7.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.92298889160156, -126.03353118896484, -122.14407348632812, -118.25460815429688, -114.36515045166016, -110.47569274902344, -106.58622741699219, -102.69676971435547, -98.80731201171875, -94.91785430908203, -91.02839660644531, -87.13893127441406, -83.24947357177734, -79.36001586914062, -75.47055053710938, -71.58109283447266, -67.69163513183594, -63.80217742919922, -59.912715911865234, -56.02325439453125, -52.13379669189453, -48.24433898925781, -44.35487747192383, -40.465415954589844, -36.575958251953125, -32.686500549316406, -28.797039031982422, -24.90757942199707, -21.01811981201172, -17.128660202026367, -13.239200592041016, -9.349740982055664, -5.4602813720703125, -1.570821762084961, 2.3186378479003906, 6.208097457885742, 10.097557067871094, 13.987016677856445, 17.876476287841797, 21.76593589782715, 25.6553955078125, 29.54485511779785, 33.4343147277832, 37.32377624511719, 41.213233947753906, 45.102691650390625, 48.99215316772461, 52.881614685058594, 56.77107238769531, 60.66053009033203, 64.54998779296875, 68.439453125, 72.32891082763672, 76.21836853027344, 80.10783386230469, 83.9972915649414, 87.88674926757812, 91.77620697021484, 95.66566467285156, 99.55513000488281, 103.44458770751953, 107.33404541015625, 111.2235107421875, 115.11296844482422, 119.00242614746094]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 7.0, 11.0, 13.0, 22.0, 26.0, 28.0, 47.0, 50.0, 54.0, 95.0, 110.0, 155.0, 167.0, 229.0, 311.0, 412.0, 473.0, 521.0, 763.0, 1471.0, 1040028.0, 771.0, 579.0, 447.0, 347.0, 322.0, 245.0, 196.0, 154.0, 116.0, 76.0, 72.0, 47.0, 55.0, 31.0, 22.0, 18.0, 9.0, 9.0, 7.0, 11.0, 5.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-30.341537475585938, -29.36426544189453, -28.386991500854492, -27.409719467163086, -26.432445526123047, -25.45517349243164, -24.477901458740234, -23.500627517700195, -22.523353576660156, -21.54608154296875, -20.56880760192871, -19.591535568237305, -18.614261627197266, -17.63698959350586, -16.659717559814453, -15.682443618774414, -14.705171585083008, -13.727898597717285, -12.750625610351562, -11.773353576660156, -10.796079635620117, -9.818807601928711, -8.841534614562988, -7.864261627197266, -6.886988639831543, -5.90971565246582, -4.932442665100098, -3.955170154571533, -2.9778971672058105, -2.000624179840088, -1.0233516693115234, -0.04607868194580078, 0.9311943054199219, 1.908467173576355, 2.885740041732788, 3.8630127906799316, 4.840285778045654, 5.817558765411377, 6.794831275939941, 7.772104263305664, 8.749377250671387, 9.72665023803711, 10.703923225402832, 11.681196212768555, 12.658468246459961, 13.6357421875, 14.613014221191406, 15.590287208557129, 16.56756019592285, 17.544832229614258, 18.522106170654297, 19.499378204345703, 20.476652145385742, 21.45392417907715, 22.431198120117188, 23.408470153808594, 24.3857421875, 25.363014221191406, 26.340288162231445, 27.31756019592285, 28.29483413696289, 29.272106170654297, 30.249378204345703, 31.226652145385742, 32.20392608642578]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 9.0, 12.0, 26.0, 25.0, 37.0, 82.0, 234.0, 120112.0, 51342560.0, 259.0, 57.0, 25.0, 19.0, 11.0, 7.0, 5.0, 3.0, 8.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1996.619873046875, -1946.710693359375, -1896.8016357421875, -1846.8924560546875, -1796.9833984375, -1747.07421875, -1697.1650390625, -1647.2559814453125, -1597.3468017578125, -1547.4376220703125, -1497.528564453125, -1447.619384765625, -1397.7103271484375, -1347.8011474609375, -1297.89208984375, -1247.98291015625, -1198.07373046875, -1148.16455078125, -1098.2554931640625, -1048.3463134765625, -998.4371948242188, -948.528076171875, -898.6189575195312, -848.7098388671875, -798.80078125, -748.8916625976562, -698.9825439453125, -649.0733642578125, -599.1642456054688, -549.255126953125, -499.34600830078125, -449.4368591308594, -399.5277099609375, -349.61859130859375, -299.7094421386719, -249.80032348632812, -199.8911895751953, -149.9820556640625, -100.07293701171875, -50.163787841796875, -0.254669189453125, 49.65446090698242, 99.56359100341797, 149.47271728515625, 199.38185119628906, 249.29098510742188, 299.2001037597656, 349.1092529296875, 399.01837158203125, 448.927490234375, 498.8366394042969, 548.7457275390625, 598.6549072265625, 648.5640258789062, 698.47314453125, 748.38232421875, 798.2913818359375, 848.2005004882812, 898.109619140625, 948.018798828125, 997.9279174804688, 1047.8370361328125, 1097.74609375, 1147.6552734375, 1197.564453125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 8.0, 13.0, 14.0, 27.0, 41.0, 50.0, 61.0, 90.0, 139.0, 189.0, 324.0, 483.0, 746.0, 1079.0, 1743.0, 2764.0, 4256.0, 6813.0, 11148.0, 18251.0, 29892.0, 49717.0, 83167.0, 142782.0, 266478.0, 591608.0, 4075678.0, 472707.0, 222321.0, 123369.0, 72456.0, 43701.0, 26404.0, 16049.0, 10146.0, 6020.0, 3774.0, 2436.0, 1587.0, 958.0, 678.0, 438.0, 271.0, 183.0, 128.0, 80.0, 62.0, 35.0, 23.0, 17.0, 13.0, 8.0, 11.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.101318359375, -0.09818840026855469, -0.09505844116210938, -0.09192848205566406, -0.08879852294921875, -0.08566856384277344, -0.08253860473632812, -0.07940864562988281, -0.0762786865234375, -0.07314872741699219, -0.07001876831054688, -0.06688880920410156, -0.06375885009765625, -0.06062889099121094, -0.057498931884765625, -0.05436897277832031, -0.051239013671875, -0.04810905456542969, -0.044979095458984375, -0.04184913635253906, -0.03871917724609375, -0.03558921813964844, -0.032459259033203125, -0.029329299926757812, -0.0261993408203125, -0.023069381713867188, -0.019939422607421875, -0.016809463500976562, -0.01367950439453125, -0.010549545288085938, -0.007419586181640625, -0.0042896270751953125, -0.00115966796875, 0.0019702911376953125, 0.005100250244140625, 0.008230209350585938, 0.01136016845703125, 0.014490127563476562, 0.017620086669921875, 0.020750045776367188, 0.0238800048828125, 0.027009963989257812, 0.030139923095703125, 0.03326988220214844, 0.03639984130859375, 0.03952980041503906, 0.042659759521484375, 0.04578971862792969, 0.048919677734375, 0.05204963684082031, 0.055179595947265625, 0.05830955505371094, 0.06143951416015625, 0.06456947326660156, 0.06769943237304688, 0.07082939147949219, 0.0739593505859375, 0.07708930969238281, 0.08021926879882812, 0.08334922790527344, 0.08647918701171875, 0.08960914611816406, 0.09273910522460938, 0.09586906433105469, 0.0989990234375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 2.0, 4.0, 8.0, 11.0, 13.0, 8.0, 11.0, 19.0, 25.0, 22.0, 37.0, 26.0, 23.0, 34.0, 41.0, 33.0, 30.0, 40.0, 39.0, 1069.0, 33.0, 54.0, 55.0, 44.0, 39.0, 31.0, 38.0, 28.0, 36.0, 26.0, 26.0, 22.0, 14.0, 18.0, 12.0, 21.0, 8.0, 6.0, 4.0, 4.0, 3.0, 4.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.296875, -13.817626953125, -13.33837890625, -12.859130859375, -12.3798828125, -11.900634765625, -11.42138671875, -10.942138671875, -10.462890625, -9.983642578125, -9.50439453125, -9.025146484375, -8.5458984375, -8.066650390625, -7.58740234375, -7.108154296875, -6.62890625, -6.149658203125, -5.67041015625, -5.191162109375, -4.7119140625, -4.232666015625, -3.75341796875, -3.274169921875, -2.794921875, -2.315673828125, -1.83642578125, -1.357177734375, -0.8779296875, -0.398681640625, 0.08056640625, 0.559814453125, 1.0390625, 1.518310546875, 1.99755859375, 2.476806640625, 2.9560546875, 3.435302734375, 3.91455078125, 4.393798828125, 4.873046875, 5.352294921875, 5.83154296875, 6.310791015625, 6.7900390625, 7.269287109375, 7.74853515625, 8.227783203125, 8.70703125, 9.186279296875, 9.66552734375, 10.144775390625, 10.6240234375, 11.103271484375, 11.58251953125, 12.061767578125, 12.541015625, 13.020263671875, 13.49951171875, 13.978759765625, 14.4580078125, 14.937255859375, 15.41650390625, 15.895751953125, 16.375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 5.0, 5.0, 4.0, 7.0, 19.0, 28.0, 45.0, 42.0, 69.0, 116.0, 184.0, 210.0, 330.0, 478.0, 695.0, 915.0, 1404.0, 2115.0, 2982.0, 4445.0, 6577.0, 10065.0, 15507.0, 23893.0, 38134.0, 60700.0, 100150.0, 169191.0, 310873.0, 624007.0, 3924688.0, 434143.0, 222109.0, 127098.0, 77113.0, 47436.0, 29689.0, 19003.0, 12203.0, 8152.0, 5412.0, 3561.0, 2329.0, 1622.0, 1130.0, 774.0, 473.0, 369.0, 304.0, 193.0, 137.0, 104.0, 70.0, 43.0, 31.0, 22.0, 19.0, 12.0, 5.0, 7.0, 2.0, 4.0, 2.0], "bins": [-0.07647705078125, -0.07402896881103516, -0.07158088684082031, -0.06913280487060547, -0.06668472290039062, -0.06423664093017578, -0.06178855895996094, -0.059340476989746094, -0.05689239501953125, -0.054444313049316406, -0.05199623107910156, -0.04954814910888672, -0.047100067138671875, -0.04465198516845703, -0.04220390319824219, -0.039755821228027344, -0.0373077392578125, -0.034859657287597656, -0.03241157531738281, -0.02996349334716797, -0.027515411376953125, -0.02506732940673828, -0.022619247436523438, -0.020171165466308594, -0.01772308349609375, -0.015275001525878906, -0.012826919555664062, -0.010378837585449219, -0.007930755615234375, -0.005482673645019531, -0.0030345916748046875, -0.0005865097045898438, 0.001861572265625, 0.004309654235839844, 0.0067577362060546875, 0.009205818176269531, 0.011653900146484375, 0.014101982116699219, 0.016550064086914062, 0.018998146057128906, 0.02144622802734375, 0.023894309997558594, 0.026342391967773438, 0.02879047393798828, 0.031238555908203125, 0.03368663787841797, 0.03613471984863281, 0.038582801818847656, 0.0410308837890625, 0.043478965759277344, 0.04592704772949219, 0.04837512969970703, 0.050823211669921875, 0.05327129364013672, 0.05571937561035156, 0.058167457580566406, 0.06061553955078125, 0.0630636215209961, 0.06551170349121094, 0.06795978546142578, 0.07040786743164062, 0.07285594940185547, 0.07530403137207031, 0.07775211334228516, 0.0802001953125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 5.0, 0.0, 6.0, 0.0, 14.0, 8.0, 13.0, 18.0, 15.0, 25.0, 25.0, 24.0, 30.0, 28.0, 32.0, 37.0, 48.0, 38.0, 50.0, 41.0, 1070.0, 45.0, 49.0, 38.0, 47.0, 44.0, 36.0, 29.0, 31.0, 30.0, 24.0, 19.0, 19.0, 19.0, 19.0, 11.0, 8.0, 7.0, 6.0, 5.0, 3.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.609375, -12.2337646484375, -11.858154296875, -11.4825439453125, -11.10693359375, -10.7313232421875, -10.355712890625, -9.9801025390625, -9.6044921875, -9.2288818359375, -8.853271484375, -8.4776611328125, -8.10205078125, -7.7264404296875, -7.350830078125, -6.9752197265625, -6.599609375, -6.2239990234375, -5.848388671875, -5.4727783203125, -5.09716796875, -4.7215576171875, -4.345947265625, -3.9703369140625, -3.5947265625, -3.2191162109375, -2.843505859375, -2.4678955078125, -2.09228515625, -1.7166748046875, -1.341064453125, -0.9654541015625, -0.58984375, -0.2142333984375, 0.161376953125, 0.5369873046875, 0.91259765625, 1.2882080078125, 1.663818359375, 2.0394287109375, 2.4150390625, 2.7906494140625, 3.166259765625, 3.5418701171875, 3.91748046875, 4.2930908203125, 4.668701171875, 5.0443115234375, 5.419921875, 5.7955322265625, 6.171142578125, 6.5467529296875, 6.92236328125, 7.2979736328125, 7.673583984375, 8.0491943359375, 8.4248046875, 8.8004150390625, 9.176025390625, 9.5516357421875, 9.92724609375, 10.3028564453125, 10.678466796875, 11.0540771484375, 11.4296875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 5.0, 9.0, 5.0, 7.0, 6.0, 9.0, 6.0, 12.0, 24.0, 34.0, 48.0, 46.0, 47.0, 59.0, 86.0, 108.0, 125.0, 141.0, 216.0, 272.0, 326.0, 504.0, 723.0, 1282.0, 3934.0, 19601.0, 158735.0, 6034468.0, 55662.0, 9478.0, 2250.0, 933.0, 556.0, 376.0, 263.0, 198.0, 168.0, 141.0, 93.0, 97.0, 56.0, 73.0, 52.0, 47.0, 40.0, 21.0, 32.0, 21.0, 5.0, 15.0, 15.0, 2.0, 6.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.44140625, -0.4272918701171875, -0.413177490234375, -0.3990631103515625, -0.38494873046875, -0.3708343505859375, -0.356719970703125, -0.3426055908203125, -0.3284912109375, -0.3143768310546875, -0.300262451171875, -0.2861480712890625, -0.27203369140625, -0.2579193115234375, -0.243804931640625, -0.2296905517578125, -0.215576171875, -0.2014617919921875, -0.187347412109375, -0.1732330322265625, -0.15911865234375, -0.1450042724609375, -0.130889892578125, -0.1167755126953125, -0.1026611328125, -0.0885467529296875, -0.074432373046875, -0.0603179931640625, -0.04620361328125, -0.0320892333984375, -0.017974853515625, -0.0038604736328125, 0.01025390625, 0.0243682861328125, 0.038482666015625, 0.0525970458984375, 0.06671142578125, 0.0808258056640625, 0.094940185546875, 0.1090545654296875, 0.1231689453125, 0.1372833251953125, 0.151397705078125, 0.1655120849609375, 0.17962646484375, 0.1937408447265625, 0.207855224609375, 0.2219696044921875, 0.236083984375, 0.2501983642578125, 0.264312744140625, 0.2784271240234375, 0.29254150390625, 0.3066558837890625, 0.320770263671875, 0.3348846435546875, 0.3489990234375, 0.3631134033203125, 0.377227783203125, 0.3913421630859375, 0.40545654296875, 0.4195709228515625, 0.433685302734375, 0.4477996826171875, 0.4619140625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 10.0, 11.0, 16.0, 11.0, 14.0, 11.0, 26.0, 23.0, 19.0, 24.0, 24.0, 40.0, 36.0, 36.0, 36.0, 34.0, 37.0, 37.0, 39.0, 1050.0, 49.0, 35.0, 42.0, 40.0, 34.0, 32.0, 32.0, 27.0, 25.0, 24.0, 19.0, 14.0, 19.0, 19.0, 10.0, 15.0, 14.0, 6.0, 8.0, 9.0, 2.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.7578125, -7.510986328125, -7.26416015625, -7.017333984375, -6.7705078125, -6.523681640625, -6.27685546875, -6.030029296875, -5.783203125, -5.536376953125, -5.28955078125, -5.042724609375, -4.7958984375, -4.549072265625, -4.30224609375, -4.055419921875, -3.80859375, -3.561767578125, -3.31494140625, -3.068115234375, -2.8212890625, -2.574462890625, -2.32763671875, -2.080810546875, -1.833984375, -1.587158203125, -1.34033203125, -1.093505859375, -0.8466796875, -0.599853515625, -0.35302734375, -0.106201171875, 0.140625, 0.387451171875, 0.63427734375, 0.881103515625, 1.1279296875, 1.374755859375, 1.62158203125, 1.868408203125, 2.115234375, 2.362060546875, 2.60888671875, 2.855712890625, 3.1025390625, 3.349365234375, 3.59619140625, 3.843017578125, 4.08984375, 4.336669921875, 4.58349609375, 4.830322265625, 5.0771484375, 5.323974609375, 5.57080078125, 5.817626953125, 6.064453125, 6.311279296875, 6.55810546875, 6.804931640625, 7.0517578125, 7.298583984375, 7.54541015625, 7.792236328125, 8.0390625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 650.0, 356.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.42967224121094, -31.19765853881836, -28.96564292907715, -26.73362922668457, -24.50161361694336, -22.26959991455078, -20.037586212158203, -17.805572509765625, -15.573556900024414, -13.34154224395752, -11.109527587890625, -8.877513885498047, -6.645499229431152, -4.413484573364258, -2.1814708709716797, 0.050543785095214844, 2.2825584411621094, 4.514573097229004, 6.74658727645874, 8.978601455688477, 11.210616111755371, 13.442630767822266, 15.674644470214844, 17.906658172607422, 20.138673782348633, 22.37068748474121, 24.602703094482422, 26.834716796875, 29.066730499267578, 31.29874610900879, 33.53076171875, 35.76277542114258, 37.994789123535156, 40.226802825927734, 42.45881652832031, 44.690834045410156, 46.922847747802734, 49.15486145019531, 51.38687515258789, 53.61888885498047, 55.85090637207031, 58.08292007446289, 60.31493377685547, 62.54695129394531, 64.77896118164062, 67.01097869873047, 69.24299621582031, 71.47500610351562, 73.70701599121094, 75.93903350830078, 78.1710433959961, 80.40306091308594, 82.63507080078125, 84.8670883178711, 87.09910583496094, 89.33111572265625, 91.5631332397461, 93.79515075683594, 96.02716064453125, 98.2591781616211, 100.4911880493164, 102.72320556640625, 104.95521545410156, 107.1872329711914, 109.41925048828125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 12.0, 6.0, 7.0, 10.0, 15.0, 16.0, 11.0, 14.0, 18.0, 21.0, 29.0, 18.0, 17.0, 25.0, 35.0, 31.0, 31.0, 43.0, 33.0, 47.0, 37.0, 33.0, 44.0, 53.0, 49.0, 34.0, 19.0, 24.0, 29.0, 28.0, 24.0, 20.0, 22.0, 17.0, 14.0, 17.0, 21.0, 13.0, 9.0, 8.0, 7.0, 8.0, 9.0, 10.0, 2.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-16.5479736328125, -16.06859588623047, -15.589218139648438, -15.109840393066406, -14.630461692810059, -14.151083946228027, -13.671706199645996, -13.192328453063965, -12.712950706481934, -12.233572959899902, -11.754195213317871, -11.274816513061523, -10.795438766479492, -10.316061019897461, -9.83668327331543, -9.357305526733398, -8.877927780151367, -8.398550033569336, -7.9191718101501465, -7.439794063568115, -6.960416316986084, -6.4810380935668945, -6.001660346984863, -5.522282600402832, -5.042903900146484, -4.563526153564453, -4.084147930145264, -3.6047701835632324, -3.125392436981201, -2.646014451980591, -2.1666364669799805, -1.6872587203979492, -1.207880973815918, -0.7285031080245972, -0.2491251826286316, 0.23025274276733398, 0.7096306085586548, 1.1890084743499756, 1.668386459350586, 2.147764205932617, 2.6271421909332275, 3.106520175933838, 3.585897922515869, 4.065276145935059, 4.54465389251709, 5.024031639099121, 5.503409385681152, 5.982787132263184, 6.462165355682373, 6.941543102264404, 7.420921325683594, 7.900299072265625, 8.379676818847656, 8.859054565429688, 9.338432312011719, 9.81781005859375, 10.297188758850098, 10.776566505432129, 11.25594425201416, 11.735322952270508, 12.214700698852539, 12.69407844543457, 13.173456192016602, 13.652833938598633, 14.132211685180664]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 7.0, 4.0, 9.0, 9.0, 3.0, 11.0, 11.0, 12.0, 21.0, 33.0, 28.0, 33.0, 64.0, 82.0, 65.0, 102.0, 151.0, 195.0, 294.0, 419.0, 770.0, 3967.0, 17672.0, 3853001.0, 300593.0, 10316.0, 3324.0, 841.0, 522.0, 375.0, 296.0, 232.0, 164.0, 114.0, 122.0, 76.0, 81.0, 56.0, 39.0, 31.0, 20.0, 18.0, 25.0, 9.0, 13.0, 16.0, 4.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.036346435546875, -0.03517293930053711, -0.03399944305419922, -0.03282594680786133, -0.03165245056152344, -0.030478954315185547, -0.029305458068847656, -0.028131961822509766, -0.026958465576171875, -0.025784969329833984, -0.024611473083496094, -0.023437976837158203, -0.022264480590820312, -0.021090984344482422, -0.01991748809814453, -0.01874399185180664, -0.01757049560546875, -0.01639699935913086, -0.015223503112792969, -0.014050006866455078, -0.012876510620117188, -0.011703014373779297, -0.010529518127441406, -0.009356021881103516, -0.008182525634765625, -0.007009029388427734, -0.005835533142089844, -0.004662036895751953, -0.0034885406494140625, -0.002315044403076172, -0.0011415481567382812, 3.1948089599609375e-05, 0.0012054443359375, 0.0023789405822753906, 0.0035524368286132812, 0.004725933074951172, 0.0058994293212890625, 0.007072925567626953, 0.008246421813964844, 0.009419918060302734, 0.010593414306640625, 0.011766910552978516, 0.012940406799316406, 0.014113903045654297, 0.015287399291992188, 0.016460895538330078, 0.01763439178466797, 0.01880788803100586, 0.01998138427734375, 0.02115488052368164, 0.02232837677001953, 0.023501873016357422, 0.024675369262695312, 0.025848865509033203, 0.027022361755371094, 0.028195858001708984, 0.029369354248046875, 0.030542850494384766, 0.031716346740722656, 0.03288984298706055, 0.03406333923339844, 0.03523683547973633, 0.03641033172607422, 0.03758382797241211, 0.03875732421875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 0.0, 5.0, 7.0, 5.0, 6.0, 14.0, 7.0, 14.0, 22.0, 781.0, 36.0, 11.0, 12.0, 14.0, 10.0, 5.0, 5.0, 6.0, 5.0, 1.0, 4.0, 1.0, 3.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0189361572265625, -0.0183258056640625, -0.0177154541015625, -0.0171051025390625, -0.0164947509765625, -0.0158843994140625, -0.0152740478515625, -0.0146636962890625, -0.0140533447265625, -0.0134429931640625, -0.0128326416015625, -0.0122222900390625, -0.0116119384765625, -0.0110015869140625, -0.0103912353515625, -0.0097808837890625, -0.0091705322265625, -0.0085601806640625, -0.0079498291015625, -0.0073394775390625, -0.0067291259765625, -0.0061187744140625, -0.0055084228515625, -0.0048980712890625, -0.0042877197265625, -0.0036773681640625, -0.0030670166015625, -0.0024566650390625, -0.0018463134765625, -0.0012359619140625, -0.0006256103515625, -1.52587890625e-05, 0.0005950927734375, 0.0012054443359375, 0.0018157958984375, 0.0024261474609375, 0.0030364990234375, 0.0036468505859375, 0.0042572021484375, 0.0048675537109375, 0.0054779052734375, 0.0060882568359375, 0.0066986083984375, 0.0073089599609375, 0.0079193115234375, 0.0085296630859375, 0.0091400146484375, 0.0097503662109375, 0.0103607177734375, 0.0109710693359375, 0.0115814208984375, 0.0121917724609375, 0.0128021240234375, 0.0134124755859375, 0.0140228271484375, 0.0146331787109375, 0.0152435302734375, 0.0158538818359375, 0.0164642333984375, 0.0170745849609375, 0.0176849365234375, 0.0182952880859375, 0.0189056396484375, 0.0195159912109375, 0.0201263427734375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 4.0, 8.0, 15.0, 10.0, 14.0, 17.0, 24.0, 37.0, 49.0, 96.0, 243.0, 992.0, 6034.0, 569871.0, 3608951.0, 5860.0, 1334.0, 324.0, 141.0, 72.0, 52.0, 29.0, 14.0, 12.0, 11.0, 11.0, 8.0, 6.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.10882568359375, -0.10552978515625, -0.10223388671875, -0.09893798828125, -0.09564208984375, -0.09234619140625, -0.08905029296875, -0.08575439453125, -0.08245849609375, -0.07916259765625, -0.07586669921875, -0.07257080078125, -0.06927490234375, -0.06597900390625, -0.06268310546875, -0.05938720703125, -0.05609130859375, -0.05279541015625, -0.04949951171875, -0.04620361328125, -0.04290771484375, -0.03961181640625, -0.03631591796875, -0.03302001953125, -0.02972412109375, -0.02642822265625, -0.02313232421875, -0.01983642578125, -0.01654052734375, -0.01324462890625, -0.00994873046875, -0.00665283203125, -0.00335693359375, -6.103515625e-05, 0.00323486328125, 0.00653076171875, 0.00982666015625, 0.01312255859375, 0.01641845703125, 0.01971435546875, 0.02301025390625, 0.02630615234375, 0.02960205078125, 0.03289794921875, 0.03619384765625, 0.03948974609375, 0.04278564453125, 0.04608154296875, 0.04937744140625, 0.05267333984375, 0.05596923828125, 0.05926513671875, 0.06256103515625, 0.06585693359375, 0.06915283203125, 0.07244873046875, 0.07574462890625, 0.07904052734375, 0.08233642578125, 0.08563232421875, 0.08892822265625, 0.09222412109375, 0.09552001953125, 0.09881591796875, 0.10211181640625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 5.0, 5.0, 4.0, 7.0, 8.0, 5.0, 13.0, 7.0, 49.0, 208.0, 1669.0, 1761.0, 190.0, 53.0, 19.0, 9.0, 4.0, 6.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.036468505859375, -0.03529214859008789, -0.03411579132080078, -0.03293943405151367, -0.03176307678222656, -0.030586719512939453, -0.029410362243652344, -0.028234004974365234, -0.027057647705078125, -0.025881290435791016, -0.024704933166503906, -0.023528575897216797, -0.022352218627929688, -0.021175861358642578, -0.01999950408935547, -0.01882314682006836, -0.01764678955078125, -0.01647043228149414, -0.015294075012207031, -0.014117717742919922, -0.012941360473632812, -0.011765003204345703, -0.010588645935058594, -0.009412288665771484, -0.008235931396484375, -0.007059574127197266, -0.005883216857910156, -0.004706859588623047, -0.0035305023193359375, -0.002354145050048828, -0.0011777877807617188, -1.430511474609375e-06, 0.0011749267578125, 0.0023512840270996094, 0.0035276412963867188, 0.004703998565673828, 0.0058803558349609375, 0.007056713104248047, 0.008233070373535156, 0.009409427642822266, 0.010585784912109375, 0.011762142181396484, 0.012938499450683594, 0.014114856719970703, 0.015291213989257812, 0.016467571258544922, 0.01764392852783203, 0.01882028579711914, 0.01999664306640625, 0.02117300033569336, 0.02234935760498047, 0.023525714874267578, 0.024702072143554688, 0.025878429412841797, 0.027054786682128906, 0.028231143951416016, 0.029407501220703125, 0.030583858489990234, 0.031760215759277344, 0.03293657302856445, 0.03411293029785156, 0.03528928756713867, 0.03646564483642578, 0.03764200210571289, 0.038818359375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1016.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2939869165420532, -0.2597557604312897, -0.22552458941936493, -0.19129341840744019, -0.15706226229667664, -0.12283110618591309, -0.08859993517398834, -0.0543687641620636, -0.02013760805130005, 0.014093555510044098, 0.048324719071388245, 0.08255588263273239, 0.11678704619407654, 0.1510182023048401, 0.18524937331676483, 0.21948054432868958, 0.2537117004394531, 0.2879428565502167, 0.3221740126609802, 0.35640519857406616, 0.3906363546848297, 0.42486751079559326, 0.4590986967086792, 0.49332985281944275, 0.5275610089302063, 0.5617921948432922, 0.5960233211517334, 0.6302545070648193, 0.6644856929779053, 0.6987168192863464, 0.7329480051994324, 0.7671791315078735, 0.8014103174209595, 0.8356415033340454, 0.8698726296424866, 0.9041038155555725, 0.9383349418640137, 0.9725661277770996, 1.0067973136901855, 1.0410284996032715, 1.0752596855163574, 1.1094908714294434, 1.1437220573425293, 1.1779531240463257, 1.2121843099594116, 1.2464154958724976, 1.2806466817855835, 1.3148778676986694, 1.3491089344024658, 1.3833401203155518, 1.4175713062286377, 1.451802372932434, 1.48603355884552, 1.520264744758606, 1.554495930671692, 1.5887271165847778, 1.6229581832885742, 1.6571893692016602, 1.691420555114746, 1.7256516218185425, 1.7598828077316284, 1.7941139936447144, 1.8283451795578003, 1.8625763654708862, 1.8968075513839722]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 4.0, 4.0, 5.0, 7.0, 8.0, 11.0, 17.0, 22.0, 24.0, 42.0, 50.0, 68.0, 76.0, 94.0, 112.0, 90.0, 82.0, 63.0, 40.0, 39.0, 29.0, 20.0, 10.0, 10.0, 8.0, 6.0, 3.0, 5.0, 9.0, 9.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.11265707015991211, -0.10868007689714432, -0.10470308363437653, -0.10072609037160873, -0.09674909710884094, -0.09277210384607315, -0.08879511058330536, -0.08481811732053757, -0.08084112405776978, -0.07686413079500198, -0.07288713753223419, -0.0689101442694664, -0.06493315100669861, -0.06095615774393082, -0.056979164481163025, -0.05300217121839523, -0.04902517795562744, -0.04504818469285965, -0.04107119143009186, -0.037094198167324066, -0.033117204904556274, -0.029140211641788483, -0.02516321837902069, -0.0211862251162529, -0.017209231853485107, -0.013232238590717316, -0.009255245327949524, -0.005278252065181732, -0.0013012588024139404, 0.0026757344603538513, 0.006652727723121643, 0.010629720985889435, 0.014606714248657227, 0.01858370751142502, 0.02256070077419281, 0.026537694036960602, 0.030514687299728394, 0.034491680562496185, 0.03846867382526398, 0.04244566708803177, 0.04642266035079956, 0.05039965361356735, 0.054376646876335144, 0.058353640139102936, 0.06233063340187073, 0.06630762666463852, 0.07028461992740631, 0.0742616131901741, 0.0782386064529419, 0.08221559971570969, 0.08619259297847748, 0.09016958624124527, 0.09414657950401306, 0.09812357276678085, 0.10210056602954865, 0.10607755929231644, 0.11005455255508423, 0.11403154581785202, 0.11800853908061981, 0.1219855323433876, 0.1259625256061554, 0.12993952631950378, 0.13391651213169098, 0.13789349794387817, 0.14187049865722656]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 0.0, 1.0, 6.0, 6.0, 14.0, 20.0, 28.0, 37.0, 62.0, 76.0, 109.0, 147.0, 213.0, 279.0, 374.0, 493.0, 743.0, 1064.0, 1574.0, 2263.0, 3521.0, 5967.0, 10781.0, 25431.0, 903992.0, 53916.0, 16257.0, 7750.0, 4448.0, 2725.0, 1816.0, 1286.0, 883.0, 613.0, 457.0, 333.0, 237.0, 176.0, 133.0, 101.0, 79.0, 47.0, 28.0, 21.0, 18.0, 10.0, 6.0, 10.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0206298828125, -0.019959211349487305, -0.01928853988647461, -0.018617868423461914, -0.01794719696044922, -0.017276525497436523, -0.016605854034423828, -0.015935182571411133, -0.015264511108398438, -0.014593839645385742, -0.013923168182373047, -0.013252496719360352, -0.012581825256347656, -0.011911153793334961, -0.011240482330322266, -0.01056981086730957, -0.009899139404296875, -0.00922846794128418, -0.008557796478271484, -0.007887125015258789, -0.007216453552246094, -0.0065457820892333984, -0.005875110626220703, -0.005204439163208008, -0.0045337677001953125, -0.003863096237182617, -0.003192424774169922, -0.0025217533111572266, -0.0018510818481445312, -0.001180410385131836, -0.0005097389221191406, 0.0001609325408935547, 0.00083160400390625, 0.0015022754669189453, 0.0021729469299316406, 0.002843618392944336, 0.0035142898559570312, 0.0041849613189697266, 0.004855632781982422, 0.005526304244995117, 0.0061969757080078125, 0.006867647171020508, 0.007538318634033203, 0.008208990097045898, 0.008879661560058594, 0.009550333023071289, 0.010221004486083984, 0.01089167594909668, 0.011562347412109375, 0.01223301887512207, 0.012903690338134766, 0.013574361801147461, 0.014245033264160156, 0.014915704727172852, 0.015586376190185547, 0.016257047653198242, 0.016927719116210938, 0.017598390579223633, 0.018269062042236328, 0.018939733505249023, 0.01961040496826172, 0.020281076431274414, 0.02095174789428711, 0.021622419357299805, 0.0222930908203125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 6.0, 3.0, 6.0, 12.0, 8.0, 9.0, 17.0, 27.0, 777.0, 34.0, 10.0, 14.0, 9.0, 12.0, 2.0, 8.0, 5.0, 4.0, 2.0, 5.0, 1.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0182342529296875, -0.017642498016357422, -0.017050743103027344, -0.016458988189697266, -0.015867233276367188, -0.01527547836303711, -0.014683723449707031, -0.014091968536376953, -0.013500213623046875, -0.012908458709716797, -0.012316703796386719, -0.01172494888305664, -0.011133193969726562, -0.010541439056396484, -0.009949684143066406, -0.009357929229736328, -0.00876617431640625, -0.008174419403076172, -0.007582664489746094, -0.006990909576416016, -0.0063991546630859375, -0.005807399749755859, -0.005215644836425781, -0.004623889923095703, -0.004032135009765625, -0.003440380096435547, -0.0028486251831054688, -0.0022568702697753906, -0.0016651153564453125, -0.0010733604431152344, -0.00048160552978515625, 0.00011014938354492188, 0.000701904296875, 0.0012936592102050781, 0.0018854141235351562, 0.0024771690368652344, 0.0030689239501953125, 0.0036606788635253906, 0.004252433776855469, 0.004844188690185547, 0.005435943603515625, 0.006027698516845703, 0.006619453430175781, 0.007211208343505859, 0.0078029632568359375, 0.008394718170166016, 0.008986473083496094, 0.009578227996826172, 0.01016998291015625, 0.010761737823486328, 0.011353492736816406, 0.011945247650146484, 0.012537002563476562, 0.01312875747680664, 0.013720512390136719, 0.014312267303466797, 0.014904022216796875, 0.015495777130126953, 0.01608753204345703, 0.01667928695678711, 0.017271041870117188, 0.017862796783447266, 0.018454551696777344, 0.019046306610107422, 0.0196380615234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 9.0, 11.0, 6.0, 16.0, 19.0, 8.0, 21.0, 25.0, 29.0, 49.0, 38.0, 69.0, 77.0, 118.0, 133.0, 197.0, 348.0, 860.0, 3310.0, 31131.0, 879679.0, 122150.0, 7400.0, 1420.0, 491.0, 254.0, 141.0, 97.0, 83.0, 63.0, 59.0, 44.0, 36.0, 31.0, 21.0, 25.0, 24.0, 9.0, 8.0, 11.0, 6.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.07452392578125, -0.07224559783935547, -0.06996726989746094, -0.0676889419555664, -0.06541061401367188, -0.06313228607177734, -0.06085395812988281, -0.05857563018798828, -0.05629730224609375, -0.05401897430419922, -0.05174064636230469, -0.049462318420410156, -0.047183990478515625, -0.044905662536621094, -0.04262733459472656, -0.04034900665283203, -0.0380706787109375, -0.03579235076904297, -0.03351402282714844, -0.031235694885253906, -0.028957366943359375, -0.026679039001464844, -0.024400711059570312, -0.02212238311767578, -0.01984405517578125, -0.01756572723388672, -0.015287399291992188, -0.013009071350097656, -0.010730743408203125, -0.008452415466308594, -0.0061740875244140625, -0.0038957595825195312, -0.001617431640625, 0.0006608963012695312, 0.0029392242431640625, 0.005217552185058594, 0.007495880126953125, 0.009774208068847656, 0.012052536010742188, 0.014330863952636719, 0.01660919189453125, 0.01888751983642578, 0.021165847778320312, 0.023444175720214844, 0.025722503662109375, 0.028000831604003906, 0.030279159545898438, 0.03255748748779297, 0.0348358154296875, 0.03711414337158203, 0.03939247131347656, 0.041670799255371094, 0.043949127197265625, 0.046227455139160156, 0.04850578308105469, 0.05078411102294922, 0.05306243896484375, 0.05534076690673828, 0.05761909484863281, 0.059897422790527344, 0.062175750732421875, 0.0644540786743164, 0.06673240661621094, 0.06901073455810547, 0.0712890625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 9.0, 11.0, 6.0, 15.0, 13.0, 6.0, 15.0, 17.0, 15.0, 29.0, 18.0, 25.0, 28.0, 40.0, 31.0, 34.0, 39.0, 36.0, 39.0, 41.0, 45.0, 33.0, 44.0, 34.0, 31.0, 37.0, 33.0, 24.0, 27.0, 20.0, 29.0, 25.0, 16.0, 26.0, 13.0, 18.0, 23.0, 7.0, 6.0, 10.0, 6.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.06732177734375, -0.0652627944946289, -0.06320381164550781, -0.06114482879638672, -0.059085845947265625, -0.05702686309814453, -0.05496788024902344, -0.052908897399902344, -0.05084991455078125, -0.048790931701660156, -0.04673194885253906, -0.04467296600341797, -0.042613983154296875, -0.04055500030517578, -0.03849601745605469, -0.036437034606933594, -0.0343780517578125, -0.032319068908691406, -0.030260086059570312, -0.02820110321044922, -0.026142120361328125, -0.02408313751220703, -0.022024154663085938, -0.019965171813964844, -0.01790618896484375, -0.015847206115722656, -0.013788223266601562, -0.011729240417480469, -0.009670257568359375, -0.007611274719238281, -0.0055522918701171875, -0.0034933090209960938, -0.001434326171875, 0.0006246566772460938, 0.0026836395263671875, 0.004742622375488281, 0.006801605224609375, 0.008860588073730469, 0.010919570922851562, 0.012978553771972656, 0.01503753662109375, 0.017096519470214844, 0.019155502319335938, 0.02121448516845703, 0.023273468017578125, 0.02533245086669922, 0.027391433715820312, 0.029450416564941406, 0.0315093994140625, 0.033568382263183594, 0.03562736511230469, 0.03768634796142578, 0.039745330810546875, 0.04180431365966797, 0.04386329650878906, 0.045922279357910156, 0.04798126220703125, 0.050040245056152344, 0.05209922790527344, 0.05415821075439453, 0.056217193603515625, 0.05827617645263672, 0.06033515930175781, 0.062394142150878906, 0.064453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 8.0, 6.0, 11.0, 9.0, 13.0, 26.0, 28.0, 29.0, 50.0, 69.0, 85.0, 158.0, 237.0, 447.0, 784.0, 1823.0, 6740.0, 45448.0, 937093.0, 45165.0, 6293.0, 2084.0, 795.0, 461.0, 181.0, 140.0, 117.0, 71.0, 45.0, 34.0, 17.0, 16.0, 19.0, 8.0, 6.0, 14.0, 6.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-2.6226043701171875e-05, -2.54875048995018e-05, -2.4748966097831726e-05, -2.401042729616165e-05, -2.3271888494491577e-05, -2.2533349692821503e-05, -2.1794810891151428e-05, -2.1056272089481354e-05, -2.031773328781128e-05, -1.9579194486141205e-05, -1.884065568447113e-05, -1.8102116882801056e-05, -1.736357808113098e-05, -1.6625039279460907e-05, -1.5886500477790833e-05, -1.5147961676120758e-05, -1.4409422874450684e-05, -1.3670884072780609e-05, -1.2932345271110535e-05, -1.219380646944046e-05, -1.1455267667770386e-05, -1.0716728866100311e-05, -9.978190064430237e-06, -9.239651262760162e-06, -8.501112461090088e-06, -7.762573659420013e-06, -7.024034857749939e-06, -6.2854960560798645e-06, -5.54695725440979e-06, -4.8084184527397156e-06, -4.069879651069641e-06, -3.3313408493995667e-06, -2.592802047729492e-06, -1.8542632460594177e-06, -1.1157244443893433e-06, -3.771856427192688e-07, 3.6135315895080566e-07, 1.0998919606208801e-06, 1.8384307622909546e-06, 2.576969563961029e-06, 3.3155083656311035e-06, 4.054047167301178e-06, 4.7925859689712524e-06, 5.531124770641327e-06, 6.269663572311401e-06, 7.008202373981476e-06, 7.74674117565155e-06, 8.485279977321625e-06, 9.2238187789917e-06, 9.962357580661774e-06, 1.0700896382331848e-05, 1.1439435184001923e-05, 1.2177973985671997e-05, 1.2916512787342072e-05, 1.3655051589012146e-05, 1.439359039068222e-05, 1.5132129192352295e-05, 1.587066799402237e-05, 1.6609206795692444e-05, 1.734774559736252e-05, 1.8086284399032593e-05, 1.8824823200702667e-05, 1.9563362002372742e-05, 2.0301900804042816e-05, 2.104043960571289e-05]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 5.0, 1.0, 11.0, 9.0, 20.0, 13.0, 20.0, 35.0, 15.0, 32.0, 28.0, 41.0, 55.0, 51.0, 48.0, 53.0, 55.0, 61.0, 34.0, 45.0, 71.0, 60.0, 40.0, 34.0, 27.0, 32.0, 25.0, 14.0, 18.0, 2.0, 13.0, 11.0, 8.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.3974647521972656e-06, -3.2838433980941772e-06, -3.170222043991089e-06, -3.0566006898880005e-06, -2.942979335784912e-06, -2.8293579816818237e-06, -2.7157366275787354e-06, -2.602115273475647e-06, -2.4884939193725586e-06, -2.3748725652694702e-06, -2.261251211166382e-06, -2.1476298570632935e-06, -2.034008502960205e-06, -1.9203871488571167e-06, -1.8067657947540283e-06, -1.69314444065094e-06, -1.5795230865478516e-06, -1.4659017324447632e-06, -1.3522803783416748e-06, -1.2386590242385864e-06, -1.125037670135498e-06, -1.0114163160324097e-06, -8.977949619293213e-07, -7.841736078262329e-07, -6.705522537231445e-07, -5.569308996200562e-07, -4.4330954551696777e-07, -3.296881914138794e-07, -2.1606683731079102e-07, -1.0244548320770264e-07, 1.1175870895385742e-08, 1.2479722499847412e-07, 2.384185791015625e-07, 3.520399332046509e-07, 4.6566128730773926e-07, 5.792826414108276e-07, 6.92903995513916e-07, 8.065253496170044e-07, 9.201467037200928e-07, 1.0337680578231812e-06, 1.1473894119262695e-06, 1.261010766029358e-06, 1.3746321201324463e-06, 1.4882534742355347e-06, 1.601874828338623e-06, 1.7154961824417114e-06, 1.8291175365447998e-06, 1.942738890647888e-06, 2.0563602447509766e-06, 2.169981598854065e-06, 2.2836029529571533e-06, 2.3972243070602417e-06, 2.51084566116333e-06, 2.6244670152664185e-06, 2.738088369369507e-06, 2.8517097234725952e-06, 2.9653310775756836e-06, 3.078952431678772e-06, 3.1925737857818604e-06, 3.3061951398849487e-06, 3.419816493988037e-06, 3.5334378480911255e-06, 3.647059202194214e-06, 3.7606805562973022e-06, 3.874301910400391e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 3.0, 2.0, 5.0, 4.0, 9.0, 12.0, 18.0, 24.0, 21.0, 28.0, 49.0, 57.0, 89.0, 91.0, 164.0, 335.0, 1073.0, 6464.0, 329889.0, 700357.0, 7728.0, 1115.0, 380.0, 184.0, 137.0, 76.0, 59.0, 44.0, 26.0, 20.0, 19.0, 18.0, 13.0, 11.0, 10.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.7179718017578125e-05, -2.640392631292343e-05, -2.5628134608268738e-05, -2.4852342903614044e-05, -2.407655119895935e-05, -2.3300759494304657e-05, -2.2524967789649963e-05, -2.174917608499527e-05, -2.0973384380340576e-05, -2.0197592675685883e-05, -1.942180097103119e-05, -1.8646009266376495e-05, -1.7870217561721802e-05, -1.7094425857067108e-05, -1.6318634152412415e-05, -1.554284244775772e-05, -1.4767050743103027e-05, -1.3991259038448334e-05, -1.321546733379364e-05, -1.2439675629138947e-05, -1.1663883924484253e-05, -1.088809221982956e-05, -1.0112300515174866e-05, -9.336508810520172e-06, -8.560717105865479e-06, -7.784925401210785e-06, -7.009133696556091e-06, -6.233341991901398e-06, -5.457550287246704e-06, -4.6817585825920105e-06, -3.905966877937317e-06, -3.1301751732826233e-06, -2.3543834686279297e-06, -1.578591763973236e-06, -8.028000593185425e-07, -2.7008354663848877e-08, 7.487833499908447e-07, 1.5245750546455383e-06, 2.300366759300232e-06, 3.0761584639549255e-06, 3.851950168609619e-06, 4.627741873264313e-06, 5.403533577919006e-06, 6.1793252825737e-06, 6.9551169872283936e-06, 7.730908691883087e-06, 8.50670039653778e-06, 9.282492101192474e-06, 1.0058283805847168e-05, 1.0834075510501862e-05, 1.1609867215156555e-05, 1.2385658919811249e-05, 1.3161450624465942e-05, 1.3937242329120636e-05, 1.471303403377533e-05, 1.5488825738430023e-05, 1.6264617443084717e-05, 1.704040914773941e-05, 1.7816200852394104e-05, 1.8591992557048798e-05, 1.936778426170349e-05, 2.0143575966358185e-05, 2.091936767101288e-05, 2.1695159375667572e-05, 2.2470951080322266e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 3.0, 2.0, 3.0, 4.0, 7.0, 9.0, 13.0, 19.0, 13.0, 15.0, 25.0, 30.0, 37.0, 20.0, 35.0, 37.0, 69.0, 69.0, 63.0, 71.0, 62.0, 69.0, 49.0, 57.0, 45.0, 27.0, 27.0, 24.0, 14.0, 15.0, 10.0, 12.0, 11.0, 10.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.4557113647460938e-05, -2.3855827748775482e-05, -2.3154541850090027e-05, -2.245325595140457e-05, -2.1751970052719116e-05, -2.105068415403366e-05, -2.0349398255348206e-05, -1.964811235666275e-05, -1.8946826457977295e-05, -1.824554055929184e-05, -1.7544254660606384e-05, -1.684296876192093e-05, -1.6141682863235474e-05, -1.544039696455002e-05, -1.4739111065864563e-05, -1.4037825167179108e-05, -1.3336539268493652e-05, -1.2635253369808197e-05, -1.1933967471122742e-05, -1.1232681572437286e-05, -1.0531395673751831e-05, -9.830109775066376e-06, -9.12882387638092e-06, -8.427537977695465e-06, -7.72625207901001e-06, -7.0249661803245544e-06, -6.323680281639099e-06, -5.622394382953644e-06, -4.9211084842681885e-06, -4.219822585582733e-06, -3.518536686897278e-06, -2.8172507882118225e-06, -2.115964889526367e-06, -1.4146789908409119e-06, -7.133930921554565e-07, -1.210719347000122e-08, 6.891787052154541e-07, 1.3904646039009094e-06, 2.0917505025863647e-06, 2.79303640127182e-06, 3.4943222999572754e-06, 4.195608198642731e-06, 4.896894097328186e-06, 5.598179996013641e-06, 6.299465894699097e-06, 7.000751793384552e-06, 7.702037692070007e-06, 8.403323590755463e-06, 9.104609489440918e-06, 9.805895388126373e-06, 1.0507181286811829e-05, 1.1208467185497284e-05, 1.190975308418274e-05, 1.2611038982868195e-05, 1.331232488155365e-05, 1.4013610780239105e-05, 1.471489667892456e-05, 1.5416182577610016e-05, 1.611746847629547e-05, 1.6818754374980927e-05, 1.7520040273666382e-05, 1.8221326172351837e-05, 1.8922612071037292e-05, 1.9623897969722748e-05, 2.0325183868408203e-05]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 875.0, 136.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.669297218322754, -4.587241172790527, -4.505185127258301, -4.423129081726074, -4.341073036193848, -4.259017467498779, -4.176961421966553, -4.094905376434326, -4.0128493309021, -3.930793285369873, -3.8487372398376465, -3.766681432723999, -3.6846253871917725, -3.602569341659546, -3.5205135345458984, -3.438457489013672, -3.3564014434814453, -3.2743453979492188, -3.192289352416992, -3.1102335453033447, -3.028177499771118, -2.9461214542388916, -2.864065647125244, -2.7820096015930176, -2.699953556060791, -2.6178975105285645, -2.535841464996338, -2.4537856578826904, -2.371729612350464, -2.2896735668182373, -2.20761775970459, -2.1255617141723633, -2.0435056686401367, -1.9614496231079102, -1.8793936967849731, -1.7973377704620361, -1.7152817249298096, -1.633225679397583, -1.551169753074646, -1.469113826751709, -1.3870577812194824, -1.3050017356872559, -1.2229458093643188, -1.1408898830413818, -1.0588338375091553, -0.9767778515815735, -0.8947218656539917, -0.8126658797264099, -0.7306098341941833, -0.6485538482666016, -0.5664978623390198, -0.484441876411438, -0.4023858904838562, -0.3203299045562744, -0.23827391862869263, -0.15621793270111084, -0.07416194677352905, 0.007894039154052734, 0.08995002508163452, 0.1720060110092163, 0.2540619969367981, 0.3361179828643799, 0.41817396879196167, 0.5002299547195435, 0.5822859406471252]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 6.0, 6.0, 5.0, 11.0, 14.0, 16.0, 18.0, 26.0, 49.0, 112.0, 144.0, 178.0, 141.0, 104.0, 59.0, 35.0, 16.0, 11.0, 8.0, 7.0, 7.0, 3.0, 4.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.386279821395874, -1.339289665222168, -1.2922996282577515, -1.2453094720840454, -1.198319435119629, -1.1513292789459229, -1.1043391227722168, -1.0573489665985107, -1.0103589296340942, -0.963368833065033, -0.9163787364959717, -0.8693885803222656, -0.8223984837532043, -0.7754083871841431, -0.728418231010437, -0.6814281344413757, -0.6344380378723145, -0.5874479413032532, -0.5404578447341919, -0.49346768856048584, -0.44647759199142456, -0.3994874954223633, -0.3524973690509796, -0.30550724267959595, -0.25851714611053467, -0.2115270346403122, -0.16453692317008972, -0.11754681169986725, -0.07055670022964478, -0.023566588759422302, 0.02342352271080017, 0.07041364908218384, 0.11740386486053467, 0.16439397633075714, 0.21138408780097961, 0.2583742141723633, 0.30536431074142456, 0.35235440731048584, 0.3993445336818695, 0.4463346600532532, 0.49332475662231445, 0.5403148531913757, 0.587304949760437, 0.6342951059341431, 0.6812852025032043, 0.7282752990722656, 0.7752654552459717, 0.822255551815033, 0.8692456483840942, 0.9162357449531555, 0.9632258415222168, 1.0102159976959229, 1.057206153869629, 1.1041961908340454, 1.1511863470077515, 1.198176383972168, 1.245166540145874, 1.29215669631958, 1.3391467332839966, 1.3861368894577026, 1.4331269264221191, 1.4801170825958252, 1.5271072387695312, 1.5740973949432373, 1.6210874319076538]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 2.0, 2.0, 10.0, 9.0, 7.0, 23.0, 33.0, 52.0, 105.0, 198.0, 500.0, 1144.0, 3897.0, 52441.0, 4125752.0, 6156.0, 2087.0, 877.0, 449.0, 213.0, 123.0, 63.0, 36.0, 17.0, 24.0, 10.0, 8.0, 8.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1973876953125, -0.19035911560058594, -0.18333053588867188, -0.1763019561767578, -0.16927337646484375, -0.1622447967529297, -0.15521621704101562, -0.14818763732910156, -0.1411590576171875, -0.13413047790527344, -0.12710189819335938, -0.12007331848144531, -0.11304473876953125, -0.10601615905761719, -0.09898757934570312, -0.09195899963378906, -0.084930419921875, -0.07790184020996094, -0.07087326049804688, -0.06384468078613281, -0.05681610107421875, -0.04978752136230469, -0.042758941650390625, -0.03573036193847656, -0.0287017822265625, -0.021673202514648438, -0.014644622802734375, -0.0076160430908203125, -0.00058746337890625, 0.0064411163330078125, 0.013469696044921875, 0.020498275756835938, 0.02752685546875, 0.03455543518066406, 0.041584014892578125, 0.04861259460449219, 0.05564117431640625, 0.06266975402832031, 0.06969833374023438, 0.07672691345214844, 0.0837554931640625, 0.09078407287597656, 0.09781265258789062, 0.10484123229980469, 0.11186981201171875, 0.11889839172363281, 0.12592697143554688, 0.13295555114746094, 0.139984130859375, 0.14701271057128906, 0.15404129028320312, 0.1610698699951172, 0.16809844970703125, 0.1751270294189453, 0.18215560913085938, 0.18918418884277344, 0.1962127685546875, 0.20324134826660156, 0.21026992797851562, 0.2172985076904297, 0.22432708740234375, 0.2313556671142578, 0.23838424682617188, 0.24541282653808594, 0.25244140625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 10.0, 9.0, 4.0, 8.0, 4.0, 13.0, 15.0, 24.0, 613.0, 175.0, 17.0, 13.0, 10.0, 7.0, 8.0, 8.0, 6.0, 6.0, 4.0, 7.0, 4.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01276397705078125, -0.012310385704040527, -0.011856794357299805, -0.011403203010559082, -0.01094961166381836, -0.010496020317077637, -0.010042428970336914, -0.009588837623596191, -0.009135246276855469, -0.008681654930114746, -0.008228063583374023, -0.007774472236633301, -0.007320880889892578, -0.0068672895431518555, -0.006413698196411133, -0.00596010684967041, -0.0055065155029296875, -0.005052924156188965, -0.004599332809448242, -0.0041457414627075195, -0.003692150115966797, -0.0032385587692260742, -0.0027849674224853516, -0.002331376075744629, -0.0018777847290039062, -0.0014241933822631836, -0.0009706020355224609, -0.0005170106887817383, -6.341934204101562e-05, 0.00039017200469970703, 0.0008437633514404297, 0.0012973546981811523, 0.001750946044921875, 0.0022045373916625977, 0.0026581287384033203, 0.003111720085144043, 0.0035653114318847656, 0.004018902778625488, 0.004472494125366211, 0.004926085472106934, 0.005379676818847656, 0.005833268165588379, 0.0062868595123291016, 0.006740450859069824, 0.007194042205810547, 0.0076476335525512695, 0.008101224899291992, 0.008554816246032715, 0.009008407592773438, 0.00946199893951416, 0.009915590286254883, 0.010369181632995605, 0.010822772979736328, 0.01127636432647705, 0.011729955673217773, 0.012183547019958496, 0.012637138366699219, 0.013090729713439941, 0.013544321060180664, 0.013997912406921387, 0.01445150375366211, 0.014905095100402832, 0.015358686447143555, 0.015812277793884277, 0.016265869140625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 4.0, 3.0, 6.0, 9.0, 6.0, 12.0, 17.0, 19.0, 12.0, 28.0, 31.0, 49.0, 62.0, 113.0, 174.0, 394.0, 1131.0, 5581.0, 58051.0, 4104599.0, 19744.0, 2783.0, 719.0, 272.0, 135.0, 64.0, 58.0, 40.0, 28.0, 19.0, 24.0, 10.0, 15.0, 10.0, 8.0, 12.0, 5.0, 9.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.1766357421875, -0.17148590087890625, -0.1663360595703125, -0.16118621826171875, -0.156036376953125, -0.15088653564453125, -0.1457366943359375, -0.14058685302734375, -0.13543701171875, -0.13028717041015625, -0.1251373291015625, -0.11998748779296875, -0.114837646484375, -0.10968780517578125, -0.1045379638671875, -0.09938812255859375, -0.09423828125, -0.08908843994140625, -0.0839385986328125, -0.07878875732421875, -0.073638916015625, -0.06848907470703125, -0.0633392333984375, -0.05818939208984375, -0.05303955078125, -0.04788970947265625, -0.0427398681640625, -0.03759002685546875, -0.032440185546875, -0.02729034423828125, -0.0221405029296875, -0.01699066162109375, -0.0118408203125, -0.00669097900390625, -0.0015411376953125, 0.00360870361328125, 0.008758544921875, 0.01390838623046875, 0.0190582275390625, 0.02420806884765625, 0.02935791015625, 0.03450775146484375, 0.0396575927734375, 0.04480743408203125, 0.049957275390625, 0.05510711669921875, 0.0602569580078125, 0.06540679931640625, 0.070556640625, 0.07570648193359375, 0.0808563232421875, 0.08600616455078125, 0.091156005859375, 0.09630584716796875, 0.1014556884765625, 0.10660552978515625, 0.11175537109375, 0.11690521240234375, 0.1220550537109375, 0.12720489501953125, 0.132354736328125, 0.13750457763671875, 0.1426544189453125, 0.14780426025390625, 0.1529541015625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 9.0, 5.0, 8.0, 12.0, 19.0, 6.0, 19.0, 13.0, 21.0, 22.0, 36.0, 59.0, 3597.0, 30.0, 24.0, 22.0, 17.0, 14.0, 11.0, 13.0, 11.0, 15.0, 4.0, 14.0, 7.0, 7.0, 6.0, 5.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.025299072265625, -0.024561405181884766, -0.02382373809814453, -0.023086071014404297, -0.022348403930664062, -0.021610736846923828, -0.020873069763183594, -0.02013540267944336, -0.019397735595703125, -0.01866006851196289, -0.017922401428222656, -0.017184734344482422, -0.016447067260742188, -0.015709400177001953, -0.014971733093261719, -0.014234066009521484, -0.01349639892578125, -0.012758731842041016, -0.012021064758300781, -0.011283397674560547, -0.010545730590820312, -0.009808063507080078, -0.009070396423339844, -0.00833272933959961, -0.007595062255859375, -0.006857395172119141, -0.006119728088378906, -0.005382061004638672, -0.0046443939208984375, -0.003906726837158203, -0.0031690597534179688, -0.0024313926696777344, -0.0016937255859375, -0.0009560585021972656, -0.00021839141845703125, 0.0005192756652832031, 0.0012569427490234375, 0.001994609832763672, 0.0027322769165039062, 0.0034699440002441406, 0.004207611083984375, 0.004945278167724609, 0.005682945251464844, 0.006420612335205078, 0.0071582794189453125, 0.007895946502685547, 0.008633613586425781, 0.009371280670166016, 0.01010894775390625, 0.010846614837646484, 0.011584281921386719, 0.012321949005126953, 0.013059616088867188, 0.013797283172607422, 0.014534950256347656, 0.01527261734008789, 0.016010284423828125, 0.01674795150756836, 0.017485618591308594, 0.018223285675048828, 0.018960952758789062, 0.019698619842529297, 0.02043628692626953, 0.021173954010009766, 0.02191162109375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1016.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.814591646194458, -1.782610297203064, -1.75062894821167, -1.7186474800109863, -1.6866661310195923, -1.6546847820281982, -1.6227034330368042, -1.5907220840454102, -1.5587407350540161, -1.526759386062622, -1.494778037071228, -1.462796688079834, -1.4308152198791504, -1.3988338708877563, -1.3668525218963623, -1.3348711729049683, -1.3028898239135742, -1.2709084749221802, -1.2389271259307861, -1.2069456577301025, -1.1749643087387085, -1.1429829597473145, -1.1110016107559204, -1.0790202617645264, -1.0470387935638428, -1.0150574445724487, -0.9830760359764099, -0.9510946869850159, -0.9191133379936218, -0.887131929397583, -0.855150580406189, -0.8231692314147949, -0.7911879420280457, -0.7592065930366516, -0.7272251844406128, -0.6952438354492188, -0.6632624864578247, -0.6312811374664307, -0.5992997288703918, -0.5673183798789978, -0.5353370308876038, -0.5033556818962097, -0.4713743031024933, -0.43939292430877686, -0.4074115753173828, -0.3754301965236664, -0.34344881772994995, -0.3114674687385559, -0.2794860601425171, -0.24750469624996185, -0.21552333235740662, -0.18354195356369019, -0.15156058967113495, -0.11957922577857971, -0.08759784698486328, -0.055616483092308044, -0.023635134100914, 0.008346233516931534, 0.04032760113477707, 0.0723089724779129, 0.10429033637046814, 0.13627170026302338, 0.1682530790567398, 0.20023444294929504, 0.23221580684185028]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 8.0, 10.0, 6.0, 18.0, 22.0, 42.0, 67.0, 109.0, 138.0, 171.0, 112.0, 95.0, 73.0, 32.0, 15.0, 12.0, 13.0, 10.0, 5.0, 10.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.13524079322814941, -0.13109557330608368, -0.12695035338401794, -0.1228051483631134, -0.11865992844104767, -0.11451470851898193, -0.1103694960474968, -0.10622428357601166, -0.10207906365394592, -0.09793384373188019, -0.09378863126039505, -0.08964341878890991, -0.08549819886684418, -0.08135297894477844, -0.0772077664732933, -0.07306255400180817, -0.06891733407974243, -0.0647721141576767, -0.06062690168619156, -0.05648168548941612, -0.052336469292640686, -0.04819125309586525, -0.04404603689908981, -0.03990082070231438, -0.03575560450553894, -0.031610388308763504, -0.027465172111988068, -0.02331995591521263, -0.019174739718437195, -0.015029523521661758, -0.010884307324886322, -0.006739091128110886, -0.0025938749313354492, 0.0015513412654399872, 0.005696557462215424, 0.00984177365899086, 0.013986989855766296, 0.018132206052541733, 0.02227742224931717, 0.026422638446092606, 0.030567854642868042, 0.03471307083964348, 0.038858287036418915, 0.04300350323319435, 0.04714871942996979, 0.051293935626745224, 0.05543915182352066, 0.0595843680202961, 0.06372958421707153, 0.06787480413913727, 0.0720200166106224, 0.07616522908210754, 0.08031044900417328, 0.08445566892623901, 0.08860088139772415, 0.09274609386920929, 0.09689131379127502, 0.10103653371334076, 0.1051817461848259, 0.10932695865631104, 0.11347217857837677, 0.1176173985004425, 0.12176261097192764, 0.12590782344341278, 0.13005304336547852]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 5.0, 5.0, 7.0, 10.0, 13.0, 21.0, 17.0, 29.0, 38.0, 38.0, 69.0, 91.0, 121.0, 152.0, 262.0, 322.0, 430.0, 607.0, 945.0, 1301.0, 2051.0, 2925.0, 4724.0, 7996.0, 13771.0, 29600.0, 866889.0, 70211.0, 18750.0, 10110.0, 5828.0, 3669.0, 2255.0, 1568.0, 1073.0, 747.0, 557.0, 372.0, 274.0, 214.0, 135.0, 101.0, 71.0, 58.0, 34.0, 22.0, 17.0, 17.0, 7.0, 10.0, 4.0, 6.0, 2.0, 5.0, 3.0, 1.0, 3.0], "bins": [-0.043182373046875, -0.04190206527709961, -0.04062175750732422, -0.03934144973754883, -0.03806114196777344, -0.03678083419799805, -0.035500526428222656, -0.034220218658447266, -0.032939910888671875, -0.031659603118896484, -0.030379295349121094, -0.029098987579345703, -0.027818679809570312, -0.026538372039794922, -0.02525806427001953, -0.02397775650024414, -0.02269744873046875, -0.02141714096069336, -0.02013683319091797, -0.018856525421142578, -0.017576217651367188, -0.016295909881591797, -0.015015602111816406, -0.013735294342041016, -0.012454986572265625, -0.011174678802490234, -0.009894371032714844, -0.008614063262939453, -0.0073337554931640625, -0.006053447723388672, -0.004773139953613281, -0.0034928321838378906, -0.0022125244140625, -0.0009322166442871094, 0.00034809112548828125, 0.0016283988952636719, 0.0029087066650390625, 0.004189014434814453, 0.005469322204589844, 0.006749629974365234, 0.008029937744140625, 0.009310245513916016, 0.010590553283691406, 0.011870861053466797, 0.013151168823242188, 0.014431476593017578, 0.01571178436279297, 0.01699209213256836, 0.01827239990234375, 0.01955270767211914, 0.02083301544189453, 0.022113323211669922, 0.023393630981445312, 0.024673938751220703, 0.025954246520996094, 0.027234554290771484, 0.028514862060546875, 0.029795169830322266, 0.031075477600097656, 0.03235578536987305, 0.03363609313964844, 0.03491640090942383, 0.03619670867919922, 0.03747701644897461, 0.03875732421875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 2.0, 2.0, 1.0, 3.0, 7.0, 5.0, 10.0, 4.0, 8.0, 9.0, 11.0, 15.0, 25.0, 482.0, 297.0, 24.0, 5.0, 12.0, 7.0, 9.0, 6.0, 8.0, 9.0, 5.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.01279449462890625, -0.01237177848815918, -0.01194906234741211, -0.011526346206665039, -0.011103630065917969, -0.010680913925170898, -0.010258197784423828, -0.009835481643676758, -0.009412765502929688, -0.008990049362182617, -0.008567333221435547, -0.008144617080688477, -0.007721900939941406, -0.007299184799194336, -0.006876468658447266, -0.006453752517700195, -0.006031036376953125, -0.005608320236206055, -0.005185604095458984, -0.004762887954711914, -0.004340171813964844, -0.0039174556732177734, -0.003494739532470703, -0.003072023391723633, -0.0026493072509765625, -0.002226591110229492, -0.0018038749694824219, -0.0013811588287353516, -0.0009584426879882812, -0.0005357265472412109, -0.00011301040649414062, 0.0003097057342529297, 0.000732421875, 0.0011551380157470703, 0.0015778541564941406, 0.002000570297241211, 0.0024232864379882812, 0.0028460025787353516, 0.003268718719482422, 0.003691434860229492, 0.0041141510009765625, 0.004536867141723633, 0.004959583282470703, 0.0053822994232177734, 0.005805015563964844, 0.006227731704711914, 0.006650447845458984, 0.007073163986206055, 0.007495880126953125, 0.007918596267700195, 0.008341312408447266, 0.008764028549194336, 0.009186744689941406, 0.009609460830688477, 0.010032176971435547, 0.010454893112182617, 0.010877609252929688, 0.011300325393676758, 0.011723041534423828, 0.012145757675170898, 0.012568473815917969, 0.012991189956665039, 0.01341390609741211, 0.01383662223815918, 0.01425933837890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 5.0, 6.0, 8.0, 6.0, 9.0, 16.0, 10.0, 19.0, 13.0, 24.0, 39.0, 49.0, 53.0, 50.0, 58.0, 88.0, 116.0, 102.0, 169.0, 198.0, 366.0, 704.0, 3680.0, 90265.0, 927741.0, 21300.0, 1710.0, 523.0, 272.0, 191.0, 124.0, 111.0, 119.0, 76.0, 62.0, 53.0, 48.0, 37.0, 35.0, 21.0, 21.0, 17.0, 14.0, 10.0, 4.0, 7.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08184814453125, -0.0791482925415039, -0.07644844055175781, -0.07374858856201172, -0.07104873657226562, -0.06834888458251953, -0.06564903259277344, -0.06294918060302734, -0.06024932861328125, -0.057549476623535156, -0.05484962463378906, -0.05214977264404297, -0.049449920654296875, -0.04675006866455078, -0.04405021667480469, -0.041350364685058594, -0.0386505126953125, -0.035950660705566406, -0.03325080871582031, -0.03055095672607422, -0.027851104736328125, -0.02515125274658203, -0.022451400756835938, -0.019751548767089844, -0.01705169677734375, -0.014351844787597656, -0.011651992797851562, -0.008952140808105469, -0.006252288818359375, -0.0035524368286132812, -0.0008525848388671875, 0.0018472671508789062, 0.004547119140625, 0.007246971130371094, 0.009946823120117188, 0.012646675109863281, 0.015346527099609375, 0.01804637908935547, 0.020746231079101562, 0.023446083068847656, 0.02614593505859375, 0.028845787048339844, 0.03154563903808594, 0.03424549102783203, 0.036945343017578125, 0.03964519500732422, 0.04234504699707031, 0.045044898986816406, 0.0477447509765625, 0.050444602966308594, 0.05314445495605469, 0.05584430694580078, 0.058544158935546875, 0.06124401092529297, 0.06394386291503906, 0.06664371490478516, 0.06934356689453125, 0.07204341888427734, 0.07474327087402344, 0.07744312286376953, 0.08014297485351562, 0.08284282684326172, 0.08554267883300781, 0.0882425308227539, 0.0909423828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 6.0, 7.0, 5.0, 8.0, 13.0, 6.0, 10.0, 4.0, 11.0, 15.0, 24.0, 21.0, 19.0, 25.0, 22.0, 30.0, 30.0, 41.0, 32.0, 40.0, 44.0, 36.0, 38.0, 44.0, 37.0, 38.0, 44.0, 37.0, 37.0, 38.0, 25.0, 39.0, 15.0, 18.0, 26.0, 24.0, 16.0, 12.0, 14.0, 9.0, 8.0, 10.0, 9.0, 3.0, 4.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03826904296875, -0.03700685501098633, -0.035744667053222656, -0.034482479095458984, -0.03322029113769531, -0.03195810317993164, -0.03069591522216797, -0.029433727264404297, -0.028171539306640625, -0.026909351348876953, -0.02564716339111328, -0.02438497543334961, -0.023122787475585938, -0.021860599517822266, -0.020598411560058594, -0.019336223602294922, -0.01807403564453125, -0.016811847686767578, -0.015549659729003906, -0.014287471771240234, -0.013025283813476562, -0.01176309585571289, -0.010500907897949219, -0.009238719940185547, -0.007976531982421875, -0.006714344024658203, -0.005452156066894531, -0.004189968109130859, -0.0029277801513671875, -0.0016655921936035156, -0.00040340423583984375, 0.0008587837219238281, 0.0021209716796875, 0.003383159637451172, 0.004645347595214844, 0.005907535552978516, 0.0071697235107421875, 0.00843191146850586, 0.009694099426269531, 0.010956287384033203, 0.012218475341796875, 0.013480663299560547, 0.014742851257324219, 0.01600503921508789, 0.017267227172851562, 0.018529415130615234, 0.019791603088378906, 0.021053791046142578, 0.02231597900390625, 0.023578166961669922, 0.024840354919433594, 0.026102542877197266, 0.027364730834960938, 0.02862691879272461, 0.02988910675048828, 0.031151294708251953, 0.032413482666015625, 0.0336756706237793, 0.03493785858154297, 0.03620004653930664, 0.03746223449707031, 0.038724422454833984, 0.039986610412597656, 0.04124879837036133, 0.042510986328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 6.0, 14.0, 23.0, 47.0, 64.0, 165.0, 391.0, 1362.0, 9701.0, 1005077.0, 28689.0, 2099.0, 531.0, 185.0, 73.0, 42.0, 27.0, 12.0, 12.0, 9.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001360177993774414, -0.00013185106217861176, -0.0001276843249797821, -0.00012351758778095245, -0.0001193508505821228, -0.00011518411338329315, -0.0001110173761844635, -0.00010685063898563385, -0.0001026839017868042, -9.851716458797455e-05, -9.43504273891449e-05, -9.018369019031525e-05, -8.60169529914856e-05, -8.185021579265594e-05, -7.76834785938263e-05, -7.351674139499664e-05, -6.935000419616699e-05, -6.518326699733734e-05, -6.101652979850769e-05, -5.684979259967804e-05, -5.268305540084839e-05, -4.851631820201874e-05, -4.434958100318909e-05, -4.0182843804359436e-05, -3.6016106605529785e-05, -3.1849369406700134e-05, -2.7682632207870483e-05, -2.3515895009040833e-05, -1.934915781021118e-05, -1.518242061138153e-05, -1.101568341255188e-05, -6.848946213722229e-06, -2.682209014892578e-06, 1.4845281839370728e-06, 5.651265382766724e-06, 9.818002581596375e-06, 1.3984739780426025e-05, 1.8151476979255676e-05, 2.2318214178085327e-05, 2.6484951376914978e-05, 3.065168857574463e-05, 3.481842577457428e-05, 3.898516297340393e-05, 4.315190017223358e-05, 4.731863737106323e-05, 5.148537456989288e-05, 5.5652111768722534e-05, 5.9818848967552185e-05, 6.398558616638184e-05, 6.815232336521149e-05, 7.231906056404114e-05, 7.648579776287079e-05, 8.065253496170044e-05, 8.481927216053009e-05, 8.898600935935974e-05, 9.315274655818939e-05, 9.731948375701904e-05, 0.0001014862209558487, 0.00010565295815467834, 0.000109819695353508, 0.00011398643255233765, 0.0001181531697511673, 0.00012231990694999695, 0.0001264866441488266, 0.00013065338134765625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 5.0, 5.0, 11.0, 15.0, 12.0, 24.0, 51.0, 65.0, 74.0, 90.0, 138.0, 98.0, 96.0, 80.0, 84.0, 52.0, 24.0, 20.0, 14.0, 18.0, 7.0, 7.0, 0.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0848045349121094e-05, -1.0595656931400299e-05, -1.0343268513679504e-05, -1.009088009595871e-05, -9.838491678237915e-06, -9.58610326051712e-06, -9.333714842796326e-06, -9.081326425075531e-06, -8.828938007354736e-06, -8.576549589633942e-06, -8.324161171913147e-06, -8.071772754192352e-06, -7.819384336471558e-06, -7.566995918750763e-06, -7.314607501029968e-06, -7.062219083309174e-06, -6.809830665588379e-06, -6.557442247867584e-06, -6.3050538301467896e-06, -6.052665412425995e-06, -5.8002769947052e-06, -5.5478885769844055e-06, -5.295500159263611e-06, -5.043111741542816e-06, -4.7907233238220215e-06, -4.538334906101227e-06, -4.285946488380432e-06, -4.0335580706596375e-06, -3.7811696529388428e-06, -3.528781235218048e-06, -3.2763928174972534e-06, -3.0240043997764587e-06, -2.771615982055664e-06, -2.5192275643348694e-06, -2.2668391466140747e-06, -2.01445072889328e-06, -1.7620623111724854e-06, -1.5096738934516907e-06, -1.257285475730896e-06, -1.0048970580101013e-06, -7.525086402893066e-07, -5.00120222568512e-07, -2.477318048477173e-07, 4.6566128730773926e-09, 2.5704503059387207e-07, 5.094334483146667e-07, 7.618218660354614e-07, 1.014210283756256e-06, 1.2665987014770508e-06, 1.5189871191978455e-06, 1.7713755369186401e-06, 2.023763954639435e-06, 2.2761523723602295e-06, 2.528540790081024e-06, 2.780929207801819e-06, 3.0333176255226135e-06, 3.285706043243408e-06, 3.538094460964203e-06, 3.7904828786849976e-06, 4.042871296405792e-06, 4.295259714126587e-06, 4.547648131847382e-06, 4.800036549568176e-06, 5.052424967288971e-06, 5.304813385009766e-06]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 5.0, 13.0, 14.0, 16.0, 11.0, 31.0, 33.0, 45.0, 51.0, 76.0, 101.0, 143.0, 225.0, 321.0, 915.0, 7959.0, 966429.0, 68347.0, 2316.0, 552.0, 267.0, 175.0, 126.0, 81.0, 57.0, 57.0, 34.0, 31.0, 27.0, 18.0, 16.0, 7.0, 7.0, 9.0, 10.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.328655242919922e-05, -5.13661652803421e-05, -4.9445778131484985e-05, -4.752539098262787e-05, -4.560500383377075e-05, -4.3684616684913635e-05, -4.176422953605652e-05, -3.98438423871994e-05, -3.7923455238342285e-05, -3.600306808948517e-05, -3.408268094062805e-05, -3.2162293791770935e-05, -3.024190664291382e-05, -2.83215194940567e-05, -2.6401132345199585e-05, -2.4480745196342468e-05, -2.256035804748535e-05, -2.0639970898628235e-05, -1.8719583749771118e-05, -1.6799196600914e-05, -1.4878809452056885e-05, -1.2958422303199768e-05, -1.1038035154342651e-05, -9.117648005485535e-06, -7.197260856628418e-06, -5.276873707771301e-06, -3.3564865589141846e-06, -1.4360994100570679e-06, 4.842877388000488e-07, 2.4046748876571655e-06, 4.325062036514282e-06, 6.245449185371399e-06, 8.165836334228516e-06, 1.0086223483085632e-05, 1.2006610631942749e-05, 1.3926997780799866e-05, 1.5847384929656982e-05, 1.77677720785141e-05, 1.9688159227371216e-05, 2.1608546376228333e-05, 2.352893352508545e-05, 2.5449320673942566e-05, 2.7369707822799683e-05, 2.92900949716568e-05, 3.1210482120513916e-05, 3.313086926937103e-05, 3.505125641822815e-05, 3.6971643567085266e-05, 3.889203071594238e-05, 4.08124178647995e-05, 4.2732805013656616e-05, 4.465319216251373e-05, 4.657357931137085e-05, 4.8493966460227966e-05, 5.041435360908508e-05, 5.23347407579422e-05, 5.4255127906799316e-05, 5.617551505565643e-05, 5.809590220451355e-05, 6.0016289353370667e-05, 6.193667650222778e-05, 6.38570636510849e-05, 6.577745079994202e-05, 6.769783794879913e-05, 6.961822509765625e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 10.0, 6.0, 5.0, 5.0, 18.0, 12.0, 16.0, 19.0, 23.0, 40.0, 42.0, 41.0, 49.0, 62.0, 65.0, 87.0, 79.0, 64.0, 56.0, 47.0, 44.0, 44.0, 30.0, 20.0, 19.0, 18.0, 9.0, 16.0, 12.0, 9.0, 7.0, 4.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.491474151611328e-05, -2.401694655418396e-05, -2.311915159225464e-05, -2.2221356630325317e-05, -2.1323561668395996e-05, -2.0425766706466675e-05, -1.9527971744537354e-05, -1.8630176782608032e-05, -1.773238182067871e-05, -1.683458685874939e-05, -1.593679189682007e-05, -1.5038996934890747e-05, -1.4141201972961426e-05, -1.3243407011032104e-05, -1.2345612049102783e-05, -1.1447817087173462e-05, -1.055002212524414e-05, -9.65222716331482e-06, -8.754432201385498e-06, -7.856637239456177e-06, -6.9588422775268555e-06, -6.061047315597534e-06, -5.163252353668213e-06, -4.265457391738892e-06, -3.3676624298095703e-06, -2.469867467880249e-06, -1.5720725059509277e-06, -6.742775440216064e-07, 2.2351741790771484e-07, 1.1213123798370361e-06, 2.0191073417663574e-06, 2.9169023036956787e-06, 3.814697265625e-06, 4.712492227554321e-06, 5.610287189483643e-06, 6.508082151412964e-06, 7.405877113342285e-06, 8.303672075271606e-06, 9.201467037200928e-06, 1.0099261999130249e-05, 1.099705696105957e-05, 1.1894851922988892e-05, 1.2792646884918213e-05, 1.3690441846847534e-05, 1.4588236808776855e-05, 1.5486031770706177e-05, 1.6383826732635498e-05, 1.728162169456482e-05, 1.817941665649414e-05, 1.9077211618423462e-05, 1.9975006580352783e-05, 2.0872801542282104e-05, 2.1770596504211426e-05, 2.2668391466140747e-05, 2.356618642807007e-05, 2.446398138999939e-05, 2.536177635192871e-05, 2.6259571313858032e-05, 2.7157366275787354e-05, 2.8055161237716675e-05, 2.8952956199645996e-05, 2.9850751161575317e-05, 3.074854612350464e-05, 3.164634108543396e-05, 3.254413604736328e-05]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 965.0, 37.0, 6.0, 0.0, 1.0], "bins": [-2.155596971511841, -2.1194586753845215, -2.083320379257202, -2.0471818447113037, -2.0110435485839844, -1.974905252456665, -1.9387669563293457, -1.9026286602020264, -1.8664902448654175, -1.8303519487380981, -1.7942135334014893, -1.75807523727417, -1.7219369411468506, -1.6857985258102417, -1.6496602296829224, -1.6135218143463135, -1.5773835182189941, -1.5412452220916748, -1.505106806755066, -1.4689685106277466, -1.4328300952911377, -1.3966917991638184, -1.360553503036499, -1.3244152069091797, -1.2882767915725708, -1.2521384954452515, -1.2160000801086426, -1.1798617839813232, -1.143723487854004, -1.107585072517395, -1.0714467763900757, -1.0353083610534668, -0.9991700053215027, -0.9630316495895386, -0.9268933534622192, -0.8907549977302551, -0.854616641998291, -0.8184782862663269, -0.7823399305343628, -0.7462016344070435, -0.7100632786750793, -0.6739249229431152, -0.6377866268157959, -0.6016482710838318, -0.5655099153518677, -0.5293715596199036, -0.49323323369026184, -0.4570949077606201, -0.420956552028656, -0.3848181962966919, -0.34867987036705017, -0.31254154443740845, -0.27640318870544434, -0.24026484787464142, -0.2041265070438385, -0.16798818111419678, -0.13184982538223267, -0.09571148455142975, -0.05957314372062683, -0.023434802889823914, 0.012703537940979004, 0.04884187877178192, 0.08498021960258484, 0.12111854553222656, 0.15725690126419067]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 2.0, 5.0, 4.0, 13.0, 12.0, 15.0, 21.0, 28.0, 40.0, 50.0, 72.0, 79.0, 107.0, 96.0, 96.0, 82.0, 71.0, 38.0, 45.0, 29.0, 22.0, 13.0, 12.0, 8.0, 6.0, 1.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48047685623168945, -0.4644232988357544, -0.44836974143981934, -0.4323161840438843, -0.4162626266479492, -0.40020906925201416, -0.3841554820537567, -0.36810192465782166, -0.3520483672618866, -0.33599480986595154, -0.3199412524700165, -0.3038876950740814, -0.287834107875824, -0.2717805504798889, -0.25572699308395386, -0.2396734356880188, -0.22361987829208374, -0.20756632089614868, -0.19151276350021362, -0.17545919120311737, -0.1594056338071823, -0.14335207641124725, -0.127298504114151, -0.11124494671821594, -0.09519138932228088, -0.07913783192634583, -0.06308426707983017, -0.04703070595860481, -0.030977144837379456, -0.014923587441444397, 0.0011299774050712585, 0.017183542251586914, 0.0332370400428772, 0.049290601164102554, 0.06534416228532791, 0.08139772713184357, 0.09745128452777863, 0.11350484192371368, 0.12955841422080994, 0.145611971616745, 0.16166552901268005, 0.1777190864086151, 0.19377264380455017, 0.20982621610164642, 0.22587977349758148, 0.24193333089351654, 0.2579869031906128, 0.27404046058654785, 0.2900940179824829, 0.30614757537841797, 0.322201132774353, 0.3382546901702881, 0.35430824756622314, 0.3703618049621582, 0.38641539216041565, 0.4024689495563507, 0.41852250695228577, 0.4345760643482208, 0.4506296217441559, 0.46668317914009094, 0.4827367663383484, 0.49879032373428345, 0.5148438811302185, 0.5308974385261536, 0.5469509959220886]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 8.0, 6.0, 15.0, 12.0, 27.0, 32.0, 51.0, 110.0, 171.0, 312.0, 607.0, 1264.0, 3046.0, 9516.0, 4055298.0, 105873.0, 10079.0, 3851.0, 1783.0, 940.0, 529.0, 278.0, 165.0, 101.0, 62.0, 42.0, 24.0, 23.0, 15.0, 10.0, 9.0, 3.0, 3.0, 6.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.134521484375, -0.1301727294921875, -0.125823974609375, -0.1214752197265625, -0.11712646484375, -0.1127777099609375, -0.108428955078125, -0.1040802001953125, -0.0997314453125, -0.0953826904296875, -0.091033935546875, -0.0866851806640625, -0.08233642578125, -0.0779876708984375, -0.073638916015625, -0.0692901611328125, -0.06494140625, -0.0605926513671875, -0.056243896484375, -0.0518951416015625, -0.04754638671875, -0.0431976318359375, -0.038848876953125, -0.0345001220703125, -0.0301513671875, -0.0258026123046875, -0.021453857421875, -0.0171051025390625, -0.01275634765625, -0.0084075927734375, -0.004058837890625, 0.0002899169921875, 0.004638671875, 0.0089874267578125, 0.013336181640625, 0.0176849365234375, 0.02203369140625, 0.0263824462890625, 0.030731201171875, 0.0350799560546875, 0.0394287109375, 0.0437774658203125, 0.048126220703125, 0.0524749755859375, 0.05682373046875, 0.0611724853515625, 0.065521240234375, 0.0698699951171875, 0.07421875, 0.0785675048828125, 0.082916259765625, 0.0872650146484375, 0.09161376953125, 0.0959625244140625, 0.100311279296875, 0.1046600341796875, 0.1090087890625, 0.1133575439453125, 0.117706298828125, 0.1220550537109375, 0.12640380859375, 0.1307525634765625, 0.135101318359375, 0.1394500732421875, 0.143798828125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 4.0, 8.0, 8.0, 5.0, 12.0, 14.0, 13.0, 61.0, 586.0, 163.0, 17.0, 9.0, 9.0, 11.0, 11.0, 5.0, 8.0, 4.0, 5.0, 4.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01287078857421875, -0.012455344200134277, -0.012039899826049805, -0.011624455451965332, -0.01120901107788086, -0.010793566703796387, -0.010378122329711914, -0.009962677955627441, -0.009547233581542969, -0.009131789207458496, -0.008716344833374023, -0.00830090045928955, -0.007885456085205078, -0.0074700117111206055, -0.007054567337036133, -0.00663912296295166, -0.0062236785888671875, -0.005808234214782715, -0.005392789840698242, -0.0049773454666137695, -0.004561901092529297, -0.004146456718444824, -0.0037310123443603516, -0.003315567970275879, -0.0029001235961914062, -0.0024846792221069336, -0.002069234848022461, -0.0016537904739379883, -0.0012383460998535156, -0.000822901725769043, -0.0004074573516845703, 7.987022399902344e-06, 0.000423431396484375, 0.0008388757705688477, 0.0012543201446533203, 0.001669764518737793, 0.0020852088928222656, 0.0025006532669067383, 0.002916097640991211, 0.0033315420150756836, 0.0037469863891601562, 0.004162430763244629, 0.0045778751373291016, 0.004993319511413574, 0.005408763885498047, 0.0058242082595825195, 0.006239652633666992, 0.006655097007751465, 0.0070705413818359375, 0.00748598575592041, 0.007901430130004883, 0.008316874504089355, 0.008732318878173828, 0.0091477632522583, 0.009563207626342773, 0.009978652000427246, 0.010394096374511719, 0.010809540748596191, 0.011224985122680664, 0.011640429496765137, 0.01205587387084961, 0.012471318244934082, 0.012886762619018555, 0.013302206993103027, 0.0137176513671875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 7.0, 8.0, 15.0, 22.0, 17.0, 35.0, 34.0, 54.0, 80.0, 124.0, 188.0, 349.0, 933.0, 6635.0, 4133695.0, 48788.0, 2022.0, 522.0, 241.0, 146.0, 102.0, 64.0, 50.0, 29.0, 22.0, 14.0, 23.0, 11.0, 9.0, 11.0, 4.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.254638671875, -0.24686241149902344, -0.23908615112304688, -0.2313098907470703, -0.22353363037109375, -0.2157573699951172, -0.20798110961914062, -0.20020484924316406, -0.1924285888671875, -0.18465232849121094, -0.17687606811523438, -0.1690998077392578, -0.16132354736328125, -0.1535472869873047, -0.14577102661132812, -0.13799476623535156, -0.130218505859375, -0.12244224548339844, -0.11466598510742188, -0.10688972473144531, -0.09911346435546875, -0.09133720397949219, -0.08356094360351562, -0.07578468322753906, -0.0680084228515625, -0.06023216247558594, -0.052455902099609375, -0.04467964172363281, -0.03690338134765625, -0.029127120971679688, -0.021350860595703125, -0.013574600219726562, -0.00579833984375, 0.0019779205322265625, 0.009754180908203125, 0.017530441284179688, 0.02530670166015625, 0.03308296203613281, 0.040859222412109375, 0.04863548278808594, 0.0564117431640625, 0.06418800354003906, 0.07196426391601562, 0.07974052429199219, 0.08751678466796875, 0.09529304504394531, 0.10306930541992188, 0.11084556579589844, 0.118621826171875, 0.12639808654785156, 0.13417434692382812, 0.1419506072998047, 0.14972686767578125, 0.1575031280517578, 0.16527938842773438, 0.17305564880371094, 0.1808319091796875, 0.18860816955566406, 0.19638442993164062, 0.2041606903076172, 0.21193695068359375, 0.2197132110595703, 0.22748947143554688, 0.23526573181152344, 0.2430419921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 2.0, 8.0, 4.0, 9.0, 16.0, 18.0, 20.0, 30.0, 32.0, 56.0, 54.0, 71.0, 135.0, 2481.0, 701.0, 117.0, 89.0, 54.0, 36.0, 32.0, 25.0, 18.0, 7.0, 10.0, 10.0, 8.0, 12.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03759765625, -0.036457061767578125, -0.03531646728515625, -0.034175872802734375, -0.0330352783203125, -0.031894683837890625, -0.03075408935546875, -0.029613494873046875, -0.028472900390625, -0.027332305908203125, -0.02619171142578125, -0.025051116943359375, -0.0239105224609375, -0.022769927978515625, -0.02162933349609375, -0.020488739013671875, -0.01934814453125, -0.018207550048828125, -0.01706695556640625, -0.015926361083984375, -0.0147857666015625, -0.013645172119140625, -0.01250457763671875, -0.011363983154296875, -0.010223388671875, -0.009082794189453125, -0.00794219970703125, -0.006801605224609375, -0.0056610107421875, -0.004520416259765625, -0.00337982177734375, -0.002239227294921875, -0.0010986328125, 4.1961669921875e-05, 0.00118255615234375, 0.002323150634765625, 0.0034637451171875, 0.004604339599609375, 0.00574493408203125, 0.006885528564453125, 0.008026123046875, 0.009166717529296875, 0.01030731201171875, 0.011447906494140625, 0.0125885009765625, 0.013729095458984375, 0.01486968994140625, 0.016010284423828125, 0.01715087890625, 0.018291473388671875, 0.01943206787109375, 0.020572662353515625, 0.0217132568359375, 0.022853851318359375, 0.02399444580078125, 0.025135040283203125, 0.026275634765625, 0.027416229248046875, 0.02855682373046875, 0.029697418212890625, 0.0308380126953125, 0.031978607177734375, 0.03311920166015625, 0.034259796142578125, 0.035400390625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 7.0, 98.0, 855.0, 38.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.262847900390625, -0.2575269937515259, -0.25220605731010437, -0.24688513576984406, -0.24156421422958374, -0.23624329268932343, -0.2309223711490631, -0.225601464509964, -0.22028052806854248, -0.21495960652828217, -0.20963868498802185, -0.20431776344776154, -0.19899684190750122, -0.1936759203672409, -0.1883549988269806, -0.18303409218788147, -0.17771317064762115, -0.17239224910736084, -0.16707132756710052, -0.1617504060268402, -0.1564294844865799, -0.15110856294631958, -0.14578765630722046, -0.14046671986579895, -0.13514581322669983, -0.12982489168643951, -0.1245039701461792, -0.11918304860591888, -0.11386212706565857, -0.10854120552539825, -0.10322029143571854, -0.09789936989545822, -0.09257844090461731, -0.087257519364357, -0.08193659782409668, -0.07661567628383636, -0.07129475474357605, -0.06597383320331573, -0.06065291911363602, -0.0553319975733757, -0.05001107603311539, -0.04469015449285507, -0.03936923295259476, -0.03404831513762474, -0.028727393597364426, -0.02340647205710411, -0.018085554242134094, -0.01276463270187378, -0.007443711161613464, -0.002122790552675724, 0.0031981300562620163, 0.008519049733877182, 0.013839971274137497, 0.019160892814397812, 0.02448181062936783, 0.029802732169628143, 0.03512365370988846, 0.04044457525014877, 0.04576549679040909, 0.051086414605379105, 0.05640733614563942, 0.061728257685899734, 0.06704917550086975, 0.07237009704113007, 0.07769101858139038]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 3.0, 5.0, 7.0, 2.0, 8.0, 11.0, 8.0, 11.0, 20.0, 25.0, 42.0, 54.0, 65.0, 99.0, 85.0, 92.0, 99.0, 94.0, 62.0, 53.0, 41.0, 37.0, 19.0, 17.0, 9.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1677730679512024, -0.1625528782606125, -0.15733268857002258, -0.15211249887943268, -0.14689230918884277, -0.14167211949825287, -0.13645192980766296, -0.13123172521591187, -0.12601155042648315, -0.12079136073589325, -0.11557117104530334, -0.11035098135471344, -0.10513079166412354, -0.09991060197353363, -0.09469040483236313, -0.08947021514177322, -0.08425001800060272, -0.07902982831001282, -0.07380963861942291, -0.06858944892883301, -0.0633692592382431, -0.0581490658223629, -0.0529288724064827, -0.04770868271589279, -0.04248849302530289, -0.03726830333471298, -0.03204811364412308, -0.026827920228242874, -0.02160773053765297, -0.016387540847063065, -0.011167347431182861, -0.0059471577405929565, -0.0007269680500030518, 0.004493222571909428, 0.009713413193821907, 0.014933604747056961, 0.020153794437646866, 0.02537398412823677, 0.030594177544116974, 0.03581436723470688, 0.04103455692529678, 0.04625474661588669, 0.05147493630647659, 0.056695129722356796, 0.0619153194129467, 0.0671355128288269, 0.07235570251941681, 0.07757589221000671, 0.08279608190059662, 0.08801627159118652, 0.09323646128177643, 0.09845665097236633, 0.10367684066295624, 0.10889703035354614, 0.11411722749471664, 0.11933741718530655, 0.12455760687589645, 0.12977780401706696, 0.13499799370765686, 0.14021818339824677, 0.14543837308883667, 0.15065856277942657, 0.15587875247001648, 0.16109894216060638, 0.1663191318511963]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 9.0, 9.0, 11.0, 12.0, 30.0, 33.0, 52.0, 63.0, 96.0, 143.0, 166.0, 251.0, 397.0, 527.0, 846.0, 1283.0, 2041.0, 3472.0, 6262.0, 13193.0, 42240.0, 904518.0, 43173.0, 13474.0, 6511.0, 3510.0, 2046.0, 1334.0, 842.0, 585.0, 401.0, 290.0, 201.0, 134.0, 111.0, 80.0, 57.0, 47.0, 28.0, 23.0, 13.0, 16.0, 7.0, 8.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.039581298828125, -0.0382843017578125, -0.0369873046875, -0.0356903076171875, -0.034393310546875, -0.0330963134765625, -0.03179931640625, -0.0305023193359375, -0.029205322265625, -0.0279083251953125, -0.026611328125, -0.0253143310546875, -0.024017333984375, -0.0227203369140625, -0.02142333984375, -0.0201263427734375, -0.018829345703125, -0.0175323486328125, -0.0162353515625, -0.0149383544921875, -0.013641357421875, -0.0123443603515625, -0.01104736328125, -0.0097503662109375, -0.008453369140625, -0.0071563720703125, -0.005859375, -0.0045623779296875, -0.003265380859375, -0.0019683837890625, -0.00067138671875, 0.0006256103515625, 0.001922607421875, 0.0032196044921875, 0.0045166015625, 0.0058135986328125, 0.007110595703125, 0.0084075927734375, 0.00970458984375, 0.0110015869140625, 0.012298583984375, 0.0135955810546875, 0.014892578125, 0.0161895751953125, 0.017486572265625, 0.0187835693359375, 0.02008056640625, 0.0213775634765625, 0.022674560546875, 0.0239715576171875, 0.0252685546875, 0.0265655517578125, 0.027862548828125, 0.0291595458984375, 0.03045654296875, 0.0317535400390625, 0.033050537109375, 0.0343475341796875, 0.03564453125, 0.0369415283203125, 0.038238525390625, 0.0395355224609375, 0.04083251953125, 0.0421295166015625, 0.043426513671875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 5.0, 4.0, 1.0, 7.0, 4.0, 4.0, 10.0, 11.0, 6.0, 13.0, 10.0, 38.0, 259.0, 438.0, 84.0, 14.0, 13.0, 8.0, 9.0, 11.0, 7.0, 6.0, 4.0, 6.0, 4.0, 3.0, 3.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01080322265625, -0.010449647903442383, -0.010096073150634766, -0.009742498397827148, -0.009388923645019531, -0.009035348892211914, -0.008681774139404297, -0.00832819938659668, -0.007974624633789062, -0.007621049880981445, -0.007267475128173828, -0.006913900375366211, -0.006560325622558594, -0.0062067508697509766, -0.005853176116943359, -0.005499601364135742, -0.005146026611328125, -0.004792451858520508, -0.004438877105712891, -0.0040853023529052734, -0.0037317276000976562, -0.003378152847290039, -0.003024578094482422, -0.0026710033416748047, -0.0023174285888671875, -0.0019638538360595703, -0.0016102790832519531, -0.001256704330444336, -0.0009031295776367188, -0.0005495548248291016, -0.00019598007202148438, 0.0001575946807861328, 0.00051116943359375, 0.0008647441864013672, 0.0012183189392089844, 0.0015718936920166016, 0.0019254684448242188, 0.002279043197631836, 0.002632617950439453, 0.0029861927032470703, 0.0033397674560546875, 0.0036933422088623047, 0.004046916961669922, 0.004400491714477539, 0.004754066467285156, 0.0051076412200927734, 0.005461215972900391, 0.005814790725708008, 0.006168365478515625, 0.006521940231323242, 0.006875514984130859, 0.0072290897369384766, 0.007582664489746094, 0.007936239242553711, 0.008289813995361328, 0.008643388748168945, 0.008996963500976562, 0.00935053825378418, 0.009704113006591797, 0.010057687759399414, 0.010411262512207031, 0.010764837265014648, 0.011118412017822266, 0.011471986770629883, 0.0118255615234375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 9.0, 7.0, 10.0, 11.0, 13.0, 21.0, 24.0, 36.0, 34.0, 42.0, 46.0, 66.0, 70.0, 87.0, 97.0, 125.0, 175.0, 254.0, 539.0, 2198.0, 49141.0, 979576.0, 13276.0, 1228.0, 407.0, 223.0, 163.0, 134.0, 110.0, 81.0, 59.0, 57.0, 47.0, 31.0, 31.0, 25.0, 21.0, 19.0, 15.0, 11.0, 13.0, 7.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0966796875, -0.093780517578125, -0.09088134765625, -0.087982177734375, -0.0850830078125, -0.082183837890625, -0.07928466796875, -0.076385498046875, -0.073486328125, -0.070587158203125, -0.06768798828125, -0.064788818359375, -0.0618896484375, -0.058990478515625, -0.05609130859375, -0.053192138671875, -0.05029296875, -0.047393798828125, -0.04449462890625, -0.041595458984375, -0.0386962890625, -0.035797119140625, -0.03289794921875, -0.029998779296875, -0.027099609375, -0.024200439453125, -0.02130126953125, -0.018402099609375, -0.0155029296875, -0.012603759765625, -0.00970458984375, -0.006805419921875, -0.00390625, -0.001007080078125, 0.00189208984375, 0.004791259765625, 0.0076904296875, 0.010589599609375, 0.01348876953125, 0.016387939453125, 0.019287109375, 0.022186279296875, 0.02508544921875, 0.027984619140625, 0.0308837890625, 0.033782958984375, 0.03668212890625, 0.039581298828125, 0.04248046875, 0.045379638671875, 0.04827880859375, 0.051177978515625, 0.0540771484375, 0.056976318359375, 0.05987548828125, 0.062774658203125, 0.065673828125, 0.068572998046875, 0.07147216796875, 0.074371337890625, 0.0772705078125, 0.080169677734375, 0.08306884765625, 0.085968017578125, 0.0888671875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 4.0, 8.0, 5.0, 6.0, 9.0, 12.0, 17.0, 14.0, 24.0, 17.0, 27.0, 28.0, 28.0, 23.0, 27.0, 36.0, 44.0, 48.0, 50.0, 39.0, 56.0, 54.0, 38.0, 41.0, 35.0, 43.0, 44.0, 47.0, 21.0, 23.0, 15.0, 22.0, 14.0, 11.0, 9.0, 8.0, 9.0, 8.0, 7.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0308074951171875, -0.029883384704589844, -0.028959274291992188, -0.02803516387939453, -0.027111053466796875, -0.02618694305419922, -0.025262832641601562, -0.024338722229003906, -0.02341461181640625, -0.022490501403808594, -0.021566390991210938, -0.02064228057861328, -0.019718170166015625, -0.01879405975341797, -0.017869949340820312, -0.016945838928222656, -0.016021728515625, -0.015097618103027344, -0.014173507690429688, -0.013249397277832031, -0.012325286865234375, -0.011401176452636719, -0.010477066040039062, -0.009552955627441406, -0.00862884521484375, -0.007704734802246094, -0.0067806243896484375, -0.005856513977050781, -0.004932403564453125, -0.004008293151855469, -0.0030841827392578125, -0.0021600723266601562, -0.0012359619140625, -0.00031185150146484375, 0.0006122589111328125, 0.0015363693237304688, 0.002460479736328125, 0.0033845901489257812, 0.0043087005615234375, 0.005232810974121094, 0.00615692138671875, 0.007081031799316406, 0.008005142211914062, 0.008929252624511719, 0.009853363037109375, 0.010777473449707031, 0.011701583862304688, 0.012625694274902344, 0.0135498046875, 0.014473915100097656, 0.015398025512695312, 0.01632213592529297, 0.017246246337890625, 0.01817035675048828, 0.019094467163085938, 0.020018577575683594, 0.02094268798828125, 0.021866798400878906, 0.022790908813476562, 0.02371501922607422, 0.024639129638671875, 0.02556324005126953, 0.026487350463867188, 0.027411460876464844, 0.0283355712890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 10.0, 14.0, 23.0, 42.0, 42.0, 57.0, 85.0, 153.0, 200.0, 368.0, 828.0, 2850.0, 51927.0, 981696.0, 7426.0, 1506.0, 490.0, 271.0, 170.0, 107.0, 69.0, 53.0, 39.0, 31.0, 14.0, 14.0, 13.0, 11.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00019669532775878906, -0.00019059516489505768, -0.0001844950020313263, -0.0001783948391675949, -0.00017229467630386353, -0.00016619451344013214, -0.00016009435057640076, -0.00015399418771266937, -0.000147894024848938, -0.0001417938619852066, -0.00013569369912147522, -0.00012959353625774384, -0.00012349337339401245, -0.00011739321053028107, -0.00011129304766654968, -0.0001051928848028183, -9.909272193908691e-05, -9.299255907535553e-05, -8.689239621162415e-05, -8.079223334789276e-05, -7.469207048416138e-05, -6.859190762042999e-05, -6.249174475669861e-05, -5.6391581892967224e-05, -5.029141902923584e-05, -4.4191256165504456e-05, -3.809109330177307e-05, -3.199093043804169e-05, -2.5890767574310303e-05, -1.979060471057892e-05, -1.3690441846847534e-05, -7.59027898311615e-06, -1.4901161193847656e-06, 4.610046744346619e-06, 1.0710209608078003e-05, 1.6810372471809387e-05, 2.291053533554077e-05, 2.9010698199272156e-05, 3.511086106300354e-05, 4.1211023926734924e-05, 4.731118679046631e-05, 5.341134965419769e-05, 5.951151251792908e-05, 6.561167538166046e-05, 7.171183824539185e-05, 7.781200110912323e-05, 8.391216397285461e-05, 9.0012326836586e-05, 9.611248970031738e-05, 0.00010221265256404877, 0.00010831281542778015, 0.00011441297829151154, 0.00012051314115524292, 0.0001266133040189743, 0.0001327134668827057, 0.00013881362974643707, 0.00014491379261016846, 0.00015101395547389984, 0.00015711411833763123, 0.0001632142812013626, 0.000169314444065094, 0.00017541460692882538, 0.00018151476979255676, 0.00018761493265628815, 0.00019371509552001953]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 5.0, 9.0, 10.0, 14.0, 20.0, 33.0, 40.0, 65.0, 85.0, 61.0, 108.0, 81.0, 101.0, 76.0, 79.0, 43.0, 57.0, 23.0, 29.0, 19.0, 8.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.185604095458984e-06, -4.974193871021271e-06, -4.762783646583557e-06, -4.5513734221458435e-06, -4.33996319770813e-06, -4.128552973270416e-06, -3.917142748832703e-06, -3.705732524394989e-06, -3.4943222999572754e-06, -3.2829120755195618e-06, -3.071501851081848e-06, -2.8600916266441345e-06, -2.648681402206421e-06, -2.4372711777687073e-06, -2.2258609533309937e-06, -2.01445072889328e-06, -1.8030405044555664e-06, -1.5916302800178528e-06, -1.3802200555801392e-06, -1.1688098311424255e-06, -9.57399606704712e-07, -7.459893822669983e-07, -5.345791578292847e-07, -3.2316893339157104e-07, -1.1175870895385742e-07, 9.96515154838562e-08, 3.110617399215698e-07, 5.224719643592834e-07, 7.338821887969971e-07, 9.452924132347107e-07, 1.1567026376724243e-06, 1.368112862110138e-06, 1.5795230865478516e-06, 1.7909333109855652e-06, 2.002343535423279e-06, 2.2137537598609924e-06, 2.425163984298706e-06, 2.6365742087364197e-06, 2.8479844331741333e-06, 3.059394657611847e-06, 3.2708048820495605e-06, 3.482215106487274e-06, 3.693625330924988e-06, 3.905035555362701e-06, 4.116445779800415e-06, 4.327856004238129e-06, 4.539266228675842e-06, 4.750676453113556e-06, 4.9620866775512695e-06, 5.173496901988983e-06, 5.384907126426697e-06, 5.59631735086441e-06, 5.807727575302124e-06, 6.019137799739838e-06, 6.230548024177551e-06, 6.441958248615265e-06, 6.6533684730529785e-06, 6.864778697490692e-06, 7.076188921928406e-06, 7.287599146366119e-06, 7.499009370803833e-06, 7.710419595241547e-06, 7.92182981967926e-06, 8.133240044116974e-06, 8.344650268554688e-06]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 13.0, 19.0, 28.0, 27.0, 52.0, 94.0, 158.0, 367.0, 1885.0, 1031367.0, 13345.0, 654.0, 238.0, 107.0, 57.0, 43.0, 31.0, 26.0, 5.0, 9.0, 11.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002770423889160156, -0.0002666749060153961, -0.0002563074231147766, -0.0002459399402141571, -0.0002355724573135376, -0.0002252049744129181, -0.00021483749151229858, -0.00020447000861167908, -0.00019410252571105957, -0.00018373504281044006, -0.00017336755990982056, -0.00016300007700920105, -0.00015263259410858154, -0.00014226511120796204, -0.00013189762830734253, -0.00012153014540672302, -0.00011116266250610352, -0.00010079517960548401, -9.04276967048645e-05, -8.0060213804245e-05, -6.969273090362549e-05, -5.932524800300598e-05, -4.8957765102386475e-05, -3.859028220176697e-05, -2.822279930114746e-05, -1.7855316400527954e-05, -7.487833499908447e-06, 2.8796494007110596e-06, 1.3247132301330566e-05, 2.3614615201950073e-05, 3.398209810256958e-05, 4.434958100318909e-05, 5.4717063903808594e-05, 6.50845468044281e-05, 7.545202970504761e-05, 8.581951260566711e-05, 9.618699550628662e-05, 0.00010655447840690613, 0.00011692196130752563, 0.00012728944420814514, 0.00013765692710876465, 0.00014802441000938416, 0.00015839189291000366, 0.00016875937581062317, 0.00017912685871124268, 0.00018949434161186218, 0.0001998618245124817, 0.0002102293074131012, 0.0002205967903137207, 0.0002309642732143402, 0.00024133175611495972, 0.0002516992390155792, 0.00026206672191619873, 0.00027243420481681824, 0.00028280168771743774, 0.00029316917061805725, 0.00030353665351867676, 0.00031390413641929626, 0.00032427161931991577, 0.0003346391022205353, 0.0003450065851211548, 0.0003553740680217743, 0.0003657415509223938, 0.0003761090338230133, 0.0003864765167236328]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 11.0, 3.0, 11.0, 11.0, 12.0, 36.0, 35.0, 62.0, 106.0, 131.0, 165.0, 153.0, 94.0, 54.0, 40.0, 22.0, 18.0, 9.0, 11.0, 5.0, 4.0, 5.0, 7.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.641315460205078e-05, -7.329508662223816e-05, -7.017701864242554e-05, -6.705895066261292e-05, -6.394088268280029e-05, -6.082281470298767e-05, -5.770474672317505e-05, -5.458667874336243e-05, -5.1468610763549805e-05, -4.835054278373718e-05, -4.523247480392456e-05, -4.211440682411194e-05, -3.8996338844299316e-05, -3.5878270864486694e-05, -3.276020288467407e-05, -2.964213490486145e-05, -2.6524066925048828e-05, -2.3405998945236206e-05, -2.0287930965423584e-05, -1.7169862985610962e-05, -1.405179500579834e-05, -1.0933727025985718e-05, -7.815659046173096e-06, -4.697591066360474e-06, -1.5795230865478516e-06, 1.5385448932647705e-06, 4.656612873077393e-06, 7.774680852890015e-06, 1.0892748832702637e-05, 1.4010816812515259e-05, 1.712888479232788e-05, 2.0246952772140503e-05, 2.3365020751953125e-05, 2.6483088731765747e-05, 2.960115671157837e-05, 3.271922469139099e-05, 3.583729267120361e-05, 3.8955360651016235e-05, 4.207342863082886e-05, 4.519149661064148e-05, 4.83095645904541e-05, 5.1427632570266724e-05, 5.4545700550079346e-05, 5.766376852989197e-05, 6.078183650970459e-05, 6.389990448951721e-05, 6.701797246932983e-05, 7.013604044914246e-05, 7.325410842895508e-05, 7.63721764087677e-05, 7.949024438858032e-05, 8.260831236839294e-05, 8.572638034820557e-05, 8.884444832801819e-05, 9.196251630783081e-05, 9.508058428764343e-05, 9.819865226745605e-05, 0.00010131672024726868, 0.0001044347882270813, 0.00010755285620689392, 0.00011067092418670654, 0.00011378899216651917, 0.00011690706014633179, 0.00012002512812614441, 0.00012314319610595703]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 977.0, 35.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.464580774307251, -1.4350593090057373, -1.4055379629135132, -1.3760164976119995, -1.3464950323104858, -1.3169736862182617, -1.287452220916748, -1.2579307556152344, -1.2284094095230103, -1.1988879442214966, -1.1693665981292725, -1.1398451328277588, -1.1103236675262451, -1.080802321434021, -1.0512808561325073, -1.0217595100402832, -0.9922380447387695, -0.9627166390419006, -0.933195173740387, -0.9036737680435181, -0.8741523623466492, -0.8446309566497803, -0.8151094913482666, -0.7855880856513977, -0.756066620349884, -0.7265452146530151, -0.6970237493515015, -0.6675023436546326, -0.6379809379577637, -0.60845947265625, -0.5789380669593811, -0.5494166612625122, -0.5198952555656433, -0.490373820066452, -0.46085241436958313, -0.43133097887039185, -0.40180957317352295, -0.37228813767433167, -0.3427667021751404, -0.3132452964782715, -0.2837238907814026, -0.2542024552822113, -0.2246810495853424, -0.19515961408615112, -0.16563820838928223, -0.13611677289009094, -0.10659535229206085, -0.07707393169403076, -0.04755249619483948, -0.018031073734164238, 0.011490348726511002, 0.04101177304983139, 0.07053319364786148, 0.10005462169647217, 0.12957604229450226, 0.15909746289253235, 0.18861888349056244, 0.21814030408859253, 0.24766172468662262, 0.2771831452846527, 0.306704580783844, 0.3362259864807129, 0.3657474219799042, 0.39526885747909546, 0.42479026317596436]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 7.0, 4.0, 11.0, 11.0, 17.0, 19.0, 35.0, 31.0, 48.0, 44.0, 60.0, 69.0, 69.0, 67.0, 59.0, 77.0, 66.0, 65.0, 51.0, 43.0, 25.0, 37.0, 20.0, 17.0, 21.0, 10.0, 8.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.42555153369903564, -0.4158328175544739, -0.4061141014099121, -0.39639535546302795, -0.3866766393184662, -0.3769579231739044, -0.36723917722702026, -0.3575204610824585, -0.34780174493789673, -0.33808302879333496, -0.3283643126487732, -0.31864556670188904, -0.30892685055732727, -0.2992081344127655, -0.28948938846588135, -0.2797706723213196, -0.2700519561767578, -0.26033324003219604, -0.2506145238876343, -0.24089577794075012, -0.23117706179618835, -0.2214583456516266, -0.21173961460590363, -0.20202088356018066, -0.1923021674156189, -0.18258345127105713, -0.17286472022533417, -0.1631459891796112, -0.15342727303504944, -0.14370855689048767, -0.1339898258447647, -0.12427110224962234, -0.11455237865447998, -0.10483365505933762, -0.09511493146419525, -0.08539620786905289, -0.07567748427391052, -0.06595876067876816, -0.05624003708362579, -0.04652131348848343, -0.036802589893341064, -0.0270838662981987, -0.017365142703056335, -0.007646419107913971, 0.0020723044872283936, 0.011791028082370758, 0.021509751677513123, 0.031228475272655487, 0.04094719886779785, 0.050665922462940216, 0.06038464605808258, 0.07010336965322495, 0.07982209324836731, 0.08954081684350967, 0.09925954043865204, 0.1089782640337944, 0.11869698762893677, 0.12841570377349854, 0.1381344348192215, 0.14785316586494446, 0.15757188200950623, 0.167290598154068, 0.17700932919979095, 0.18672806024551392, 0.19644677639007568]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 5.0, 3.0, 6.0, 11.0, 8.0, 8.0, 23.0, 31.0, 59.0, 109.0, 273.0, 839.0, 4639.0, 4180180.0, 5912.0, 1271.0, 457.0, 189.0, 95.0, 52.0, 28.0, 18.0, 9.0, 13.0, 6.0, 9.0, 2.0, 6.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.156494140625, -0.1513671875, -0.146240234375, -0.14111328125, -0.135986328125, -0.130859375, -0.125732421875, -0.12060546875, -0.115478515625, -0.1103515625, -0.105224609375, -0.10009765625, -0.094970703125, -0.08984375, -0.084716796875, -0.07958984375, -0.074462890625, -0.0693359375, -0.064208984375, -0.05908203125, -0.053955078125, -0.048828125, -0.043701171875, -0.03857421875, -0.033447265625, -0.0283203125, -0.023193359375, -0.01806640625, -0.012939453125, -0.0078125, -0.002685546875, 0.00244140625, 0.007568359375, 0.0126953125, 0.017822265625, 0.02294921875, 0.028076171875, 0.033203125, 0.038330078125, 0.04345703125, 0.048583984375, 0.0537109375, 0.058837890625, 0.06396484375, 0.069091796875, 0.07421875, 0.079345703125, 0.08447265625, 0.089599609375, 0.0947265625, 0.099853515625, 0.10498046875, 0.110107421875, 0.115234375, 0.120361328125, 0.12548828125, 0.130615234375, 0.1357421875, 0.140869140625, 0.14599609375, 0.151123046875, 0.15625, 0.161376953125, 0.16650390625, 0.171630859375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 9.0, 4.0, 3.0, 13.0, 9.0, 7.0, 10.0, 11.0, 50.0, 282.0, 383.0, 98.0, 19.0, 12.0, 8.0, 10.0, 10.0, 8.0, 4.0, 4.0, 6.0, 4.0, 5.0, 2.0, 3.0, 7.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01043701171875, -0.01009523868560791, -0.00975346565246582, -0.00941169261932373, -0.00906991958618164, -0.00872814655303955, -0.008386373519897461, -0.008044600486755371, -0.007702827453613281, -0.007361054420471191, -0.0070192813873291016, -0.006677508354187012, -0.006335735321044922, -0.005993962287902832, -0.005652189254760742, -0.005310416221618652, -0.0049686431884765625, -0.004626870155334473, -0.004285097122192383, -0.003943324089050293, -0.003601551055908203, -0.0032597780227661133, -0.0029180049896240234, -0.0025762319564819336, -0.0022344589233398438, -0.001892685890197754, -0.001550912857055664, -0.0012091398239135742, -0.0008673667907714844, -0.0005255937576293945, -0.0001838207244873047, 0.00015795230865478516, 0.000499725341796875, 0.0008414983749389648, 0.0011832714080810547, 0.0015250444412231445, 0.0018668174743652344, 0.0022085905075073242, 0.002550363540649414, 0.002892136573791504, 0.0032339096069335938, 0.0035756826400756836, 0.0039174556732177734, 0.004259228706359863, 0.004601001739501953, 0.004942774772644043, 0.005284547805786133, 0.005626320838928223, 0.0059680938720703125, 0.006309866905212402, 0.006651639938354492, 0.006993412971496582, 0.007335186004638672, 0.007676959037780762, 0.008018732070922852, 0.008360505104064941, 0.008702278137207031, 0.009044051170349121, 0.009385824203491211, 0.0097275972366333, 0.01006937026977539, 0.01041114330291748, 0.01075291633605957, 0.01109468936920166, 0.01143646240234375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 3.0, 2.0, 13.0, 8.0, 11.0, 6.0, 18.0, 21.0, 23.0, 43.0, 51.0, 71.0, 96.0, 152.0, 421.0, 2049.0, 4070474.0, 118211.0, 1677.0, 421.0, 149.0, 102.0, 63.0, 47.0, 34.0, 26.0, 18.0, 15.0, 8.0, 13.0, 9.0, 8.0, 4.0, 2.0, 1.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.121826171875, -0.11730384826660156, -0.11278152465820312, -0.10825920104980469, -0.10373687744140625, -0.09921455383300781, -0.09469223022460938, -0.09016990661621094, -0.0856475830078125, -0.08112525939941406, -0.07660293579101562, -0.07208061218261719, -0.06755828857421875, -0.06303596496582031, -0.058513641357421875, -0.05399131774902344, -0.049468994140625, -0.04494667053222656, -0.040424346923828125, -0.03590202331542969, -0.03137969970703125, -0.026857376098632812, -0.022335052490234375, -0.017812728881835938, -0.0132904052734375, -0.008768081665039062, -0.004245758056640625, 0.0002765655517578125, 0.00479888916015625, 0.009321212768554688, 0.013843536376953125, 0.018365859985351562, 0.02288818359375, 0.027410507202148438, 0.031932830810546875, 0.03645515441894531, 0.04097747802734375, 0.04549980163574219, 0.050022125244140625, 0.05454444885253906, 0.0590667724609375, 0.06358909606933594, 0.06811141967773438, 0.07263374328613281, 0.07715606689453125, 0.08167839050292969, 0.08620071411132812, 0.09072303771972656, 0.095245361328125, 0.09976768493652344, 0.10429000854492188, 0.10881233215332031, 0.11333465576171875, 0.11785697937011719, 0.12237930297851562, 0.12690162658691406, 0.1314239501953125, 0.13594627380371094, 0.14046859741210938, 0.1449909210205078, 0.14951324462890625, 0.1540355682373047, 0.15855789184570312, 0.16308021545410156, 0.1676025390625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 9.0, 9.0, 10.0, 14.0, 21.0, 14.0, 14.0, 36.0, 58.0, 132.0, 3195.0, 327.0, 65.0, 39.0, 21.0, 19.0, 16.0, 12.0, 7.0, 8.0, 6.0, 4.0, 5.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.017974853515625, -0.017302513122558594, -0.016630172729492188, -0.01595783233642578, -0.015285491943359375, -0.014613151550292969, -0.013940811157226562, -0.013268470764160156, -0.01259613037109375, -0.011923789978027344, -0.011251449584960938, -0.010579109191894531, -0.009906768798828125, -0.009234428405761719, -0.008562088012695312, -0.007889747619628906, -0.0072174072265625, -0.006545066833496094, -0.0058727264404296875, -0.005200386047363281, -0.004528045654296875, -0.0038557052612304688, -0.0031833648681640625, -0.0025110244750976562, -0.00183868408203125, -0.0011663436889648438, -0.0004940032958984375, 0.00017833709716796875, 0.000850677490234375, 0.0015230178833007812, 0.0021953582763671875, 0.0028676986694335938, 0.0035400390625, 0.004212379455566406, 0.0048847198486328125, 0.005557060241699219, 0.006229400634765625, 0.006901741027832031, 0.0075740814208984375, 0.008246421813964844, 0.00891876220703125, 0.009591102600097656, 0.010263442993164062, 0.010935783386230469, 0.011608123779296875, 0.012280464172363281, 0.012952804565429688, 0.013625144958496094, 0.0142974853515625, 0.014969825744628906, 0.015642166137695312, 0.01631450653076172, 0.016986846923828125, 0.01765918731689453, 0.018331527709960938, 0.019003868103027344, 0.01967620849609375, 0.020348548889160156, 0.021020889282226562, 0.02169322967529297, 0.022365570068359375, 0.02303791046142578, 0.023710250854492188, 0.024382591247558594, 0.025054931640625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 996.0, 14.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16822035610675812, -0.15810665488243103, -0.14799295365810394, -0.13787925243377686, -0.12776553630828857, -0.11765184253454208, -0.1075381338596344, -0.09742443263530731, -0.08731073141098022, -0.07719703018665314, -0.06708332896232605, -0.056969620287418365, -0.04685591906309128, -0.03674221783876419, -0.026628512889146805, -0.01651480793952942, -0.0064011067152023315, 0.003712596371769905, 0.013826299458742142, 0.02394000254571438, 0.034053705632686615, 0.0441674068570137, 0.05428111180663109, 0.06439481675624847, 0.07450851798057556, 0.08462221920490265, 0.09473592042922974, 0.10484962910413742, 0.11496333032846451, 0.1250770390033722, 0.13519074022769928, 0.14530444145202637, 0.15541812777519226, 0.16553182899951935, 0.17564553022384644, 0.18575923144817352, 0.1958729326725006, 0.2059866487979889, 0.21610035002231598, 0.22621405124664307, 0.23632775247097015, 0.24644145369529724, 0.2565551698207855, 0.2666688561439514, 0.2767825722694397, 0.2868962585926056, 0.29700997471809387, 0.30712366104125977, 0.31723737716674805, 0.32735109329223633, 0.3374647796154022, 0.3475784957408905, 0.3576921820640564, 0.3678058981895447, 0.37791958451271057, 0.38803330063819885, 0.39814698696136475, 0.408260703086853, 0.4183743894100189, 0.4284881055355072, 0.4386017918586731, 0.4487155079841614, 0.45882919430732727, 0.46894291043281555, 0.47905662655830383]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 5.0, 5.0, 6.0, 9.0, 10.0, 10.0, 16.0, 26.0, 27.0, 19.0, 35.0, 46.0, 50.0, 68.0, 45.0, 60.0, 67.0, 54.0, 59.0, 55.0, 61.0, 52.0, 29.0, 37.0, 27.0, 27.0, 29.0, 10.0, 14.0, 11.0, 10.0, 4.0, 3.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0648425817489624, -0.06285306811332703, -0.06086354702711105, -0.05887402966618538, -0.056884512305259705, -0.05489499494433403, -0.052905477583408356, -0.05091596022248268, -0.04892644286155701, -0.04693692550063133, -0.04494740813970566, -0.042957890778779984, -0.04096837341785431, -0.038978856056928635, -0.03698933869600296, -0.034999821335077286, -0.03301030397415161, -0.031020786613225937, -0.029031269252300262, -0.027041751891374588, -0.025052234530448914, -0.02306271716952324, -0.021073199808597565, -0.01908368244767189, -0.017094165086746216, -0.015104647725820541, -0.013115130364894867, -0.011125613003969193, -0.009136095643043518, -0.007146578282117844, -0.005157060921192169, -0.0031675435602664948, -0.0011780261993408203, 0.0008114911615848541, 0.0028010085225105286, 0.004790525883436203, 0.0067800432443618774, 0.008769560605287552, 0.010759077966213226, 0.0127485953271389, 0.014738112688064575, 0.01672763004899025, 0.018717147409915924, 0.0207066647708416, 0.022696182131767273, 0.024685699492692947, 0.026675216853618622, 0.028664734214544296, 0.03065425157546997, 0.032643768936395645, 0.03463328629732132, 0.036622803658246994, 0.03861232101917267, 0.04060183838009834, 0.04259135574102402, 0.04458087310194969, 0.046570390462875366, 0.04855990782380104, 0.050549425184726715, 0.05253894254565239, 0.054528459906578064, 0.05651797726750374, 0.05850749462842941, 0.06049701198935509, 0.06248652935028076]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 12.0, 13.0, 28.0, 41.0, 45.0, 86.0, 100.0, 183.0, 251.0, 384.0, 633.0, 1037.0, 1693.0, 2928.0, 5493.0, 11463.0, 30096.0, 875360.0, 83938.0, 17357.0, 7603.0, 4057.0, 2208.0, 1287.0, 787.0, 506.0, 315.0, 224.0, 134.0, 93.0, 61.0, 40.0, 27.0, 20.0, 11.0, 9.0, 7.0, 3.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03668212890625, -0.035594940185546875, -0.03450775146484375, -0.033420562744140625, -0.0323333740234375, -0.031246185302734375, -0.03015899658203125, -0.029071807861328125, -0.027984619140625, -0.026897430419921875, -0.02581024169921875, -0.024723052978515625, -0.0236358642578125, -0.022548675537109375, -0.02146148681640625, -0.020374298095703125, -0.019287109375, -0.018199920654296875, -0.01711273193359375, -0.016025543212890625, -0.0149383544921875, -0.013851165771484375, -0.01276397705078125, -0.011676788330078125, -0.010589599609375, -0.009502410888671875, -0.00841522216796875, -0.007328033447265625, -0.0062408447265625, -0.005153656005859375, -0.00406646728515625, -0.002979278564453125, -0.00189208984375, -0.000804901123046875, 0.00028228759765625, 0.001369476318359375, 0.0024566650390625, 0.003543853759765625, 0.00463104248046875, 0.005718231201171875, 0.006805419921875, 0.007892608642578125, 0.00897979736328125, 0.010066986083984375, 0.0111541748046875, 0.012241363525390625, 0.01332855224609375, 0.014415740966796875, 0.0155029296875, 0.016590118408203125, 0.01767730712890625, 0.018764495849609375, 0.0198516845703125, 0.020938873291015625, 0.02202606201171875, 0.023113250732421875, 0.024200439453125, 0.025287628173828125, 0.02637481689453125, 0.027462005615234375, 0.0285491943359375, 0.029636383056640625, 0.03072357177734375, 0.031810760498046875, 0.03289794921875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 5.0, 7.0, 3.0, 8.0, 8.0, 12.0, 9.0, 8.0, 18.0, 92.0, 354.0, 295.0, 67.0, 18.0, 7.0, 7.0, 15.0, 10.0, 5.0, 6.0, 3.0, 5.0, 5.0, 4.0, 2.0, 3.0, 7.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0098876953125, -0.00956106185913086, -0.009234428405761719, -0.008907794952392578, -0.008581161499023438, -0.008254528045654297, -0.007927894592285156, -0.007601261138916016, -0.007274627685546875, -0.006947994232177734, -0.006621360778808594, -0.006294727325439453, -0.0059680938720703125, -0.005641460418701172, -0.005314826965332031, -0.004988193511962891, -0.00466156005859375, -0.004334926605224609, -0.004008293151855469, -0.003681659698486328, -0.0033550262451171875, -0.003028392791748047, -0.0027017593383789062, -0.0023751258850097656, -0.002048492431640625, -0.0017218589782714844, -0.0013952255249023438, -0.0010685920715332031, -0.0007419586181640625, -0.0004153251647949219, -8.869171142578125e-05, 0.00023794174194335938, 0.0005645751953125, 0.0008912086486816406, 0.0012178421020507812, 0.0015444755554199219, 0.0018711090087890625, 0.002197742462158203, 0.0025243759155273438, 0.0028510093688964844, 0.003177642822265625, 0.0035042762756347656, 0.0038309097290039062, 0.004157543182373047, 0.0044841766357421875, 0.004810810089111328, 0.005137443542480469, 0.005464076995849609, 0.00579071044921875, 0.006117343902587891, 0.006443977355957031, 0.006770610809326172, 0.0070972442626953125, 0.007423877716064453, 0.007750511169433594, 0.008077144622802734, 0.008403778076171875, 0.008730411529541016, 0.009057044982910156, 0.009383678436279297, 0.009710311889648438, 0.010036945343017578, 0.010363578796386719, 0.01069021224975586, 0.011016845703125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 8.0, 11.0, 7.0, 11.0, 14.0, 21.0, 27.0, 25.0, 33.0, 37.0, 39.0, 55.0, 69.0, 69.0, 98.0, 104.0, 121.0, 190.0, 288.0, 488.0, 1301.0, 9873.0, 942326.0, 88509.0, 2662.0, 732.0, 357.0, 220.0, 160.0, 127.0, 103.0, 70.0, 76.0, 52.0, 59.0, 50.0, 41.0, 29.0, 22.0, 19.0, 10.0, 12.0, 15.0, 8.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0859375, -0.08339118957519531, -0.08084487915039062, -0.07829856872558594, -0.07575225830078125, -0.07320594787597656, -0.07065963745117188, -0.06811332702636719, -0.0655670166015625, -0.06302070617675781, -0.060474395751953125, -0.05792808532714844, -0.05538177490234375, -0.05283546447753906, -0.050289154052734375, -0.04774284362792969, -0.045196533203125, -0.04265022277832031, -0.040103912353515625, -0.03755760192871094, -0.03501129150390625, -0.03246498107910156, -0.029918670654296875, -0.027372360229492188, -0.0248260498046875, -0.022279739379882812, -0.019733428955078125, -0.017187118530273438, -0.01464080810546875, -0.012094497680664062, -0.009548187255859375, -0.0070018768310546875, -0.00445556640625, -0.0019092559814453125, 0.000637054443359375, 0.0031833648681640625, 0.00572967529296875, 0.008275985717773438, 0.010822296142578125, 0.013368606567382812, 0.0159149169921875, 0.018461227416992188, 0.021007537841796875, 0.023553848266601562, 0.02610015869140625, 0.028646469116210938, 0.031192779541015625, 0.03373908996582031, 0.036285400390625, 0.03883171081542969, 0.041378021240234375, 0.04392433166503906, 0.04647064208984375, 0.04901695251464844, 0.051563262939453125, 0.05410957336425781, 0.0566558837890625, 0.05920219421386719, 0.061748504638671875, 0.06429481506347656, 0.06684112548828125, 0.06938743591308594, 0.07193374633789062, 0.07448005676269531, 0.0770263671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 4.0, 1.0, 5.0, 4.0, 10.0, 8.0, 8.0, 12.0, 14.0, 9.0, 15.0, 17.0, 15.0, 35.0, 23.0, 31.0, 26.0, 31.0, 33.0, 38.0, 46.0, 27.0, 61.0, 48.0, 57.0, 47.0, 45.0, 39.0, 41.0, 42.0, 30.0, 28.0, 20.0, 24.0, 18.0, 17.0, 20.0, 17.0, 8.0, 6.0, 5.0, 7.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.03399658203125, -0.03305482864379883, -0.032113075256347656, -0.031171321868896484, -0.030229568481445312, -0.02928781509399414, -0.02834606170654297, -0.027404308319091797, -0.026462554931640625, -0.025520801544189453, -0.02457904815673828, -0.02363729476928711, -0.022695541381835938, -0.021753787994384766, -0.020812034606933594, -0.019870281219482422, -0.01892852783203125, -0.017986774444580078, -0.017045021057128906, -0.016103267669677734, -0.015161514282226562, -0.01421976089477539, -0.013278007507324219, -0.012336254119873047, -0.011394500732421875, -0.010452747344970703, -0.009510993957519531, -0.00856924057006836, -0.0076274871826171875, -0.006685733795166016, -0.005743980407714844, -0.004802227020263672, -0.0038604736328125, -0.002918720245361328, -0.0019769668579101562, -0.0010352134704589844, -9.34600830078125e-05, 0.0008482933044433594, 0.0017900466918945312, 0.002731800079345703, 0.003673553466796875, 0.004615306854248047, 0.005557060241699219, 0.006498813629150391, 0.0074405670166015625, 0.008382320404052734, 0.009324073791503906, 0.010265827178955078, 0.01120758056640625, 0.012149333953857422, 0.013091087341308594, 0.014032840728759766, 0.014974594116210938, 0.01591634750366211, 0.01685810089111328, 0.017799854278564453, 0.018741607666015625, 0.019683361053466797, 0.02062511444091797, 0.02156686782836914, 0.022508621215820312, 0.023450374603271484, 0.024392127990722656, 0.025333881378173828, 0.026275634765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 7.0, 2.0, 3.0, 3.0, 16.0, 17.0, 22.0, 33.0, 39.0, 78.0, 106.0, 204.0, 460.0, 1008.0, 3883.0, 218102.0, 817524.0, 4806.0, 1170.0, 462.0, 226.0, 130.0, 88.0, 43.0, 35.0, 23.0, 26.0, 9.0, 13.0, 9.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00015401840209960938, -0.00014974642544984818, -0.00014547444880008698, -0.00014120247215032578, -0.00013693049550056458, -0.00013265851885080338, -0.00012838654220104218, -0.00012411456555128098, -0.00011984258890151978, -0.00011557061225175858, -0.00011129863560199738, -0.00010702665895223618, -0.00010275468230247498, -9.848270565271378e-05, -9.421072900295258e-05, -8.993875235319138e-05, -8.566677570343018e-05, -8.139479905366898e-05, -7.712282240390778e-05, -7.285084575414658e-05, -6.857886910438538e-05, -6.430689245462418e-05, -6.0034915804862976e-05, -5.5762939155101776e-05, -5.1490962505340576e-05, -4.7218985855579376e-05, -4.2947009205818176e-05, -3.8675032556056976e-05, -3.4403055906295776e-05, -3.0131079256534576e-05, -2.5859102606773376e-05, -2.1587125957012177e-05, -1.7315149307250977e-05, -1.3043172657489777e-05, -8.771196007728577e-06, -4.499219357967377e-06, -2.2724270820617676e-07, 4.044733941555023e-06, 8.316710591316223e-06, 1.2588687241077423e-05, 1.6860663890838623e-05, 2.1132640540599823e-05, 2.5404617190361023e-05, 2.9676593840122223e-05, 3.394857048988342e-05, 3.822054713964462e-05, 4.249252378940582e-05, 4.676450043916702e-05, 5.103647708892822e-05, 5.530845373868942e-05, 5.958043038845062e-05, 6.385240703821182e-05, 6.812438368797302e-05, 7.239636033773422e-05, 7.666833698749542e-05, 8.094031363725662e-05, 8.521229028701782e-05, 8.948426693677902e-05, 9.375624358654022e-05, 9.802822023630142e-05, 0.00010230019688606262, 0.00010657217353582382, 0.00011084415018558502, 0.00011511612683534622, 0.00011938810348510742]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 4.0, 6.0, 7.0, 5.0, 11.0, 11.0, 29.0, 22.0, 21.0, 35.0, 41.0, 43.0, 42.0, 68.0, 63.0, 67.0, 74.0, 80.0, 75.0, 54.0, 47.0, 22.0, 36.0, 29.0, 18.0, 21.0, 14.0, 11.0, 10.0, 12.0, 6.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.874301910400391e-06, -3.702007234096527e-06, -3.5297125577926636e-06, -3.3574178814888e-06, -3.1851232051849365e-06, -3.012828528881073e-06, -2.8405338525772095e-06, -2.668239176273346e-06, -2.4959444999694824e-06, -2.323649823665619e-06, -2.1513551473617554e-06, -1.979060471057892e-06, -1.8067657947540283e-06, -1.6344711184501648e-06, -1.4621764421463013e-06, -1.2898817658424377e-06, -1.1175870895385742e-06, -9.452924132347107e-07, -7.729977369308472e-07, -6.007030606269836e-07, -4.284083843231201e-07, -2.561137080192566e-07, -8.381903171539307e-08, 8.847564458847046e-08, 2.60770320892334e-07, 4.330649971961975e-07, 6.05359673500061e-07, 7.776543498039246e-07, 9.499490261077881e-07, 1.1222437024116516e-06, 1.2945383787155151e-06, 1.4668330550193787e-06, 1.6391277313232422e-06, 1.8114224076271057e-06, 1.9837170839309692e-06, 2.1560117602348328e-06, 2.3283064365386963e-06, 2.50060111284256e-06, 2.6728957891464233e-06, 2.845190465450287e-06, 3.0174851417541504e-06, 3.189779818058014e-06, 3.3620744943618774e-06, 3.534369170665741e-06, 3.7066638469696045e-06, 3.878958523273468e-06, 4.0512531995773315e-06, 4.223547875881195e-06, 4.395842552185059e-06, 4.568137228488922e-06, 4.740431904792786e-06, 4.912726581096649e-06, 5.085021257400513e-06, 5.257315933704376e-06, 5.42961061000824e-06, 5.601905286312103e-06, 5.774199962615967e-06, 5.94649463891983e-06, 6.118789315223694e-06, 6.291083991527557e-06, 6.463378667831421e-06, 6.6356733441352844e-06, 6.807968020439148e-06, 6.9802626967430115e-06, 7.152557373046875e-06]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 6.0, 4.0, 12.0, 22.0, 26.0, 37.0, 62.0, 127.0, 203.0, 441.0, 2022.0, 1026259.0, 17815.0, 820.0, 285.0, 152.0, 92.0, 64.0, 32.0, 29.0, 11.0, 4.0, 5.0, 3.0, 4.0, 5.0, 8.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00019228458404541016, -0.0001865886151790619, -0.00018089264631271362, -0.00017519667744636536, -0.0001695007085800171, -0.00016380473971366882, -0.00015810877084732056, -0.0001524128019809723, -0.00014671683311462402, -0.00014102086424827576, -0.0001353248953819275, -0.00012962892651557922, -0.00012393295764923096, -0.00011823698878288269, -0.00011254101991653442, -0.00010684505105018616, -0.00010114908218383789, -9.545311331748962e-05, -8.975714445114136e-05, -8.406117558479309e-05, -7.836520671844482e-05, -7.266923785209656e-05, -6.697326898574829e-05, -6.127730011940002e-05, -5.558133125305176e-05, -4.988536238670349e-05, -4.4189393520355225e-05, -3.849342465400696e-05, -3.279745578765869e-05, -2.7101486921310425e-05, -2.1405518054962158e-05, -1.570954918861389e-05, -1.0013580322265625e-05, -4.317611455917358e-06, 1.3783574104309082e-06, 7.074326276779175e-06, 1.2770295143127441e-05, 1.8466264009475708e-05, 2.4162232875823975e-05, 2.985820174217224e-05, 3.555417060852051e-05, 4.1250139474868774e-05, 4.694610834121704e-05, 5.264207720756531e-05, 5.8338046073913574e-05, 6.403401494026184e-05, 6.972998380661011e-05, 7.542595267295837e-05, 8.112192153930664e-05, 8.681789040565491e-05, 9.251385927200317e-05, 9.820982813835144e-05, 0.00010390579700469971, 0.00010960176587104797, 0.00011529773473739624, 0.00012099370360374451, 0.00012668967247009277, 0.00013238564133644104, 0.0001380816102027893, 0.00014377757906913757, 0.00014947354793548584, 0.0001551695168018341, 0.00016086548566818237, 0.00016656145453453064, 0.0001722574234008789]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 8.0, 10.0, 10.0, 19.0, 41.0, 56.0, 96.0, 142.0, 167.0, 160.0, 97.0, 72.0, 36.0, 32.0, 22.0, 11.0, 10.0, 4.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.617473602294922e-05, -7.397308945655823e-05, -7.177144289016724e-05, -6.956979632377625e-05, -6.736814975738525e-05, -6.516650319099426e-05, -6.296485662460327e-05, -6.076321005821228e-05, -5.856156349182129e-05, -5.63599169254303e-05, -5.415827035903931e-05, -5.1956623792648315e-05, -4.9754977226257324e-05, -4.755333065986633e-05, -4.535168409347534e-05, -4.315003752708435e-05, -4.094839096069336e-05, -3.874674439430237e-05, -3.654509782791138e-05, -3.4343451261520386e-05, -3.2141804695129395e-05, -2.9940158128738403e-05, -2.7738511562347412e-05, -2.553686499595642e-05, -2.333521842956543e-05, -2.113357186317444e-05, -1.8931925296783447e-05, -1.6730278730392456e-05, -1.4528632164001465e-05, -1.2326985597610474e-05, -1.0125339031219482e-05, -7.923692464828491e-06, -5.7220458984375e-06, -3.520399332046509e-06, -1.3187527656555176e-06, 8.828938007354736e-07, 3.084540367126465e-06, 5.286186933517456e-06, 7.487833499908447e-06, 9.689480066299438e-06, 1.189112663269043e-05, 1.4092773199081421e-05, 1.6294419765472412e-05, 1.8496066331863403e-05, 2.0697712898254395e-05, 2.2899359464645386e-05, 2.5101006031036377e-05, 2.7302652597427368e-05, 2.950429916381836e-05, 3.170594573020935e-05, 3.390759229660034e-05, 3.610923886299133e-05, 3.8310885429382324e-05, 4.0512531995773315e-05, 4.271417856216431e-05, 4.49158251285553e-05, 4.711747169494629e-05, 4.931911826133728e-05, 5.152076482772827e-05, 5.372241139411926e-05, 5.5924057960510254e-05, 5.8125704526901245e-05, 6.0327351093292236e-05, 6.252899765968323e-05, 6.473064422607422e-05]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 6.0, 27.0, 774.0, 193.0, 14.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04335526376962662, -0.031961411237716675, -0.020567556843161583, -0.009173702448606491, 0.0022201500833034515, 0.013614002615213394, 0.025007858872413635, 0.03640171140432358, 0.04779556393623352, 0.05918941646814346, 0.0705832690000534, 0.08197712898254395, 0.09337097406387329, 0.10476483404636383, 0.11615868657827377, 0.12755253911018372, 0.13894638419151306, 0.1503402441740036, 0.16173408925533295, 0.1731279492378235, 0.18452179431915283, 0.19591565430164337, 0.2073095142841339, 0.21870335936546326, 0.2300972193479538, 0.24149107933044434, 0.2528849244117737, 0.264278769493103, 0.27567264437675476, 0.2870664894580841, 0.29846033453941345, 0.3098542094230652, 0.32124802470207214, 0.3326418697834015, 0.3440357446670532, 0.35542958974838257, 0.3668234348297119, 0.37821727991104126, 0.389611154794693, 0.40100499987602234, 0.4123988449573517, 0.42379269003868103, 0.43518656492233276, 0.4465804100036621, 0.45797425508499146, 0.4693681001663208, 0.48076197504997253, 0.4921558201313019, 0.5035496950149536, 0.514943540096283, 0.5263373851776123, 0.5377312302589417, 0.5491251349449158, 0.5605189800262451, 0.5719128251075745, 0.5833066701889038, 0.5947005152702332, 0.6060943603515625, 0.6174882054328918, 0.6288820505142212, 0.6402759552001953, 0.6516698002815247, 0.663063645362854, 0.6744574904441833, 0.6858513355255127]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 5.0, 1.0, 3.0, 8.0, 7.0, 11.0, 13.0, 8.0, 20.0, 23.0, 33.0, 27.0, 35.0, 27.0, 45.0, 54.0, 49.0, 47.0, 44.0, 58.0, 42.0, 52.0, 60.0, 53.0, 47.0, 40.0, 43.0, 35.0, 28.0, 24.0, 15.0, 9.0, 14.0, 6.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2533220052719116, -0.24554792046546936, -0.2377738356590271, -0.22999975085258484, -0.22222565114498138, -0.21445156633853912, -0.20667748153209686, -0.1989033967256546, -0.19112929701805115, -0.1833552122116089, -0.17558112740516663, -0.16780704259872437, -0.1600329428911209, -0.15225885808467865, -0.1444847732782364, -0.13671068847179413, -0.12893660366535187, -0.1211625188589096, -0.11338842660188675, -0.10561434179544449, -0.09784024953842163, -0.09006616473197937, -0.08229207992553711, -0.07451799511909485, -0.06674390286207199, -0.05896981433033943, -0.05119572579860687, -0.04342164099216461, -0.03564755246043205, -0.027873463928699493, -0.020099379122257233, -0.012325290590524673, -0.004551202058792114, 0.0032228855416178703, 0.010996973142027855, 0.018771059811115265, 0.026545148342847824, 0.03431923687458038, 0.042093321681022644, 0.0498674102127552, 0.05764149874448776, 0.06541558355093002, 0.07318967580795288, 0.08096376061439514, 0.0887378454208374, 0.09651193767786026, 0.10428602248430252, 0.11206011474132538, 0.11983419954776764, 0.1276082843542099, 0.13538236916065216, 0.14315646886825562, 0.15093055367469788, 0.15870463848114014, 0.1664787232875824, 0.17425280809402466, 0.18202689290046692, 0.18980097770690918, 0.19757506251335144, 0.2053491473197937, 0.21312324702739716, 0.22089733183383942, 0.22867141664028168, 0.23644550144672394, 0.2442196011543274]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 7.0, 3.0, 9.0, 6.0, 14.0, 12.0, 33.0, 28.0, 52.0, 66.0, 115.0, 128.0, 219.0, 325.0, 624.0, 1298.0, 18874.0, 4156866.0, 11910.0, 1524.0, 690.0, 401.0, 305.0, 207.0, 153.0, 107.0, 74.0, 60.0, 44.0, 35.0, 17.0, 21.0, 10.0, 19.0, 5.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.037506103515625, -0.03627634048461914, -0.03504657745361328, -0.03381681442260742, -0.03258705139160156, -0.0313572883605957, -0.030127525329589844, -0.028897762298583984, -0.027667999267578125, -0.026438236236572266, -0.025208473205566406, -0.023978710174560547, -0.022748947143554688, -0.021519184112548828, -0.02028942108154297, -0.01905965805053711, -0.01782989501953125, -0.01660013198852539, -0.015370368957519531, -0.014140605926513672, -0.012910842895507812, -0.011681079864501953, -0.010451316833496094, -0.009221553802490234, -0.007991790771484375, -0.006762027740478516, -0.005532264709472656, -0.004302501678466797, -0.0030727386474609375, -0.0018429756164550781, -0.0006132125854492188, 0.0006165504455566406, 0.0018463134765625, 0.0030760765075683594, 0.004305839538574219, 0.005535602569580078, 0.0067653656005859375, 0.007995128631591797, 0.009224891662597656, 0.010454654693603516, 0.011684417724609375, 0.012914180755615234, 0.014143943786621094, 0.015373706817626953, 0.016603469848632812, 0.017833232879638672, 0.01906299591064453, 0.02029275894165039, 0.02152252197265625, 0.02275228500366211, 0.02398204803466797, 0.025211811065673828, 0.026441574096679688, 0.027671337127685547, 0.028901100158691406, 0.030130863189697266, 0.031360626220703125, 0.032590389251708984, 0.033820152282714844, 0.0350499153137207, 0.03627967834472656, 0.03750944137573242, 0.03873920440673828, 0.03996896743774414, 0.04119873046875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 4.0, 4.0, 13.0, 10.0, 6.0, 9.0, 17.0, 51.0, 243.0, 369.0, 128.0, 28.0, 14.0, 9.0, 12.0, 12.0, 8.0, 4.0, 4.0, 5.0, 4.0, 4.0, 2.0, 3.0, 4.0, 9.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00970458984375, -0.009387731552124023, -0.009070873260498047, -0.00875401496887207, -0.008437156677246094, -0.008120298385620117, -0.007803440093994141, -0.007486581802368164, -0.0071697235107421875, -0.006852865219116211, -0.006536006927490234, -0.006219148635864258, -0.005902290344238281, -0.005585432052612305, -0.005268573760986328, -0.0049517154693603516, -0.004634857177734375, -0.0043179988861083984, -0.004001140594482422, -0.0036842823028564453, -0.0033674240112304688, -0.003050565719604492, -0.0027337074279785156, -0.002416849136352539, -0.0020999908447265625, -0.001783132553100586, -0.0014662742614746094, -0.0011494159698486328, -0.0008325576782226562, -0.0005156993865966797, -0.00019884109497070312, 0.00011801719665527344, 0.00043487548828125, 0.0007517337799072266, 0.0010685920715332031, 0.0013854503631591797, 0.0017023086547851562, 0.002019166946411133, 0.0023360252380371094, 0.002652883529663086, 0.0029697418212890625, 0.003286600112915039, 0.0036034584045410156, 0.003920316696166992, 0.004237174987792969, 0.004554033279418945, 0.004870891571044922, 0.0051877498626708984, 0.005504608154296875, 0.0058214664459228516, 0.006138324737548828, 0.006455183029174805, 0.006772041320800781, 0.007088899612426758, 0.007405757904052734, 0.007722616195678711, 0.008039474487304688, 0.008356332778930664, 0.00867319107055664, 0.008990049362182617, 0.009306907653808594, 0.00962376594543457, 0.009940624237060547, 0.010257482528686523, 0.0105743408203125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 6.0, 5.0, 3.0, 6.0, 10.0, 7.0, 9.0, 12.0, 7.0, 15.0, 14.0, 21.0, 37.0, 53.0, 88.0, 154.0, 463.0, 2731.0, 4061645.0, 126088.0, 2112.0, 356.0, 174.0, 59.0, 39.0, 42.0, 24.0, 16.0, 19.0, 12.0, 15.0, 3.0, 10.0, 5.0, 3.0, 3.0, 6.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0826416015625, -0.0799713134765625, -0.077301025390625, -0.0746307373046875, -0.07196044921875, -0.0692901611328125, -0.066619873046875, -0.0639495849609375, -0.061279296875, -0.0586090087890625, -0.055938720703125, -0.0532684326171875, -0.05059814453125, -0.0479278564453125, -0.045257568359375, -0.0425872802734375, -0.0399169921875, -0.0372467041015625, -0.034576416015625, -0.0319061279296875, -0.02923583984375, -0.0265655517578125, -0.023895263671875, -0.0212249755859375, -0.0185546875, -0.0158843994140625, -0.013214111328125, -0.0105438232421875, -0.00787353515625, -0.0052032470703125, -0.002532958984375, 0.0001373291015625, 0.0028076171875, 0.0054779052734375, 0.008148193359375, 0.0108184814453125, 0.01348876953125, 0.0161590576171875, 0.018829345703125, 0.0214996337890625, 0.024169921875, 0.0268402099609375, 0.029510498046875, 0.0321807861328125, 0.03485107421875, 0.0375213623046875, 0.040191650390625, 0.0428619384765625, 0.0455322265625, 0.0482025146484375, 0.050872802734375, 0.0535430908203125, 0.05621337890625, 0.0588836669921875, 0.061553955078125, 0.0642242431640625, 0.06689453125, 0.0695648193359375, 0.072235107421875, 0.0749053955078125, 0.07757568359375, 0.0802459716796875, 0.082916259765625, 0.0855865478515625, 0.0882568359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 13.0, 11.0, 7.0, 21.0, 50.0, 73.0, 457.0, 3149.0, 135.0, 58.0, 20.0, 12.0, 5.0, 5.0, 6.0, 7.0, 5.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.016998291015625, -0.01648545265197754, -0.015972614288330078, -0.015459775924682617, -0.014946937561035156, -0.014434099197387695, -0.013921260833740234, -0.013408422470092773, -0.012895584106445312, -0.012382745742797852, -0.01186990737915039, -0.01135706901550293, -0.010844230651855469, -0.010331392288208008, -0.009818553924560547, -0.009305715560913086, -0.008792877197265625, -0.008280038833618164, -0.007767200469970703, -0.007254362106323242, -0.006741523742675781, -0.00622868537902832, -0.005715847015380859, -0.0052030086517333984, -0.0046901702880859375, -0.0041773319244384766, -0.0036644935607910156, -0.0031516551971435547, -0.0026388168334960938, -0.002125978469848633, -0.0016131401062011719, -0.001100301742553711, -0.00058746337890625, -7.462501525878906e-05, 0.0004382133483886719, 0.0009510517120361328, 0.0014638900756835938, 0.0019767284393310547, 0.0024895668029785156, 0.0030024051666259766, 0.0035152435302734375, 0.0040280818939208984, 0.004540920257568359, 0.00505375862121582, 0.005566596984863281, 0.006079435348510742, 0.006592273712158203, 0.007105112075805664, 0.007617950439453125, 0.008130788803100586, 0.008643627166748047, 0.009156465530395508, 0.009669303894042969, 0.01018214225769043, 0.01069498062133789, 0.011207818984985352, 0.011720657348632812, 0.012233495712280273, 0.012746334075927734, 0.013259172439575195, 0.013772010803222656, 0.014284849166870117, 0.014797687530517578, 0.015310525894165039, 0.0158233642578125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 960.0, 50.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.26537030935287476, -0.2606084942817688, -0.25584667921066284, -0.2510848939418793, -0.24632307887077332, -0.24156126379966736, -0.2367994636297226, -0.23203766345977783, -0.22727584838867188, -0.22251403331756592, -0.21775223314762115, -0.2129904329776764, -0.20822861790657043, -0.20346680283546448, -0.19870500266551971, -0.19394320249557495, -0.189181387424469, -0.18441957235336304, -0.17965777218341827, -0.1748959720134735, -0.17013415694236755, -0.1653723418712616, -0.16061054170131683, -0.15584874153137207, -0.1510869264602661, -0.14632511138916016, -0.1415633112192154, -0.13680151104927063, -0.13203969597816467, -0.12727788090705872, -0.12251608073711395, -0.11775427311658859, -0.11299246549606323, -0.10823065787553787, -0.10346885025501251, -0.09870704263448715, -0.09394523501396179, -0.08918342739343643, -0.08442161977291107, -0.07965981215238571, -0.07489800453186035, -0.07013619691133499, -0.06537438929080963, -0.06061258167028427, -0.05585077404975891, -0.05108896642923355, -0.04632715880870819, -0.04156535118818283, -0.03680354356765747, -0.03204173594713211, -0.02727992832660675, -0.02251812070608139, -0.01775631308555603, -0.01299450546503067, -0.00823269784450531, -0.00347089022397995, 0.0012909173965454102, 0.00605272501707077, 0.01081453263759613, 0.01557634025812149, 0.02033814787864685, 0.02509995549917221, 0.02986176311969757, 0.03462357074022293, 0.03938537836074829]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 9.0, 5.0, 12.0, 12.0, 18.0, 21.0, 24.0, 25.0, 36.0, 37.0, 39.0, 41.0, 50.0, 56.0, 64.0, 54.0, 70.0, 67.0, 57.0, 45.0, 37.0, 38.0, 44.0, 30.0, 24.0, 23.0, 12.0, 13.0, 18.0, 8.0, 5.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0466805100440979, -0.04540916532278061, -0.04413782060146332, -0.042866479605436325, -0.041595134884119034, -0.04032379016280174, -0.03905244916677475, -0.03778110444545746, -0.03650975972414017, -0.035238415002822876, -0.033967070281505585, -0.03269572928547859, -0.0314243845641613, -0.03015303984284401, -0.028881696984171867, -0.027610354125499725, -0.026339009404182434, -0.025067664682865143, -0.023796321824193, -0.02252497896552086, -0.021253634244203568, -0.019982289522886276, -0.018710946664214134, -0.017439603805541992, -0.0161682590842247, -0.014896915294229984, -0.013625571504235268, -0.012354227714240551, -0.011082883924245834, -0.009811540134251118, -0.008540196344256401, -0.007268852554261684, -0.005997508764266968, -0.004726164974272251, -0.0034548211842775345, -0.002183477394282818, -0.0009121336042881012, 0.00035921018570661545, 0.001630553975701332, 0.0029018977656960487, 0.004173241555690765, 0.005444585345685482, 0.006715929135680199, 0.007987272925674915, 0.009258616715669632, 0.010529960505664349, 0.011801304295659065, 0.013072648085653782, 0.014343991875648499, 0.015615335665643215, 0.016886679455637932, 0.018158022314310074, 0.019429367035627365, 0.020700711756944656, 0.0219720546156168, 0.02324339747428894, 0.02451474219560623, 0.025786086916923523, 0.027057429775595665, 0.028328772634267807, 0.0296001173555851, 0.03087146207690239, 0.03214280307292938, 0.033414147794246674, 0.034685492515563965]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 10.0, 8.0, 12.0, 16.0, 20.0, 32.0, 37.0, 54.0, 64.0, 109.0, 135.0, 172.0, 275.0, 382.0, 546.0, 817.0, 1203.0, 1854.0, 3010.0, 5184.0, 9521.0, 21327.0, 190503.0, 759489.0, 27116.0, 11110.0, 5805.0, 3389.0, 2099.0, 1396.0, 862.0, 580.0, 422.0, 272.0, 205.0, 153.0, 95.0, 71.0, 53.0, 43.0, 27.0, 19.0, 15.0, 13.0, 9.0, 5.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0216217041015625, -0.020926713943481445, -0.02023172378540039, -0.019536733627319336, -0.01884174346923828, -0.018146753311157227, -0.017451763153076172, -0.016756772994995117, -0.016061782836914062, -0.015366792678833008, -0.014671802520751953, -0.013976812362670898, -0.013281822204589844, -0.012586832046508789, -0.011891841888427734, -0.01119685173034668, -0.010501861572265625, -0.00980687141418457, -0.009111881256103516, -0.008416891098022461, -0.007721900939941406, -0.0070269107818603516, -0.006331920623779297, -0.005636930465698242, -0.0049419403076171875, -0.004246950149536133, -0.003551959991455078, -0.0028569698333740234, -0.0021619796752929688, -0.001466989517211914, -0.0007719993591308594, -7.700920104980469e-05, 0.00061798095703125, 0.0013129711151123047, 0.0020079612731933594, 0.002702951431274414, 0.0033979415893554688, 0.0040929317474365234, 0.004787921905517578, 0.005482912063598633, 0.0061779022216796875, 0.006872892379760742, 0.007567882537841797, 0.008262872695922852, 0.008957862854003906, 0.009652853012084961, 0.010347843170166016, 0.01104283332824707, 0.011737823486328125, 0.01243281364440918, 0.013127803802490234, 0.013822793960571289, 0.014517784118652344, 0.015212774276733398, 0.015907764434814453, 0.016602754592895508, 0.017297744750976562, 0.017992734909057617, 0.018687725067138672, 0.019382715225219727, 0.02007770538330078, 0.020772695541381836, 0.02146768569946289, 0.022162675857543945, 0.022857666015625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 0.0, 7.0, 5.0, 4.0, 5.0, 14.0, 6.0, 8.0, 9.0, 20.0, 61.0, 253.0, 357.0, 117.0, 27.0, 14.0, 9.0, 9.0, 14.0, 8.0, 6.0, 2.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 9.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00946807861328125, -0.009158492088317871, -0.008848905563354492, -0.008539319038391113, -0.008229732513427734, -0.007920145988464355, -0.0076105594635009766, -0.007300972938537598, -0.006991386413574219, -0.00668179988861084, -0.006372213363647461, -0.006062626838684082, -0.005753040313720703, -0.005443453788757324, -0.005133867263793945, -0.004824280738830566, -0.0045146942138671875, -0.004205107688903809, -0.0038955211639404297, -0.0035859346389770508, -0.003276348114013672, -0.002966761589050293, -0.002657175064086914, -0.002347588539123535, -0.0020380020141601562, -0.0017284154891967773, -0.0014188289642333984, -0.0011092424392700195, -0.0007996559143066406, -0.0004900693893432617, -0.0001804828643798828, 0.0001291036605834961, 0.000438690185546875, 0.0007482767105102539, 0.0010578632354736328, 0.0013674497604370117, 0.0016770362854003906, 0.0019866228103637695, 0.0022962093353271484, 0.0026057958602905273, 0.0029153823852539062, 0.003224968910217285, 0.003534555435180664, 0.003844141960144043, 0.004153728485107422, 0.004463315010070801, 0.00477290153503418, 0.005082488059997559, 0.0053920745849609375, 0.005701661109924316, 0.006011247634887695, 0.006320834159851074, 0.006630420684814453, 0.006940007209777832, 0.007249593734741211, 0.00755918025970459, 0.007868766784667969, 0.008178353309631348, 0.008487939834594727, 0.008797526359558105, 0.009107112884521484, 0.009416699409484863, 0.009726285934448242, 0.010035872459411621, 0.010345458984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 2.0, 6.0, 5.0, 7.0, 14.0, 12.0, 15.0, 25.0, 25.0, 21.0, 28.0, 46.0, 40.0, 64.0, 73.0, 92.0, 92.0, 146.0, 191.0, 254.0, 362.0, 668.0, 1702.0, 11452.0, 927394.0, 99224.0, 3734.0, 1054.0, 499.0, 295.0, 207.0, 155.0, 119.0, 91.0, 90.0, 61.0, 54.0, 54.0, 30.0, 23.0, 27.0, 23.0, 18.0, 15.0, 14.0, 8.0, 4.0, 9.0, 3.0, 8.0, 1.0, 2.0, 0.0, 0.0, 5.0], "bins": [-0.0621337890625, -0.06029367446899414, -0.05845355987548828, -0.05661344528198242, -0.05477333068847656, -0.0529332160949707, -0.051093101501464844, -0.049252986907958984, -0.047412872314453125, -0.045572757720947266, -0.043732643127441406, -0.04189252853393555, -0.04005241394042969, -0.03821229934692383, -0.03637218475341797, -0.03453207015991211, -0.03269195556640625, -0.03085184097290039, -0.02901172637939453, -0.027171611785888672, -0.025331497192382812, -0.023491382598876953, -0.021651268005371094, -0.019811153411865234, -0.017971038818359375, -0.016130924224853516, -0.014290809631347656, -0.012450695037841797, -0.010610580444335938, -0.008770465850830078, -0.006930351257324219, -0.005090236663818359, -0.0032501220703125, -0.0014100074768066406, 0.00043010711669921875, 0.002270221710205078, 0.0041103363037109375, 0.005950450897216797, 0.007790565490722656, 0.009630680084228516, 0.011470794677734375, 0.013310909271240234, 0.015151023864746094, 0.016991138458251953, 0.018831253051757812, 0.020671367645263672, 0.02251148223876953, 0.02435159683227539, 0.02619171142578125, 0.02803182601928711, 0.02987194061279297, 0.03171205520629883, 0.03355216979980469, 0.03539228439331055, 0.037232398986816406, 0.039072513580322266, 0.040912628173828125, 0.042752742767333984, 0.044592857360839844, 0.0464329719543457, 0.04827308654785156, 0.05011320114135742, 0.05195331573486328, 0.05379343032836914, 0.055633544921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 7.0, 5.0, 8.0, 9.0, 9.0, 9.0, 18.0, 11.0, 24.0, 20.0, 22.0, 37.0, 38.0, 36.0, 54.0, 31.0, 38.0, 57.0, 45.0, 47.0, 30.0, 43.0, 35.0, 48.0, 27.0, 40.0, 28.0, 36.0, 24.0, 21.0, 21.0, 22.0, 17.0, 15.0, 9.0, 13.0, 3.0, 6.0, 7.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.030426025390625, -0.029525041580200195, -0.02862405776977539, -0.027723073959350586, -0.02682209014892578, -0.025921106338500977, -0.025020122528076172, -0.024119138717651367, -0.023218154907226562, -0.022317171096801758, -0.021416187286376953, -0.02051520347595215, -0.019614219665527344, -0.01871323585510254, -0.017812252044677734, -0.01691126823425293, -0.016010284423828125, -0.01510930061340332, -0.014208316802978516, -0.013307332992553711, -0.012406349182128906, -0.011505365371704102, -0.010604381561279297, -0.009703397750854492, -0.008802413940429688, -0.007901430130004883, -0.007000446319580078, -0.0060994625091552734, -0.005198478698730469, -0.004297494888305664, -0.0033965110778808594, -0.0024955272674560547, -0.00159454345703125, -0.0006935596466064453, 0.00020742416381835938, 0.001108407974243164, 0.0020093917846679688, 0.0029103755950927734, 0.003811359405517578, 0.004712343215942383, 0.0056133270263671875, 0.006514310836791992, 0.007415294647216797, 0.008316278457641602, 0.009217262268066406, 0.010118246078491211, 0.011019229888916016, 0.01192021369934082, 0.012821197509765625, 0.01372218132019043, 0.014623165130615234, 0.015524148941040039, 0.016425132751464844, 0.01732611656188965, 0.018227100372314453, 0.019128084182739258, 0.020029067993164062, 0.020930051803588867, 0.021831035614013672, 0.022732019424438477, 0.02363300323486328, 0.024533987045288086, 0.02543497085571289, 0.026335954666137695, 0.0272369384765625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 2.0, 6.0, 9.0, 2.0, 12.0, 10.0, 18.0, 29.0, 37.0, 52.0, 69.0, 130.0, 157.0, 258.0, 462.0, 897.0, 2644.0, 13507.0, 881742.0, 137882.0, 6927.0, 1820.0, 779.0, 401.0, 219.0, 146.0, 95.0, 73.0, 45.0, 24.0, 24.0, 11.0, 23.0, 9.0, 9.0, 2.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0471553802490234e-05, -3.9159320294857025e-05, -3.7847086787223816e-05, -3.653485327959061e-05, -3.52226197719574e-05, -3.391038626432419e-05, -3.259815275669098e-05, -3.128591924905777e-05, -2.997368574142456e-05, -2.866145223379135e-05, -2.7349218726158142e-05, -2.6036985218524933e-05, -2.4724751710891724e-05, -2.3412518203258514e-05, -2.2100284695625305e-05, -2.0788051187992096e-05, -1.9475817680358887e-05, -1.8163584172725677e-05, -1.6851350665092468e-05, -1.553911715745926e-05, -1.422688364982605e-05, -1.291465014219284e-05, -1.1602416634559631e-05, -1.0290183126926422e-05, -8.977949619293213e-06, -7.665716111660004e-06, -6.3534826040267944e-06, -5.041249096393585e-06, -3.729015588760376e-06, -2.4167820811271667e-06, -1.1045485734939575e-06, 2.076849341392517e-07, 1.519918441772461e-06, 2.83215194940567e-06, 4.144385457038879e-06, 5.456618964672089e-06, 6.768852472305298e-06, 8.081085979938507e-06, 9.393319487571716e-06, 1.0705552995204926e-05, 1.2017786502838135e-05, 1.3330020010471344e-05, 1.4642253518104553e-05, 1.5954487025737762e-05, 1.726672053337097e-05, 1.857895404100418e-05, 1.989118754863739e-05, 2.12034210562706e-05, 2.251565456390381e-05, 2.3827888071537018e-05, 2.5140121579170227e-05, 2.6452355086803436e-05, 2.7764588594436646e-05, 2.9076822102069855e-05, 3.0389055609703064e-05, 3.170128911733627e-05, 3.301352262496948e-05, 3.432575613260269e-05, 3.56379896402359e-05, 3.695022314786911e-05, 3.826245665550232e-05, 3.957469016313553e-05, 4.088692367076874e-05, 4.219915717840195e-05, 4.3511390686035156e-05]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 8.0, 9.0, 15.0, 13.0, 10.0, 26.0, 35.0, 36.0, 31.0, 46.0, 47.0, 73.0, 60.0, 50.0, 76.0, 76.0, 59.0, 34.0, 45.0, 51.0, 46.0, 38.0, 23.0, 21.0, 16.0, 11.0, 5.0, 11.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.649162292480469e-06, -4.4833868741989136e-06, -4.317611455917358e-06, -4.151836037635803e-06, -3.986060619354248e-06, -3.820285201072693e-06, -3.6545097827911377e-06, -3.4887343645095825e-06, -3.3229589462280273e-06, -3.157183527946472e-06, -2.991408109664917e-06, -2.825632691383362e-06, -2.6598572731018066e-06, -2.4940818548202515e-06, -2.3283064365386963e-06, -2.162531018257141e-06, -1.996755599975586e-06, -1.8309801816940308e-06, -1.6652047634124756e-06, -1.4994293451309204e-06, -1.3336539268493652e-06, -1.16787850856781e-06, -1.0021030902862549e-06, -8.363276720046997e-07, -6.705522537231445e-07, -5.047768354415894e-07, -3.390014171600342e-07, -1.73225998878479e-07, -7.450580596923828e-09, 1.5832483768463135e-07, 3.241002559661865e-07, 4.898756742477417e-07, 6.556510925292969e-07, 8.21426510810852e-07, 9.872019290924072e-07, 1.1529773473739624e-06, 1.3187527656555176e-06, 1.4845281839370728e-06, 1.650303602218628e-06, 1.816079020500183e-06, 1.9818544387817383e-06, 2.1476298570632935e-06, 2.3134052753448486e-06, 2.479180693626404e-06, 2.644956111907959e-06, 2.810731530189514e-06, 2.9765069484710693e-06, 3.1422823667526245e-06, 3.3080577850341797e-06, 3.473833203315735e-06, 3.63960862159729e-06, 3.8053840398788452e-06, 3.9711594581604e-06, 4.1369348764419556e-06, 4.302710294723511e-06, 4.468485713005066e-06, 4.634261131286621e-06, 4.800036549568176e-06, 4.9658119678497314e-06, 5.131587386131287e-06, 5.297362804412842e-06, 5.463138222694397e-06, 5.628913640975952e-06, 5.794689059257507e-06, 5.9604644775390625e-06]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 9.0, 10.0, 15.0, 13.0, 26.0, 18.0, 41.0, 55.0, 105.0, 151.0, 252.0, 427.0, 1531.0, 65986.0, 975765.0, 2771.0, 577.0, 288.0, 169.0, 112.0, 72.0, 34.0, 33.0, 21.0, 18.0, 10.0, 9.0, 7.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.927417755126953e-05, -7.695145905017853e-05, -7.462874054908752e-05, -7.230602204799652e-05, -6.998330354690552e-05, -6.766058504581451e-05, -6.533786654472351e-05, -6.301514804363251e-05, -6.0692429542541504e-05, -5.83697110414505e-05, -5.60469925403595e-05, -5.3724274039268494e-05, -5.140155553817749e-05, -4.907883703708649e-05, -4.6756118535995483e-05, -4.443340003490448e-05, -4.2110681533813477e-05, -3.978796303272247e-05, -3.746524453163147e-05, -3.5142526030540466e-05, -3.281980752944946e-05, -3.049708902835846e-05, -2.8174370527267456e-05, -2.5851652026176453e-05, -2.352893352508545e-05, -2.1206215023994446e-05, -1.8883496522903442e-05, -1.656077802181244e-05, -1.4238059520721436e-05, -1.1915341019630432e-05, -9.592622518539429e-06, -7.269904017448425e-06, -4.947185516357422e-06, -2.6244670152664185e-06, -3.0174851417541504e-07, 2.0209699869155884e-06, 4.343688488006592e-06, 6.666406989097595e-06, 8.989125490188599e-06, 1.1311843991279602e-05, 1.3634562492370605e-05, 1.595728099346161e-05, 1.8279999494552612e-05, 2.0602717995643616e-05, 2.292543649673462e-05, 2.5248154997825623e-05, 2.7570873498916626e-05, 2.989359200000763e-05, 3.221631050109863e-05, 3.4539029002189636e-05, 3.686174750328064e-05, 3.918446600437164e-05, 4.1507184505462646e-05, 4.382990300655365e-05, 4.615262150764465e-05, 4.847534000873566e-05, 5.079805850982666e-05, 5.3120777010917664e-05, 5.544349551200867e-05, 5.776621401309967e-05, 6.0088932514190674e-05, 6.241165101528168e-05, 6.473436951637268e-05, 6.705708801746368e-05, 6.937980651855469e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 5.0, 11.0, 4.0, 13.0, 22.0, 27.0, 41.0, 46.0, 52.0, 96.0, 118.0, 148.0, 114.0, 74.0, 48.0, 51.0, 40.0, 18.0, 21.0, 12.0, 8.0, 5.0, 6.0, 2.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8743019104003906e-05, -3.764685243368149e-05, -3.655068576335907e-05, -3.545451909303665e-05, -3.4358352422714233e-05, -3.3262185752391815e-05, -3.21660190820694e-05, -3.106985241174698e-05, -2.997368574142456e-05, -2.8877519071102142e-05, -2.7781352400779724e-05, -2.6685185730457306e-05, -2.5589019060134888e-05, -2.449285238981247e-05, -2.339668571949005e-05, -2.2300519049167633e-05, -2.1204352378845215e-05, -2.0108185708522797e-05, -1.901201903820038e-05, -1.791585236787796e-05, -1.6819685697555542e-05, -1.5723519027233124e-05, -1.4627352356910706e-05, -1.3531185686588287e-05, -1.2435019016265869e-05, -1.1338852345943451e-05, -1.0242685675621033e-05, -9.146519005298615e-06, -8.050352334976196e-06, -6.954185664653778e-06, -5.85801899433136e-06, -4.761852324008942e-06, -3.6656856536865234e-06, -2.5695189833641052e-06, -1.473352313041687e-06, -3.771856427192688e-07, 7.189810276031494e-07, 1.8151476979255676e-06, 2.911314368247986e-06, 4.007481038570404e-06, 5.103647708892822e-06, 6.1998143792152405e-06, 7.295981049537659e-06, 8.392147719860077e-06, 9.488314390182495e-06, 1.0584481060504913e-05, 1.1680647730827332e-05, 1.277681440114975e-05, 1.3872981071472168e-05, 1.4969147741794586e-05, 1.6065314412117004e-05, 1.7161481082439423e-05, 1.825764775276184e-05, 1.935381442308426e-05, 2.0449981093406677e-05, 2.1546147763729095e-05, 2.2642314434051514e-05, 2.3738481104373932e-05, 2.483464777469635e-05, 2.593081444501877e-05, 2.7026981115341187e-05, 2.8123147785663605e-05, 2.9219314455986023e-05, 3.031548112630844e-05, 3.141164779663086e-05]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [12.0, 938.0, 64.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03425495699048042, -0.014300649985671043, 0.005653657019138336, 0.025607962161302567, 0.045562271028757095, 0.06551657617092133, 0.08547088503837585, 0.10542519390583038, 0.1253795027732849, 0.14533381164073944, 0.16528812050819397, 0.1852424144744873, 0.20519673824310303, 0.22515103220939636, 0.2451053410768509, 0.2650596499443054, 0.28501394391059875, 0.3049682378768921, 0.3249225616455078, 0.34487685561180115, 0.36483117938041687, 0.3847854733467102, 0.4047397971153259, 0.42469409108161926, 0.444648414850235, 0.4646027088165283, 0.48455703258514404, 0.5045113563537598, 0.5244656205177307, 0.5444199442863464, 0.5643742680549622, 0.5843285322189331, 0.6042829155921936, 0.6242372393608093, 0.6441915035247803, 0.664145827293396, 0.6841001510620117, 0.7040544748306274, 0.7240087389945984, 0.7439630627632141, 0.7639173865318298, 0.7838717103004456, 0.8038259744644165, 0.8237802982330322, 0.843734622001648, 0.8636889457702637, 0.8836432099342346, 0.9035975337028503, 0.9235517978668213, 0.943506121635437, 0.963460385799408, 0.9834147095680237, 1.0033689737319946, 1.0233232975006104, 1.043277621269226, 1.0632319450378418, 1.0831862688064575, 1.1031405925750732, 1.123094916343689, 1.1430492401123047, 1.1630034446716309, 1.1829577684402466, 1.2029120922088623, 1.222866415977478, 1.2428207397460938]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 6.0, 9.0, 12.0, 11.0, 14.0, 26.0, 31.0, 35.0, 50.0, 54.0, 42.0, 65.0, 76.0, 64.0, 77.0, 60.0, 67.0, 60.0, 55.0, 52.0, 36.0, 23.0, 20.0, 17.0, 16.0, 10.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2950636148452759, -0.2866082191467285, -0.27815282344818115, -0.2696973979473114, -0.26124200224876404, -0.2527866065502167, -0.24433119595050812, -0.23587578535079956, -0.2274203896522522, -0.21896499395370483, -0.21050958335399628, -0.20205417275428772, -0.19359877705574036, -0.185143381357193, -0.17668797075748444, -0.16823256015777588, -0.15977716445922852, -0.15132176876068115, -0.1428663581609726, -0.13441094756126404, -0.12595555186271667, -0.11750014871358871, -0.10904474556446075, -0.1005893424153328, -0.09213393926620483, -0.08367853611707687, -0.07522313296794891, -0.06676772981882095, -0.05831232666969299, -0.04985692352056503, -0.04140152037143707, -0.03294611722230911, -0.024490714073181152, -0.016035310924053192, -0.007579907774925232, 0.0008754953742027283, 0.009330898523330688, 0.01778630167245865, 0.02624170482158661, 0.03469710797071457, 0.04315251111984253, 0.05160791426897049, 0.06006331741809845, 0.06851872056722641, 0.07697412371635437, 0.08542952686548233, 0.09388493001461029, 0.10234033316373825, 0.11079573631286621, 0.11925113946199417, 0.12770654261112213, 0.1361619532108307, 0.14461734890937805, 0.15307274460792542, 0.16152815520763397, 0.16998356580734253, 0.1784389615058899, 0.18689435720443726, 0.1953497678041458, 0.20380517840385437, 0.21226057410240173, 0.2207159698009491, 0.22917138040065765, 0.2376267910003662, 0.24608218669891357]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 4.0, 7.0, 6.0, 5.0, 11.0, 10.0, 15.0, 15.0, 25.0, 26.0, 35.0, 52.0, 64.0, 84.0, 138.0, 220.0, 644.0, 11736.0, 4171602.0, 8169.0, 492.0, 257.0, 159.0, 98.0, 80.0, 64.0, 39.0, 39.0, 23.0, 29.0, 23.0, 20.0, 15.0, 13.0, 15.0, 10.0, 4.0, 9.0, 2.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.031219482421875, -0.03016185760498047, -0.029104232788085938, -0.028046607971191406, -0.026988983154296875, -0.025931358337402344, -0.024873733520507812, -0.02381610870361328, -0.02275848388671875, -0.02170085906982422, -0.020643234252929688, -0.019585609436035156, -0.018527984619140625, -0.017470359802246094, -0.016412734985351562, -0.015355110168457031, -0.0142974853515625, -0.013239860534667969, -0.012182235717773438, -0.011124610900878906, -0.010066986083984375, -0.009009361267089844, -0.007951736450195312, -0.006894111633300781, -0.00583648681640625, -0.004778861999511719, -0.0037212371826171875, -0.0026636123657226562, -0.001605987548828125, -0.0005483627319335938, 0.0005092620849609375, 0.0015668869018554688, 0.00262451171875, 0.0036821365356445312, 0.0047397613525390625, 0.005797386169433594, 0.006855010986328125, 0.007912635803222656, 0.008970260620117188, 0.010027885437011719, 0.01108551025390625, 0.012143135070800781, 0.013200759887695312, 0.014258384704589844, 0.015316009521484375, 0.016373634338378906, 0.017431259155273438, 0.01848888397216797, 0.0195465087890625, 0.02060413360595703, 0.021661758422851562, 0.022719383239746094, 0.023777008056640625, 0.024834632873535156, 0.025892257690429688, 0.02694988250732422, 0.02800750732421875, 0.02906513214111328, 0.030122756958007812, 0.031180381774902344, 0.032238006591796875, 0.033295631408691406, 0.03435325622558594, 0.03541088104248047, 0.036468505859375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 5.0, 4.0, 7.0, 10.0, 10.0, 7.0, 14.0, 15.0, 69.0, 238.0, 326.0, 139.0, 44.0, 9.0, 12.0, 9.0, 11.0, 10.0, 7.0, 2.0, 3.0, 6.0, 4.0, 2.0, 2.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0087127685546875, -0.008418679237365723, -0.008124589920043945, -0.007830500602722168, -0.007536411285400391, -0.007242321968078613, -0.006948232650756836, -0.006654143333435059, -0.006360054016113281, -0.006065964698791504, -0.0057718753814697266, -0.005477786064147949, -0.005183696746826172, -0.0048896074295043945, -0.004595518112182617, -0.00430142879486084, -0.0040073394775390625, -0.003713250160217285, -0.003419160842895508, -0.0031250715255737305, -0.002830982208251953, -0.0025368928909301758, -0.0022428035736083984, -0.001948714256286621, -0.0016546249389648438, -0.0013605356216430664, -0.001066446304321289, -0.0007723569869995117, -0.0004782676696777344, -0.00018417835235595703, 0.00010991096496582031, 0.00040400028228759766, 0.000698089599609375, 0.0009921789169311523, 0.0012862682342529297, 0.001580357551574707, 0.0018744468688964844, 0.0021685361862182617, 0.002462625503540039, 0.0027567148208618164, 0.0030508041381835938, 0.003344893455505371, 0.0036389827728271484, 0.003933072090148926, 0.004227161407470703, 0.0045212507247924805, 0.004815340042114258, 0.005109429359436035, 0.0054035186767578125, 0.00569760799407959, 0.005991697311401367, 0.0062857866287231445, 0.006579875946044922, 0.006873965263366699, 0.0071680545806884766, 0.007462143898010254, 0.007756233215332031, 0.008050322532653809, 0.008344411849975586, 0.008638501167297363, 0.00893259048461914, 0.009226679801940918, 0.009520769119262695, 0.009814858436584473, 0.01010894775390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 1.0, 8.0, 6.0, 14.0, 12.0, 21.0, 42.0, 98.0, 376.0, 3730.0, 4184109.0, 5113.0, 494.0, 116.0, 55.0, 22.0, 31.0, 6.0, 14.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0845947265625, -0.08234071731567383, -0.08008670806884766, -0.07783269882202148, -0.07557868957519531, -0.07332468032836914, -0.07107067108154297, -0.0688166618347168, -0.06656265258789062, -0.06430864334106445, -0.06205463409423828, -0.05980062484741211, -0.05754661560058594, -0.055292606353759766, -0.053038597106933594, -0.05078458786010742, -0.04853057861328125, -0.04627656936645508, -0.044022560119628906, -0.041768550872802734, -0.03951454162597656, -0.03726053237915039, -0.03500652313232422, -0.03275251388549805, -0.030498504638671875, -0.028244495391845703, -0.02599048614501953, -0.02373647689819336, -0.021482467651367188, -0.019228458404541016, -0.016974449157714844, -0.014720439910888672, -0.0124664306640625, -0.010212421417236328, -0.007958412170410156, -0.005704402923583984, -0.0034503936767578125, -0.0011963844299316406, 0.0010576248168945312, 0.003311634063720703, 0.005565643310546875, 0.007819652557373047, 0.010073661804199219, 0.01232767105102539, 0.014581680297851562, 0.016835689544677734, 0.019089698791503906, 0.021343708038330078, 0.02359771728515625, 0.025851726531982422, 0.028105735778808594, 0.030359745025634766, 0.03261375427246094, 0.03486776351928711, 0.03712177276611328, 0.03937578201293945, 0.041629791259765625, 0.0438838005065918, 0.04613780975341797, 0.04839181900024414, 0.05064582824707031, 0.052899837493896484, 0.055153846740722656, 0.05740785598754883, 0.059661865234375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 5.0, 5.0, 6.0, 19.0, 47.0, 163.0, 3591.0, 150.0, 41.0, 14.0, 8.0, 5.0, 6.0, 4.0, 2.0, 8.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01169586181640625, -0.011237263679504395, -0.010778665542602539, -0.010320067405700684, -0.009861469268798828, -0.009402871131896973, -0.008944272994995117, -0.008485674858093262, -0.008027076721191406, -0.007568478584289551, -0.007109880447387695, -0.00665128231048584, -0.006192684173583984, -0.005734086036682129, -0.0052754878997802734, -0.004816889762878418, -0.0043582916259765625, -0.003899693489074707, -0.0034410953521728516, -0.002982497215270996, -0.0025238990783691406, -0.002065300941467285, -0.0016067028045654297, -0.0011481046676635742, -0.0006895065307617188, -0.00023090839385986328, 0.0002276897430419922, 0.0006862878799438477, 0.0011448860168457031, 0.0016034841537475586, 0.002062082290649414, 0.0025206804275512695, 0.002979278564453125, 0.0034378767013549805, 0.003896474838256836, 0.004355072975158691, 0.004813671112060547, 0.005272269248962402, 0.005730867385864258, 0.006189465522766113, 0.006648063659667969, 0.007106661796569824, 0.00756525993347168, 0.008023858070373535, 0.00848245620727539, 0.008941054344177246, 0.009399652481079102, 0.009858250617980957, 0.010316848754882812, 0.010775446891784668, 0.011234045028686523, 0.011692643165588379, 0.012151241302490234, 0.01260983943939209, 0.013068437576293945, 0.0135270357131958, 0.013985633850097656, 0.014444231986999512, 0.014902830123901367, 0.015361428260803223, 0.015820026397705078, 0.016278624534606934, 0.01673722267150879, 0.017195820808410645, 0.0176544189453125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 1001.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21490637958049774, -0.2060028314590454, -0.19709926843643188, -0.18819572031497955, -0.17929217219352722, -0.1703886240720749, -0.16148507595062256, -0.15258151292800903, -0.1436779648065567, -0.13477441668510437, -0.12587085366249084, -0.11696730554103851, -0.10806375741958618, -0.09916020929813385, -0.09025665372610092, -0.081353098154068, -0.07244955003261566, -0.06354600191116333, -0.0546424463391304, -0.04573889449238777, -0.03683534264564514, -0.02793179079890251, -0.01902823895215988, -0.010124687105417252, -0.0012211352586746216, 0.007682416588068008, 0.01658596843481064, 0.02548952028155327, 0.0343930721282959, 0.04329662397503853, 0.05220017582178116, 0.06110372766852379, 0.07000729441642761, 0.07891084253787994, 0.08781439810991287, 0.0967179536819458, 0.10562150180339813, 0.11452504992485046, 0.12342860549688339, 0.13233216106891632, 0.14123570919036865, 0.15013925731182098, 0.15904280543327332, 0.16794636845588684, 0.17684991657733917, 0.1857534646987915, 0.19465702772140503, 0.20356057584285736, 0.2124641239643097, 0.22136767208576202, 0.23027122020721436, 0.23917478322982788, 0.2480783313512802, 0.25698187947273254, 0.26588544249534607, 0.2747889757156372, 0.28369253873825073, 0.29259610176086426, 0.3014996349811554, 0.3104031980037689, 0.31930673122406006, 0.3282102942466736, 0.3371138572692871, 0.34601739048957825, 0.3549209535121918]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 8.0, 8.0, 17.0, 17.0, 14.0, 24.0, 29.0, 37.0, 40.0, 46.0, 56.0, 72.0, 59.0, 43.0, 58.0, 54.0, 64.0, 60.0, 45.0, 44.0, 35.0, 28.0, 31.0, 25.0, 31.0, 19.0, 6.0, 8.0, 8.0, 5.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.025498926639556885, -0.02464284375309944, -0.023786762729287148, -0.022930681705474854, -0.02207459881901741, -0.021218515932559967, -0.020362434908747673, -0.01950635388493538, -0.018650270998477936, -0.017794188112020493, -0.0169381070882082, -0.016082026064395905, -0.015225943177938461, -0.014369861222803593, -0.013513779267668724, -0.012657697312533855, -0.011801615357398987, -0.010945533402264118, -0.01008945144712925, -0.009233369491994381, -0.008377287536859512, -0.007521205581724644, -0.006665123626589775, -0.0058090416714549065, -0.004952959716320038, -0.004096877761185169, -0.0032407958060503006, -0.002384713850915432, -0.0015286318957805634, -0.0006725499406456947, 0.0001835320144891739, 0.0010396139696240425, 0.0018956959247589111, 0.0027517778798937798, 0.0036078598350286484, 0.004463941790163517, 0.005320023745298386, 0.006176105700433254, 0.007032187655568123, 0.007888269610702991, 0.00874435156583786, 0.009600433520972729, 0.010456515476107597, 0.011312597431242466, 0.012168679386377335, 0.013024761341512203, 0.013880843296647072, 0.01473692525178194, 0.015593007206916809, 0.016449090093374252, 0.017305171117186546, 0.01816125214099884, 0.019017335027456284, 0.019873417913913727, 0.02072949893772602, 0.021585579961538315, 0.022441662847995758, 0.0232977457344532, 0.024153826758265495, 0.02500990778207779, 0.025865990668535233, 0.026722073554992676, 0.02757815457880497, 0.028434235602617264, 0.029290318489074707]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 7.0, 9.0, 4.0, 15.0, 18.0, 20.0, 25.0, 37.0, 52.0, 60.0, 98.0, 108.0, 180.0, 203.0, 284.0, 367.0, 553.0, 767.0, 1087.0, 1496.0, 2229.0, 3269.0, 5013.0, 8655.0, 16295.0, 54671.0, 839653.0, 70187.0, 17540.0, 9166.0, 5302.0, 3383.0, 2296.0, 1520.0, 1087.0, 749.0, 545.0, 411.0, 294.0, 231.0, 180.0, 129.0, 90.0, 60.0, 44.0, 45.0, 26.0, 19.0, 22.0, 15.0, 10.0, 11.0, 8.0, 9.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.01184844970703125, -0.011460661888122559, -0.011072874069213867, -0.010685086250305176, -0.010297298431396484, -0.009909510612487793, -0.009521722793579102, -0.00913393497467041, -0.008746147155761719, -0.008358359336853027, -0.007970571517944336, -0.0075827836990356445, -0.007194995880126953, -0.006807208061218262, -0.00641942024230957, -0.006031632423400879, -0.0056438446044921875, -0.005256056785583496, -0.004868268966674805, -0.004480481147766113, -0.004092693328857422, -0.0037049055099487305, -0.003317117691040039, -0.0029293298721313477, -0.0025415420532226562, -0.002153754234313965, -0.0017659664154052734, -0.001378178596496582, -0.0009903907775878906, -0.0006026029586791992, -0.0002148151397705078, 0.0001729726791381836, 0.000560760498046875, 0.0009485483169555664, 0.0013363361358642578, 0.0017241239547729492, 0.0021119117736816406, 0.002499699592590332, 0.0028874874114990234, 0.003275275230407715, 0.0036630630493164062, 0.004050850868225098, 0.004438638687133789, 0.0048264265060424805, 0.005214214324951172, 0.005602002143859863, 0.005989789962768555, 0.006377577781677246, 0.0067653656005859375, 0.007153153419494629, 0.00754094123840332, 0.007928729057312012, 0.008316516876220703, 0.008704304695129395, 0.009092092514038086, 0.009479880332946777, 0.009867668151855469, 0.01025545597076416, 0.010643243789672852, 0.011031031608581543, 0.011418819427490234, 0.011806607246398926, 0.012194395065307617, 0.012582182884216309, 0.012969970703125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 4.0, 4.0, 13.0, 8.0, 9.0, 8.0, 20.0, 57.0, 215.0, 331.0, 162.0, 49.0, 12.0, 12.0, 8.0, 11.0, 11.0, 6.0, 3.0, 3.0, 6.0, 4.0, 1.0, 3.0, 4.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0087432861328125, -0.008449196815490723, -0.008155107498168945, -0.007861018180847168, -0.007566928863525391, -0.007272839546203613, -0.006978750228881836, -0.006684660911560059, -0.006390571594238281, -0.006096482276916504, -0.0058023929595947266, -0.005508303642272949, -0.005214214324951172, -0.0049201250076293945, -0.004626035690307617, -0.00433194637298584, -0.0040378570556640625, -0.003743767738342285, -0.003449678421020508, -0.0031555891036987305, -0.002861499786376953, -0.0025674104690551758, -0.0022733211517333984, -0.001979231834411621, -0.0016851425170898438, -0.0013910531997680664, -0.001096963882446289, -0.0008028745651245117, -0.0005087852478027344, -0.00021469593048095703, 7.939338684082031e-05, 0.00037348270416259766, 0.000667572021484375, 0.0009616613388061523, 0.0012557506561279297, 0.001549839973449707, 0.0018439292907714844, 0.0021380186080932617, 0.002432107925415039, 0.0027261972427368164, 0.0030202865600585938, 0.003314375877380371, 0.0036084651947021484, 0.0039025545120239258, 0.004196643829345703, 0.0044907331466674805, 0.004784822463989258, 0.005078911781311035, 0.0053730010986328125, 0.00566709041595459, 0.005961179733276367, 0.0062552690505981445, 0.006549358367919922, 0.006843447685241699, 0.0071375370025634766, 0.007431626319885254, 0.007725715637207031, 0.008019804954528809, 0.008313894271850586, 0.008607983589172363, 0.00890207290649414, 0.009196162223815918, 0.009490251541137695, 0.009784340858459473, 0.01007843017578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 3.0, 6.0, 14.0, 9.0, 10.0, 16.0, 22.0, 31.0, 36.0, 49.0, 50.0, 58.0, 73.0, 78.0, 116.0, 164.0, 213.0, 343.0, 583.0, 1034.0, 2825.0, 31626.0, 967953.0, 37388.0, 2842.0, 1105.0, 579.0, 315.0, 236.0, 167.0, 136.0, 100.0, 70.0, 55.0, 42.0, 42.0, 35.0, 23.0, 20.0, 17.0, 16.0, 9.0, 8.0, 4.0, 2.0, 9.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0408935546875, -0.03950834274291992, -0.038123130798339844, -0.036737918853759766, -0.03535270690917969, -0.03396749496459961, -0.03258228302001953, -0.031197071075439453, -0.029811859130859375, -0.028426647186279297, -0.02704143524169922, -0.02565622329711914, -0.024271011352539062, -0.022885799407958984, -0.021500587463378906, -0.020115375518798828, -0.01873016357421875, -0.017344951629638672, -0.015959739685058594, -0.014574527740478516, -0.013189315795898438, -0.01180410385131836, -0.010418891906738281, -0.009033679962158203, -0.007648468017578125, -0.006263256072998047, -0.004878044128417969, -0.0034928321838378906, -0.0021076202392578125, -0.0007224082946777344, 0.0006628036499023438, 0.002048015594482422, 0.0034332275390625, 0.004818439483642578, 0.006203651428222656, 0.007588863372802734, 0.008974075317382812, 0.01035928726196289, 0.011744499206542969, 0.013129711151123047, 0.014514923095703125, 0.015900135040283203, 0.01728534698486328, 0.01867055892944336, 0.020055770874023438, 0.021440982818603516, 0.022826194763183594, 0.024211406707763672, 0.02559661865234375, 0.026981830596923828, 0.028367042541503906, 0.029752254486083984, 0.031137466430664062, 0.03252267837524414, 0.03390789031982422, 0.0352931022644043, 0.036678314208984375, 0.03806352615356445, 0.03944873809814453, 0.04083395004272461, 0.04221916198730469, 0.043604373931884766, 0.044989585876464844, 0.04637479782104492, 0.047760009765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 5.0, 4.0, 9.0, 9.0, 14.0, 21.0, 20.0, 20.0, 31.0, 26.0, 29.0, 28.0, 36.0, 32.0, 35.0, 46.0, 26.0, 48.0, 55.0, 32.0, 43.0, 31.0, 35.0, 41.0, 39.0, 32.0, 31.0, 30.0, 28.0, 22.0, 10.0, 13.0, 16.0, 18.0, 14.0, 9.0, 12.0, 11.0, 6.0, 4.0, 4.0, 2.0, 8.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0235137939453125, -0.022716522216796875, -0.02191925048828125, -0.021121978759765625, -0.02032470703125, -0.019527435302734375, -0.01873016357421875, -0.017932891845703125, -0.0171356201171875, -0.016338348388671875, -0.01554107666015625, -0.014743804931640625, -0.013946533203125, -0.013149261474609375, -0.01235198974609375, -0.011554718017578125, -0.0107574462890625, -0.009960174560546875, -0.00916290283203125, -0.008365631103515625, -0.007568359375, -0.006771087646484375, -0.00597381591796875, -0.005176544189453125, -0.0043792724609375, -0.003582000732421875, -0.00278472900390625, -0.001987457275390625, -0.001190185546875, -0.000392913818359375, 0.00040435791015625, 0.001201629638671875, 0.0019989013671875, 0.002796173095703125, 0.00359344482421875, 0.004390716552734375, 0.00518798828125, 0.005985260009765625, 0.00678253173828125, 0.007579803466796875, 0.0083770751953125, 0.009174346923828125, 0.00997161865234375, 0.010768890380859375, 0.011566162109375, 0.012363433837890625, 0.01316070556640625, 0.013957977294921875, 0.0147552490234375, 0.015552520751953125, 0.01634979248046875, 0.017147064208984375, 0.0179443359375, 0.018741607666015625, 0.01953887939453125, 0.020336151123046875, 0.0211334228515625, 0.021930694580078125, 0.02272796630859375, 0.023525238037109375, 0.024322509765625, 0.025119781494140625, 0.02591705322265625, 0.026714324951171875, 0.0275115966796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 10.0, 7.0, 10.0, 14.0, 15.0, 24.0, 32.0, 58.0, 82.0, 125.0, 248.0, 524.0, 1407.0, 7119.0, 875579.0, 157216.0, 4158.0, 1008.0, 386.0, 179.0, 111.0, 68.0, 36.0, 34.0, 22.0, 10.0, 16.0, 6.0, 8.0, 8.0, 8.0, 2.0, 3.0, 5.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.445148468017578e-05, -3.311969339847565e-05, -3.178790211677551e-05, -3.045611083507538e-05, -2.9124319553375244e-05, -2.779252827167511e-05, -2.6460736989974976e-05, -2.512894570827484e-05, -2.3797154426574707e-05, -2.2465363144874573e-05, -2.113357186317444e-05, -1.9801780581474304e-05, -1.846998929977417e-05, -1.7138198018074036e-05, -1.58064067363739e-05, -1.4474615454673767e-05, -1.3142824172973633e-05, -1.1811032891273499e-05, -1.0479241609573364e-05, -9.14745032787323e-06, -7.815659046173096e-06, -6.4838677644729614e-06, -5.152076482772827e-06, -3.820285201072693e-06, -2.4884939193725586e-06, -1.1567026376724243e-06, 1.7508864402770996e-07, 1.5068799257278442e-06, 2.8386712074279785e-06, 4.170462489128113e-06, 5.502253770828247e-06, 6.834045052528381e-06, 8.165836334228516e-06, 9.49762761592865e-06, 1.0829418897628784e-05, 1.2161210179328918e-05, 1.3493001461029053e-05, 1.4824792742729187e-05, 1.615658402442932e-05, 1.7488375306129456e-05, 1.882016658782959e-05, 2.0151957869529724e-05, 2.148374915122986e-05, 2.2815540432929993e-05, 2.4147331714630127e-05, 2.547912299633026e-05, 2.6810914278030396e-05, 2.814270555973053e-05, 2.9474496841430664e-05, 3.08062881231308e-05, 3.213807940483093e-05, 3.346987068653107e-05, 3.48016619682312e-05, 3.6133453249931335e-05, 3.746524453163147e-05, 3.8797035813331604e-05, 4.012882709503174e-05, 4.146061837673187e-05, 4.279240965843201e-05, 4.412420094013214e-05, 4.5455992221832275e-05, 4.678778350353241e-05, 4.8119574785232544e-05, 4.945136606693268e-05, 5.078315734863281e-05]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 6.0, 12.0, 6.0, 17.0, 8.0, 17.0, 33.0, 22.0, 39.0, 25.0, 74.0, 67.0, 63.0, 88.0, 73.0, 93.0, 58.0, 43.0, 52.0, 19.0, 52.0, 19.0, 19.0, 18.0, 11.0, 13.0, 13.0, 9.0, 7.0, 4.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.602836608886719e-06, -5.448237061500549e-06, -5.29363751411438e-06, -5.1390379667282104e-06, -4.984438419342041e-06, -4.829838871955872e-06, -4.675239324569702e-06, -4.520639777183533e-06, -4.366040229797363e-06, -4.211440682411194e-06, -4.056841135025024e-06, -3.902241587638855e-06, -3.7476420402526855e-06, -3.593042492866516e-06, -3.4384429454803467e-06, -3.2838433980941772e-06, -3.129243850708008e-06, -2.9746443033218384e-06, -2.820044755935669e-06, -2.6654452085494995e-06, -2.51084566116333e-06, -2.3562461137771606e-06, -2.201646566390991e-06, -2.0470470190048218e-06, -1.8924474716186523e-06, -1.737847924232483e-06, -1.5832483768463135e-06, -1.428648829460144e-06, -1.2740492820739746e-06, -1.1194497346878052e-06, -9.648501873016357e-07, -8.102506399154663e-07, -6.556510925292969e-07, -5.010515451431274e-07, -3.46451997756958e-07, -1.9185245037078857e-07, -3.725290298461914e-08, 1.1734664440155029e-07, 2.7194619178771973e-07, 4.2654573917388916e-07, 5.811452865600586e-07, 7.35744833946228e-07, 8.903443813323975e-07, 1.044943928718567e-06, 1.1995434761047363e-06, 1.3541430234909058e-06, 1.5087425708770752e-06, 1.6633421182632446e-06, 1.817941665649414e-06, 1.9725412130355835e-06, 2.127140760421753e-06, 2.2817403078079224e-06, 2.436339855194092e-06, 2.5909394025802612e-06, 2.7455389499664307e-06, 2.9001384973526e-06, 3.0547380447387695e-06, 3.209337592124939e-06, 3.3639371395111084e-06, 3.518536686897278e-06, 3.6731362342834473e-06, 3.827735781669617e-06, 3.982335329055786e-06, 4.1369348764419556e-06, 4.291534423828125e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 10.0, 8.0, 8.0, 22.0, 27.0, 36.0, 89.0, 121.0, 229.0, 711.0, 4777.0, 1033941.0, 7206.0, 748.0, 266.0, 141.0, 79.0, 41.0, 29.0, 18.0, 10.0, 12.0, 5.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.16908073425293e-05, -5.960371345281601e-05, -5.751661956310272e-05, -5.5429525673389435e-05, -5.334243178367615e-05, -5.125533789396286e-05, -4.916824400424957e-05, -4.7081150114536285e-05, -4.4994056224823e-05, -4.290696233510971e-05, -4.081986844539642e-05, -3.8732774555683136e-05, -3.664568066596985e-05, -3.455858677625656e-05, -3.2471492886543274e-05, -3.0384398996829987e-05, -2.82973051071167e-05, -2.6210211217403412e-05, -2.4123117327690125e-05, -2.2036023437976837e-05, -1.994892954826355e-05, -1.7861835658550262e-05, -1.5774741768836975e-05, -1.3687647879123688e-05, -1.16005539894104e-05, -9.513460099697113e-06, -7.426366209983826e-06, -5.339272320270538e-06, -3.252178430557251e-06, -1.1650845408439636e-06, 9.220093488693237e-07, 3.009103238582611e-06, 5.0961971282958984e-06, 7.183291018009186e-06, 9.270384907722473e-06, 1.135747879743576e-05, 1.3444572687149048e-05, 1.5531666576862335e-05, 1.7618760466575623e-05, 1.970585435628891e-05, 2.1792948246002197e-05, 2.3880042135715485e-05, 2.5967136025428772e-05, 2.805422991514206e-05, 3.0141323804855347e-05, 3.2228417694568634e-05, 3.431551158428192e-05, 3.640260547399521e-05, 3.8489699363708496e-05, 4.0576793253421783e-05, 4.266388714313507e-05, 4.475098103284836e-05, 4.6838074922561646e-05, 4.892516881227493e-05, 5.101226270198822e-05, 5.309935659170151e-05, 5.5186450481414795e-05, 5.727354437112808e-05, 5.936063826084137e-05, 6.144773215055466e-05, 6.353482604026794e-05, 6.562191992998123e-05, 6.770901381969452e-05, 6.97961077094078e-05, 7.18832015991211e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 8.0, 26.0, 26.0, 20.0, 44.0, 78.0, 118.0, 207.0, 153.0, 102.0, 58.0, 39.0, 37.0, 20.0, 12.0, 11.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.759695053100586e-05, -2.6520341634750366e-05, -2.5443732738494873e-05, -2.436712384223938e-05, -2.3290514945983887e-05, -2.2213906049728394e-05, -2.11372971534729e-05, -2.0060688257217407e-05, -1.8984079360961914e-05, -1.790747046470642e-05, -1.6830861568450928e-05, -1.5754252672195435e-05, -1.4677643775939941e-05, -1.3601034879684448e-05, -1.2524425983428955e-05, -1.1447817087173462e-05, -1.0371208190917969e-05, -9.294599294662476e-06, -8.217990398406982e-06, -7.141381502151489e-06, -6.064772605895996e-06, -4.988163709640503e-06, -3.91155481338501e-06, -2.8349459171295166e-06, -1.7583370208740234e-06, -6.817281246185303e-07, 3.948807716369629e-07, 1.471489667892456e-06, 2.5480985641479492e-06, 3.6247074604034424e-06, 4.7013163566589355e-06, 5.777925252914429e-06, 6.854534149169922e-06, 7.931143045425415e-06, 9.007751941680908e-06, 1.0084360837936401e-05, 1.1160969734191895e-05, 1.2237578630447388e-05, 1.3314187526702881e-05, 1.4390796422958374e-05, 1.5467405319213867e-05, 1.654401421546936e-05, 1.7620623111724854e-05, 1.8697232007980347e-05, 1.977384090423584e-05, 2.0850449800491333e-05, 2.1927058696746826e-05, 2.300366759300232e-05, 2.4080276489257812e-05, 2.5156885385513306e-05, 2.62334942817688e-05, 2.7310103178024292e-05, 2.8386712074279785e-05, 2.946332097053528e-05, 3.053992986679077e-05, 3.1616538763046265e-05, 3.269314765930176e-05, 3.376975655555725e-05, 3.4846365451812744e-05, 3.592297434806824e-05, 3.699958324432373e-05, 3.8076192140579224e-05, 3.915280103683472e-05, 4.022940993309021e-05, 4.13060188293457e-05]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 23.0, 79.0, 574.0, 241.0, 59.0, 17.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12260283529758453, -0.11834025382995605, -0.11407766491174698, -0.1098150759935379, -0.10555249452590942, -0.10128991305828094, -0.09702732414007187, -0.09276473522186279, -0.08850215375423431, -0.08423957228660583, -0.07997698336839676, -0.07571439445018768, -0.0714518129825592, -0.06718923151493073, -0.06292664259672165, -0.05866405740380287, -0.054401472210884094, -0.05013888701796532, -0.04587630182504654, -0.04161371663212776, -0.037351131439208984, -0.03308854624629021, -0.02882596105337143, -0.024563375860452652, -0.020300790667533875, -0.016038205474615097, -0.01177562028169632, -0.007513035088777542, -0.0032504498958587646, 0.0010121352970600128, 0.00527472048997879, 0.009537305682897568, 0.013799875974655151, 0.01806246116757393, 0.022325046360492706, 0.026587631553411484, 0.03085021674633026, 0.03511280193924904, 0.039375387132167816, 0.043637972325086594, 0.04790055751800537, 0.05216314271092415, 0.056425727903842926, 0.060688313096761703, 0.06495089828968048, 0.06921347975730896, 0.07347606867551804, 0.07773865759372711, 0.08200123906135559, 0.08626382052898407, 0.09052640944719315, 0.09478899836540222, 0.0990515798330307, 0.10331416130065918, 0.10757675021886826, 0.11183933913707733, 0.11610192060470581, 0.12036450207233429, 0.12462709099054337, 0.12888967990875244, 0.13315226137638092, 0.1374148428440094, 0.14167743921279907, 0.14594002068042755, 0.15020260214805603]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 10.0, 14.0, 17.0, 13.0, 21.0, 35.0, 36.0, 57.0, 58.0, 76.0, 86.0, 85.0, 80.0, 101.0, 47.0, 53.0, 49.0, 39.0, 31.0, 24.0, 17.0, 19.0, 10.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3054198622703552, -0.2963999807834625, -0.28738006949424744, -0.27836018800735474, -0.26934030652046204, -0.26032042503356934, -0.25130051374435425, -0.24228063225746155, -0.23326073586940765, -0.22424083948135376, -0.21522095799446106, -0.20620106160640717, -0.19718116521835327, -0.18816128373146057, -0.17914138734340668, -0.17012149095535278, -0.16110160946846008, -0.1520817130804062, -0.1430618315935135, -0.1340419352054596, -0.1250220537185669, -0.116002157330513, -0.1069822609424591, -0.09796237200498581, -0.08894248306751251, -0.07992259413003922, -0.07090270519256592, -0.061882808804512024, -0.05286291986703873, -0.04384303092956543, -0.034823138266801834, -0.02580324560403824, -0.01678335666656494, -0.007763465866446495, 0.0012564249336719513, 0.010276315733790398, 0.019296206533908844, 0.02831609547138214, 0.03733598813414574, 0.04635588079690933, 0.05537576973438263, 0.06439565867185593, 0.07341554760932922, 0.08243544399738312, 0.09145533293485641, 0.10047522187232971, 0.1094951182603836, 0.1185150071978569, 0.1275348961353302, 0.1365547925233841, 0.1455746740102768, 0.1545945703983307, 0.1636144518852234, 0.17263434827327728, 0.18165424466133118, 0.19067412614822388, 0.19969402253627777, 0.20871391892433167, 0.21773380041122437, 0.22675369679927826, 0.23577359318733215, 0.24479347467422485, 0.25381335616111755, 0.26283326745033264, 0.27185314893722534]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 12.0, 7.0, 12.0, 23.0, 27.0, 31.0, 41.0, 70.0, 93.0, 131.0, 203.0, 371.0, 1133.0, 18583.0, 3843278.0, 320433.0, 7921.0, 607.0, 381.0, 248.0, 176.0, 122.0, 83.0, 70.0, 50.0, 41.0, 29.0, 19.0, 18.0, 9.0, 11.0, 10.0, 10.0, 4.0, 7.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0211639404296875, -0.020406246185302734, -0.01964855194091797, -0.018890857696533203, -0.018133163452148438, -0.017375469207763672, -0.016617774963378906, -0.01586008071899414, -0.015102386474609375, -0.01434469223022461, -0.013586997985839844, -0.012829303741455078, -0.012071609497070312, -0.011313915252685547, -0.010556221008300781, -0.009798526763916016, -0.00904083251953125, -0.008283138275146484, -0.007525444030761719, -0.006767749786376953, -0.0060100555419921875, -0.005252361297607422, -0.004494667053222656, -0.0037369728088378906, -0.002979278564453125, -0.0022215843200683594, -0.0014638900756835938, -0.0007061958312988281, 5.14984130859375e-05, 0.0008091926574707031, 0.0015668869018554688, 0.0023245811462402344, 0.003082275390625, 0.0038399696350097656, 0.004597663879394531, 0.005355358123779297, 0.0061130523681640625, 0.006870746612548828, 0.007628440856933594, 0.00838613510131836, 0.009143829345703125, 0.00990152359008789, 0.010659217834472656, 0.011416912078857422, 0.012174606323242188, 0.012932300567626953, 0.013689994812011719, 0.014447689056396484, 0.01520538330078125, 0.015963077545166016, 0.01672077178955078, 0.017478466033935547, 0.018236160278320312, 0.018993854522705078, 0.019751548767089844, 0.02050924301147461, 0.021266937255859375, 0.02202463150024414, 0.022782325744628906, 0.023540019989013672, 0.024297714233398438, 0.025055408477783203, 0.02581310272216797, 0.026570796966552734, 0.0273284912109375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 5.0, 2.0, 6.0, 11.0, 11.0, 7.0, 5.0, 17.0, 51.0, 147.0, 307.0, 216.0, 90.0, 20.0, 7.0, 10.0, 10.0, 8.0, 10.0, 5.0, 2.0, 4.0, 5.0, 3.0, 3.0, 2.0, 4.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00777435302734375, -0.007497429847717285, -0.00722050666809082, -0.0069435834884643555, -0.006666660308837891, -0.006389737129211426, -0.006112813949584961, -0.005835890769958496, -0.005558967590332031, -0.005282044410705566, -0.0050051212310791016, -0.004728198051452637, -0.004451274871826172, -0.004174351692199707, -0.003897428512573242, -0.0036205053329467773, -0.0033435821533203125, -0.0030666589736938477, -0.002789735794067383, -0.002512812614440918, -0.002235889434814453, -0.0019589662551879883, -0.0016820430755615234, -0.0014051198959350586, -0.0011281967163085938, -0.0008512735366821289, -0.0005743503570556641, -0.0002974271774291992, -2.0503997802734375e-05, 0.00025641918182373047, 0.0005333423614501953, 0.0008102655410766602, 0.001087188720703125, 0.0013641119003295898, 0.0016410350799560547, 0.0019179582595825195, 0.0021948814392089844, 0.0024718046188354492, 0.002748727798461914, 0.003025650978088379, 0.0033025741577148438, 0.0035794973373413086, 0.0038564205169677734, 0.004133343696594238, 0.004410266876220703, 0.004687190055847168, 0.004964113235473633, 0.005241036415100098, 0.0055179595947265625, 0.005794882774353027, 0.006071805953979492, 0.006348729133605957, 0.006625652313232422, 0.006902575492858887, 0.0071794986724853516, 0.007456421852111816, 0.007733345031738281, 0.008010268211364746, 0.008287191390991211, 0.008564114570617676, 0.00884103775024414, 0.009117960929870605, 0.00939488410949707, 0.009671807289123535, 0.00994873046875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 10.0, 12.0, 15.0, 31.0, 29.0, 75.0, 150.0, 411.0, 1848.0, 37173.0, 4148994.0, 4413.0, 662.0, 188.0, 102.0, 38.0, 35.0, 17.0, 11.0, 4.0, 10.0, 12.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043914794921875, -0.04246091842651367, -0.041007041931152344, -0.039553165435791016, -0.03809928894042969, -0.03664541244506836, -0.03519153594970703, -0.0337376594543457, -0.032283782958984375, -0.030829906463623047, -0.02937602996826172, -0.02792215347290039, -0.026468276977539062, -0.025014400482177734, -0.023560523986816406, -0.022106647491455078, -0.02065277099609375, -0.019198894500732422, -0.017745018005371094, -0.016291141510009766, -0.014837265014648438, -0.01338338851928711, -0.011929512023925781, -0.010475635528564453, -0.009021759033203125, -0.007567882537841797, -0.006114006042480469, -0.004660129547119141, -0.0032062530517578125, -0.0017523765563964844, -0.00029850006103515625, 0.0011553764343261719, 0.0026092529296875, 0.004063129425048828, 0.005517005920410156, 0.006970882415771484, 0.008424758911132812, 0.00987863540649414, 0.011332511901855469, 0.012786388397216797, 0.014240264892578125, 0.015694141387939453, 0.01714801788330078, 0.01860189437866211, 0.020055770874023438, 0.021509647369384766, 0.022963523864746094, 0.024417400360107422, 0.02587127685546875, 0.027325153350830078, 0.028779029846191406, 0.030232906341552734, 0.03168678283691406, 0.03314065933227539, 0.03459453582763672, 0.03604841232299805, 0.037502288818359375, 0.0389561653137207, 0.04041004180908203, 0.04186391830444336, 0.04331779479980469, 0.044771671295166016, 0.046225547790527344, 0.04767942428588867, 0.04913330078125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 21.0, 49.0, 101.0, 293.0, 1532.0, 1495.0, 319.0, 115.0, 61.0, 21.0, 11.0, 7.0, 8.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.016082763671875, -0.015659451484680176, -0.015236139297485352, -0.014812827110290527, -0.014389514923095703, -0.013966202735900879, -0.013542890548706055, -0.01311957836151123, -0.012696266174316406, -0.012272953987121582, -0.011849641799926758, -0.011426329612731934, -0.01100301742553711, -0.010579705238342285, -0.010156393051147461, -0.009733080863952637, -0.009309768676757812, -0.008886456489562988, -0.008463144302368164, -0.00803983211517334, -0.007616519927978516, -0.007193207740783691, -0.006769895553588867, -0.006346583366394043, -0.005923271179199219, -0.0054999589920043945, -0.00507664680480957, -0.004653334617614746, -0.004230022430419922, -0.0038067102432250977, -0.0033833980560302734, -0.0029600858688354492, -0.002536773681640625, -0.0021134614944458008, -0.0016901493072509766, -0.0012668371200561523, -0.0008435249328613281, -0.0004202127456665039, 3.0994415283203125e-06, 0.00042641162872314453, 0.0008497238159179688, 0.001273036003112793, 0.0016963481903076172, 0.0021196603775024414, 0.0025429725646972656, 0.00296628475189209, 0.003389596939086914, 0.0038129091262817383, 0.0042362213134765625, 0.004659533500671387, 0.005082845687866211, 0.005506157875061035, 0.005929470062255859, 0.006352782249450684, 0.006776094436645508, 0.007199406623840332, 0.007622718811035156, 0.00804603099822998, 0.008469343185424805, 0.008892655372619629, 0.009315967559814453, 0.009739279747009277, 0.010162591934204102, 0.010585904121398926, 0.01100921630859375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 970.0, 34.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15761198103427887, -0.153827503323555, -0.15004302561283112, -0.14625854790210724, -0.14247405529022217, -0.1386895775794983, -0.13490509986877441, -0.13112062215805054, -0.12733614444732666, -0.12355166673660278, -0.1197671890258789, -0.11598270386457443, -0.11219822615385056, -0.10841374844312668, -0.1046292632818222, -0.10084478557109833, -0.09706030786037445, -0.09327583014965057, -0.0894913524389267, -0.08570686727762222, -0.08192238956689835, -0.07813791185617447, -0.07435342669487, -0.07056894898414612, -0.06678447127342224, -0.06299999356269836, -0.05921551212668419, -0.05543103069067001, -0.051646552979946136, -0.04786207526922226, -0.044077593833208084, -0.04029311239719391, -0.03650863468647003, -0.032724156975746155, -0.02893967553973198, -0.025155195966362953, -0.021370716392993927, -0.0175862368196249, -0.013801757246255875, -0.010017277672886848, -0.006232798099517822, -0.002448318526148796, 0.00133616104722023, 0.005120640620589256, 0.008905120193958282, 0.012689599767327309, 0.016474079340696335, 0.02025855891406536, 0.024043038487434387, 0.027827518060803413, 0.03161199763417244, 0.035396479070186615, 0.03918095678091049, 0.04296543449163437, 0.046749915927648544, 0.05053439736366272, 0.0543188750743866, 0.058103352785110474, 0.06188783422112465, 0.06567231565713882, 0.0694567933678627, 0.07324127107858658, 0.07702575623989105, 0.08081023395061493, 0.0845947116613388]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 8.0, 10.0, 12.0, 20.0, 20.0, 23.0, 30.0, 40.0, 51.0, 43.0, 48.0, 57.0, 41.0, 61.0, 56.0, 45.0, 39.0, 41.0, 46.0, 33.0, 44.0, 27.0, 23.0, 28.0, 33.0, 22.0, 17.0, 12.0, 12.0, 10.0, 9.0, 11.0, 5.0, 5.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.03274601697921753, -0.03188027814030647, -0.031014541164040565, -0.030148804187774658, -0.0292830653488636, -0.028417326509952545, -0.027551589533686638, -0.02668585255742073, -0.025820113718509674, -0.024954374879598618, -0.02408863790333271, -0.023222900927066803, -0.022357162088155746, -0.02149142324924469, -0.020625686272978783, -0.019759949296712875, -0.01889421045780182, -0.018028471618890762, -0.017162734642624855, -0.016296997666358948, -0.015431258827447891, -0.01456552091985941, -0.013699783012270927, -0.012834045104682446, -0.011968307197093964, -0.011102569289505482, -0.010236831381917, -0.009371093474328518, -0.008505355566740036, -0.007639617659151554, -0.006773879751563072, -0.00590814184397459, -0.005042403936386108, -0.0041766660287976265, -0.0033109281212091446, -0.0024451902136206627, -0.0015794523060321808, -0.0007137143984436989, 0.00015202350914478302, 0.001017761416733265, 0.0018834993243217468, 0.0027492372319102287, 0.0036149751394987106, 0.0044807130470871925, 0.0053464509546756744, 0.006212188862264156, 0.007077926769852638, 0.00794366467744112, 0.008809402585029602, 0.009675140492618084, 0.010540878400206566, 0.011406616307795048, 0.01227235421538353, 0.013138092122972012, 0.014003830030560493, 0.014869567938148975, 0.015735305845737457, 0.016601044684648514, 0.01746678166091442, 0.01833251863718033, 0.019198257476091385, 0.02006399631500244, 0.02092973329126835, 0.021795470267534256, 0.022661209106445312]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 8.0, 5.0, 9.0, 10.0, 11.0, 21.0, 19.0, 34.0, 42.0, 70.0, 100.0, 129.0, 173.0, 232.0, 356.0, 519.0, 810.0, 1174.0, 1791.0, 2821.0, 4616.0, 8240.0, 17087.0, 68515.0, 858691.0, 48504.0, 14967.0, 7562.0, 4177.0, 2668.0, 1672.0, 1153.0, 743.0, 491.0, 344.0, 245.0, 143.0, 125.0, 81.0, 55.0, 40.0, 28.0, 24.0, 11.0, 5.0, 12.0, 5.0, 8.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.01500701904296875, -0.014571070671081543, -0.014135122299194336, -0.013699173927307129, -0.013263225555419922, -0.012827277183532715, -0.012391328811645508, -0.0119553804397583, -0.011519432067871094, -0.011083483695983887, -0.01064753532409668, -0.010211586952209473, -0.009775638580322266, -0.009339690208435059, -0.008903741836547852, -0.008467793464660645, -0.008031845092773438, -0.0075958967208862305, -0.0071599483489990234, -0.006723999977111816, -0.006288051605224609, -0.005852103233337402, -0.005416154861450195, -0.004980206489562988, -0.004544258117675781, -0.004108309745788574, -0.003672361373901367, -0.00323641300201416, -0.002800464630126953, -0.002364516258239746, -0.001928567886352539, -0.001492619514465332, -0.001056671142578125, -0.000620722770690918, -0.00018477439880371094, 0.0002511739730834961, 0.0006871223449707031, 0.0011230707168579102, 0.0015590190887451172, 0.0019949674606323242, 0.0024309158325195312, 0.0028668642044067383, 0.0033028125762939453, 0.0037387609481811523, 0.004174709320068359, 0.004610657691955566, 0.0050466060638427734, 0.0054825544357299805, 0.0059185028076171875, 0.0063544511795043945, 0.0067903995513916016, 0.007226347923278809, 0.007662296295166016, 0.008098244667053223, 0.00853419303894043, 0.008970141410827637, 0.009406089782714844, 0.00984203815460205, 0.010277986526489258, 0.010713934898376465, 0.011149883270263672, 0.011585831642150879, 0.012021780014038086, 0.012457728385925293, 0.0128936767578125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 7.0, 6.0, 1.0, 4.0, 13.0, 11.0, 8.0, 4.0, 16.0, 48.0, 146.0, 309.0, 219.0, 85.0, 25.0, 6.0, 10.0, 11.0, 8.0, 9.0, 6.0, 2.0, 4.0, 5.0, 2.0, 4.0, 2.0, 4.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0077667236328125, -0.0074901580810546875, -0.007213592529296875, -0.0069370269775390625, -0.00666046142578125, -0.0063838958740234375, -0.006107330322265625, -0.0058307647705078125, -0.00555419921875, -0.0052776336669921875, -0.005001068115234375, -0.0047245025634765625, -0.00444793701171875, -0.0041713714599609375, -0.003894805908203125, -0.0036182403564453125, -0.0033416748046875, -0.0030651092529296875, -0.002788543701171875, -0.0025119781494140625, -0.00223541259765625, -0.0019588470458984375, -0.001682281494140625, -0.0014057159423828125, -0.001129150390625, -0.0008525848388671875, -0.000576019287109375, -0.0002994537353515625, -2.288818359375e-05, 0.0002536773681640625, 0.000530242919921875, 0.0008068084716796875, 0.0010833740234375, 0.0013599395751953125, 0.001636505126953125, 0.0019130706787109375, 0.00218963623046875, 0.0024662017822265625, 0.002742767333984375, 0.0030193328857421875, 0.0032958984375, 0.0035724639892578125, 0.003849029541015625, 0.0041255950927734375, 0.00440216064453125, 0.0046787261962890625, 0.004955291748046875, 0.0052318572998046875, 0.0055084228515625, 0.0057849884033203125, 0.006061553955078125, 0.0063381195068359375, 0.00661468505859375, 0.0068912506103515625, 0.007167816162109375, 0.0074443817138671875, 0.007720947265625, 0.007997512817382812, 0.008274078369140625, 0.008550643920898438, 0.00882720947265625, 0.009103775024414062, 0.009380340576171875, 0.009656906127929688, 0.0099334716796875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 8.0, 5.0, 11.0, 14.0, 14.0, 14.0, 19.0, 28.0, 31.0, 37.0, 46.0, 63.0, 67.0, 66.0, 118.0, 142.0, 191.0, 250.0, 437.0, 661.0, 1510.0, 8531.0, 821542.0, 206649.0, 4836.0, 1209.0, 634.0, 348.0, 260.0, 162.0, 116.0, 96.0, 100.0, 56.0, 34.0, 43.0, 37.0, 28.0, 36.0, 22.0, 16.0, 20.0, 10.0, 4.0, 7.0, 6.0, 7.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.03973388671875, -0.03852558135986328, -0.03731727600097656, -0.036108970642089844, -0.034900665283203125, -0.033692359924316406, -0.03248405456542969, -0.03127574920654297, -0.03006744384765625, -0.02885913848876953, -0.027650833129882812, -0.026442527770996094, -0.025234222412109375, -0.024025917053222656, -0.022817611694335938, -0.02160930633544922, -0.0204010009765625, -0.01919269561767578, -0.017984390258789062, -0.016776084899902344, -0.015567779541015625, -0.014359474182128906, -0.013151168823242188, -0.011942863464355469, -0.01073455810546875, -0.009526252746582031, -0.008317947387695312, -0.007109642028808594, -0.005901336669921875, -0.004693031311035156, -0.0034847259521484375, -0.0022764205932617188, -0.001068115234375, 0.00014019012451171875, 0.0013484954833984375, 0.0025568008422851562, 0.003765106201171875, 0.004973411560058594, 0.0061817169189453125, 0.007390022277832031, 0.00859832763671875, 0.009806632995605469, 0.011014938354492188, 0.012223243713378906, 0.013431549072265625, 0.014639854431152344, 0.015848159790039062, 0.01705646514892578, 0.0182647705078125, 0.01947307586669922, 0.020681381225585938, 0.021889686584472656, 0.023097991943359375, 0.024306297302246094, 0.025514602661132812, 0.02672290802001953, 0.02793121337890625, 0.02913951873779297, 0.030347824096679688, 0.031556129455566406, 0.032764434814453125, 0.033972740173339844, 0.03518104553222656, 0.03638935089111328, 0.03759765625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 7.0, 9.0, 9.0, 7.0, 10.0, 13.0, 14.0, 12.0, 21.0, 28.0, 21.0, 23.0, 24.0, 33.0, 33.0, 27.0, 52.0, 39.0, 30.0, 45.0, 38.0, 32.0, 32.0, 33.0, 32.0, 31.0, 24.0, 33.0, 30.0, 33.0, 36.0, 26.0, 10.0, 28.0, 20.0, 14.0, 20.0, 13.0, 11.0, 13.0, 7.0, 4.0, 5.0, 4.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0235443115234375, -0.02282881736755371, -0.022113323211669922, -0.021397829055786133, -0.020682334899902344, -0.019966840744018555, -0.019251346588134766, -0.018535852432250977, -0.017820358276367188, -0.0171048641204834, -0.01638936996459961, -0.01567387580871582, -0.014958381652832031, -0.014242887496948242, -0.013527393341064453, -0.012811899185180664, -0.012096405029296875, -0.011380910873413086, -0.010665416717529297, -0.009949922561645508, -0.009234428405761719, -0.00851893424987793, -0.007803440093994141, -0.0070879459381103516, -0.0063724517822265625, -0.0056569576263427734, -0.004941463470458984, -0.004225969314575195, -0.0035104751586914062, -0.002794981002807617, -0.002079486846923828, -0.001363992691040039, -0.00064849853515625, 6.699562072753906e-05, 0.0007824897766113281, 0.0014979839324951172, 0.0022134780883789062, 0.0029289722442626953, 0.0036444664001464844, 0.0043599605560302734, 0.0050754547119140625, 0.0057909488677978516, 0.006506443023681641, 0.00722193717956543, 0.007937431335449219, 0.008652925491333008, 0.009368419647216797, 0.010083913803100586, 0.010799407958984375, 0.011514902114868164, 0.012230396270751953, 0.012945890426635742, 0.013661384582519531, 0.01437687873840332, 0.01509237289428711, 0.0158078670501709, 0.016523361206054688, 0.017238855361938477, 0.017954349517822266, 0.018669843673706055, 0.019385337829589844, 0.020100831985473633, 0.020816326141357422, 0.02153182029724121, 0.022247314453125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 8.0, 15.0, 15.0, 23.0, 28.0, 45.0, 57.0, 91.0, 179.0, 306.0, 711.0, 2035.0, 9988.0, 169467.0, 844383.0, 16650.0, 2806.0, 839.0, 348.0, 238.0, 120.0, 69.0, 41.0, 30.0, 22.0, 5.0, 9.0, 8.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5497207641601562e-05, -1.5014782547950745e-05, -1.4532357454299927e-05, -1.4049932360649109e-05, -1.3567507266998291e-05, -1.3085082173347473e-05, -1.2602657079696655e-05, -1.2120231986045837e-05, -1.163780689239502e-05, -1.1155381798744202e-05, -1.0672956705093384e-05, -1.0190531611442566e-05, -9.708106517791748e-06, -9.22568142414093e-06, -8.743256330490112e-06, -8.260831236839294e-06, -7.778406143188477e-06, -7.295981049537659e-06, -6.813555955886841e-06, -6.331130862236023e-06, -5.848705768585205e-06, -5.366280674934387e-06, -4.883855581283569e-06, -4.4014304876327515e-06, -3.919005393981934e-06, -3.4365803003311157e-06, -2.954155206680298e-06, -2.47173011302948e-06, -1.989305019378662e-06, -1.5068799257278442e-06, -1.0244548320770264e-06, -5.420297384262085e-07, -5.960464477539063e-08, 4.2282044887542725e-07, 9.052455425262451e-07, 1.387670636177063e-06, 1.8700957298278809e-06, 2.3525208234786987e-06, 2.8349459171295166e-06, 3.3173710107803345e-06, 3.7997961044311523e-06, 4.28222119808197e-06, 4.764646291732788e-06, 5.247071385383606e-06, 5.729496479034424e-06, 6.211921572685242e-06, 6.6943466663360596e-06, 7.1767717599868774e-06, 7.659196853637695e-06, 8.141621947288513e-06, 8.624047040939331e-06, 9.106472134590149e-06, 9.588897228240967e-06, 1.0071322321891785e-05, 1.0553747415542603e-05, 1.103617250919342e-05, 1.1518597602844238e-05, 1.2001022696495056e-05, 1.2483447790145874e-05, 1.2965872883796692e-05, 1.344829797744751e-05, 1.3930723071098328e-05, 1.4413148164749146e-05, 1.4895573258399963e-05, 1.537799835205078e-05]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 10.0, 12.0, 19.0, 26.0, 24.0, 44.0, 40.0, 86.0, 63.0, 65.0, 124.0, 76.0, 87.0, 91.0, 44.0, 49.0, 29.0, 25.0, 13.0, 22.0, 13.0, 5.0, 10.0, 7.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.066394805908203e-06, -4.852190613746643e-06, -4.637986421585083e-06, -4.423782229423523e-06, -4.209578037261963e-06, -3.995373845100403e-06, -3.7811696529388428e-06, -3.5669654607772827e-06, -3.3527612686157227e-06, -3.1385570764541626e-06, -2.9243528842926025e-06, -2.7101486921310425e-06, -2.4959444999694824e-06, -2.2817403078079224e-06, -2.0675361156463623e-06, -1.8533319234848022e-06, -1.6391277313232422e-06, -1.4249235391616821e-06, -1.210719347000122e-06, -9.96515154838562e-07, -7.82310962677002e-07, -5.681067705154419e-07, -3.5390257835388184e-07, -1.3969838619232178e-07, 7.450580596923828e-08, 2.8870999813079834e-07, 5.029141902923584e-07, 7.171183824539185e-07, 9.313225746154785e-07, 1.1455267667770386e-06, 1.3597309589385986e-06, 1.5739351511001587e-06, 1.7881393432617188e-06, 2.002343535423279e-06, 2.216547727584839e-06, 2.430751919746399e-06, 2.644956111907959e-06, 2.859160304069519e-06, 3.073364496231079e-06, 3.287568688392639e-06, 3.5017728805541992e-06, 3.7159770727157593e-06, 3.930181264877319e-06, 4.144385457038879e-06, 4.3585896492004395e-06, 4.5727938413619995e-06, 4.7869980335235596e-06, 5.00120222568512e-06, 5.21540641784668e-06, 5.42961061000824e-06, 5.6438148021698e-06, 5.85801899433136e-06, 6.07222318649292e-06, 6.28642737865448e-06, 6.50063157081604e-06, 6.7148357629776e-06, 6.92903995513916e-06, 7.14324414730072e-06, 7.35744833946228e-06, 7.57165253162384e-06, 7.7858567237854e-06, 8.00006091594696e-06, 8.21426510810852e-06, 8.42846930027008e-06, 8.64267349243164e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 9.0, 9.0, 12.0, 11.0, 18.0, 29.0, 47.0, 109.0, 308.0, 1712.0, 1036926.0, 8449.0, 568.0, 164.0, 84.0, 31.0, 19.0, 15.0, 10.0, 7.0, 4.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.039308547973633e-05, -6.836559623479843e-05, -6.633810698986053e-05, -6.431061774492264e-05, -6.228312849998474e-05, -6.0255639255046844e-05, -5.822815001010895e-05, -5.620066076517105e-05, -5.4173171520233154e-05, -5.214568227529526e-05, -5.011819303035736e-05, -4.8090703785419464e-05, -4.606321454048157e-05, -4.403572529554367e-05, -4.2008236050605774e-05, -3.998074680566788e-05, -3.795325756072998e-05, -3.5925768315792084e-05, -3.389827907085419e-05, -3.187078982591629e-05, -2.9843300580978394e-05, -2.7815811336040497e-05, -2.57883220911026e-05, -2.3760832846164703e-05, -2.1733343601226807e-05, -1.970585435628891e-05, -1.7678365111351013e-05, -1.5650875866413116e-05, -1.362338662147522e-05, -1.1595897376537323e-05, -9.568408131599426e-06, -7.5409188866615295e-06, -5.513429641723633e-06, -3.485940396785736e-06, -1.4584511518478394e-06, 5.690380930900574e-07, 2.596527338027954e-06, 4.624016582965851e-06, 6.6515058279037476e-06, 8.678995072841644e-06, 1.0706484317779541e-05, 1.2733973562717438e-05, 1.4761462807655334e-05, 1.678895205259323e-05, 1.8816441297531128e-05, 2.0843930542469025e-05, 2.287141978740692e-05, 2.4898909032344818e-05, 2.6926398277282715e-05, 2.895388752222061e-05, 3.098137676715851e-05, 3.3008866012096405e-05, 3.50363552570343e-05, 3.70638445019722e-05, 3.9091333746910095e-05, 4.111882299184799e-05, 4.314631223678589e-05, 4.5173801481723785e-05, 4.720129072666168e-05, 4.922877997159958e-05, 5.1256269216537476e-05, 5.328375846147537e-05, 5.531124770641327e-05, 5.7338736951351166e-05, 5.936622619628906e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 6.0, 6.0, 2.0, 5.0, 16.0, 15.0, 42.0, 75.0, 144.0, 306.0, 177.0, 106.0, 48.0, 17.0, 14.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-05, -4.0617771446704865e-05, -3.951229155063629e-05, -3.840681165456772e-05, -3.7301331758499146e-05, -3.619585186243057e-05, -3.5090371966362e-05, -3.3984892070293427e-05, -3.2879412174224854e-05, -3.177393227815628e-05, -3.066845238208771e-05, -2.9562972486019135e-05, -2.845749258995056e-05, -2.735201269388199e-05, -2.6246532797813416e-05, -2.5141052901744843e-05, -2.403557300567627e-05, -2.2930093109607697e-05, -2.1824613213539124e-05, -2.071913331747055e-05, -1.9613653421401978e-05, -1.8508173525333405e-05, -1.740269362926483e-05, -1.629721373319626e-05, -1.5191733837127686e-05, -1.4086253941059113e-05, -1.298077404499054e-05, -1.1875294148921967e-05, -1.0769814252853394e-05, -9.66433435678482e-06, -8.558854460716248e-06, -7.4533745646476746e-06, -6.3478946685791016e-06, -5.2424147725105286e-06, -4.1369348764419556e-06, -3.0314549803733826e-06, -1.9259750843048096e-06, -8.204951882362366e-07, 2.849847078323364e-07, 1.3904646039009094e-06, 2.4959444999694824e-06, 3.6014243960380554e-06, 4.706904292106628e-06, 5.812384188175201e-06, 6.917864084243774e-06, 8.023343980312347e-06, 9.12882387638092e-06, 1.0234303772449493e-05, 1.1339783668518066e-05, 1.244526356458664e-05, 1.3550743460655212e-05, 1.4656223356723785e-05, 1.576170325279236e-05, 1.686718314886093e-05, 1.7972663044929504e-05, 1.9078142940998077e-05, 2.018362283706665e-05, 2.1289102733135223e-05, 2.2394582629203796e-05, 2.350006252527237e-05, 2.4605542421340942e-05, 2.5711022317409515e-05, 2.681650221347809e-05, 2.792198210954666e-05, 2.9027462005615234e-05]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 10.0, 21.0, 34.0, 137.0, 496.0, 199.0, 68.0, 16.0, 10.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06408916413784027, -0.06138811260461807, -0.058687061071395874, -0.055986013263463974, -0.053284961730241776, -0.05058391019701958, -0.04788286238908768, -0.04518181085586548, -0.04248075932264328, -0.03977970778942108, -0.03707865625619888, -0.03437760844826698, -0.031676556915044785, -0.028975505381822586, -0.026274455711245537, -0.023573406040668488, -0.02087235450744629, -0.01817130297422409, -0.015470253303647041, -0.012769202701747417, -0.010068152099847794, -0.00736710149794817, -0.004666050896048546, -0.0019650012254714966, 0.0007360503077507019, 0.0034371009096503258, 0.00613815151154995, 0.008839202113449574, 0.011540252715349197, 0.014241303317248821, 0.016942353919148445, 0.019643403589725494, 0.022344455122947693, 0.02504550665616989, 0.02774655632674694, 0.03044760599732399, 0.03314865753054619, 0.03584970906376839, 0.03855075687170029, 0.041251808404922485, 0.043952859938144684, 0.04665391147136688, 0.04935496300458908, 0.05205601081252098, 0.05475706234574318, 0.05745811387896538, 0.06015916168689728, 0.06286021322011948, 0.06556126475334167, 0.06826231628656387, 0.07096336781978607, 0.07366441935300827, 0.07636547088623047, 0.07906651496887207, 0.08176756650209427, 0.08446861803531647, 0.08716966956853867, 0.08987072110176086, 0.09257177263498306, 0.09527282416820526, 0.09797386825084686, 0.10067491978406906, 0.10337597131729126, 0.10607702285051346, 0.10877807438373566]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 7.0, 5.0, 5.0, 6.0, 11.0, 8.0, 14.0, 15.0, 12.0, 16.0, 15.0, 24.0, 34.0, 20.0, 22.0, 44.0, 33.0, 46.0, 45.0, 45.0, 43.0, 52.0, 43.0, 55.0, 42.0, 38.0, 35.0, 42.0, 28.0, 29.0, 18.0, 20.0, 16.0, 17.0, 18.0, 16.0, 11.0, 14.0, 4.0, 7.0, 4.0, 6.0, 5.0, 3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.15168660879135132, -0.14716698229312897, -0.14264734089374542, -0.13812771439552307, -0.13360807299613953, -0.12908844649791718, -0.12456881999969482, -0.12004918605089188, -0.11552955210208893, -0.11100991815328598, -0.10649028420448303, -0.10197065770626068, -0.09745102375745773, -0.09293138980865479, -0.08841176331043243, -0.08389212936162949, -0.07937249541282654, -0.07485286146402359, -0.07033322751522064, -0.06581360101699829, -0.06129396706819534, -0.056774333119392395, -0.052254702895879745, -0.047735072672367096, -0.04321543872356415, -0.0386958047747612, -0.03417617455124855, -0.02965654246509075, -0.025136910378932953, -0.020617278292775154, -0.016097646206617355, -0.011578015983104706, -0.007058382034301758, -0.002538749948143959, 0.0019808821380138397, 0.0065005142241716385, 0.011020146310329437, 0.015539778396487236, 0.020059410482645035, 0.024579040706157684, 0.029098674654960632, 0.03361830860376358, 0.03813793882727623, 0.04265756905078888, 0.04717720299959183, 0.051696836948394775, 0.056216467171907425, 0.060736097395420074, 0.06525573134422302, 0.06977536529302597, 0.07429499924182892, 0.07881462574005127, 0.08333425968885422, 0.08785389363765717, 0.09237352013587952, 0.09689315408468246, 0.10141278803348541, 0.10593242198228836, 0.11045205593109131, 0.11497168242931366, 0.11949131637811661, 0.12401095032691956, 0.1285305768251419, 0.13305020332336426, 0.1375698447227478]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 9.0, 7.0, 18.0, 20.0, 27.0, 23.0, 32.0, 68.0, 556.0, 4603.0, 4161182.0, 25990.0, 1408.0, 80.0, 38.0, 38.0, 41.0, 35.0, 16.0, 15.0, 12.0, 6.0, 10.0, 4.0, 4.0, 1.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0185394287109375, -0.017873287200927734, -0.01720714569091797, -0.016541004180908203, -0.015874862670898438, -0.015208721160888672, -0.014542579650878906, -0.01387643814086914, -0.013210296630859375, -0.01254415512084961, -0.011878013610839844, -0.011211872100830078, -0.010545730590820312, -0.009879589080810547, -0.009213447570800781, -0.008547306060791016, -0.00788116455078125, -0.007215023040771484, -0.006548881530761719, -0.005882740020751953, -0.0052165985107421875, -0.004550457000732422, -0.0038843154907226562, -0.0032181739807128906, -0.002552032470703125, -0.0018858909606933594, -0.0012197494506835938, -0.0005536079406738281, 0.0001125335693359375, 0.0007786750793457031, 0.0014448165893554688, 0.0021109580993652344, 0.002777099609375, 0.0034432411193847656, 0.004109382629394531, 0.004775524139404297, 0.0054416656494140625, 0.006107807159423828, 0.006773948669433594, 0.007440090179443359, 0.008106231689453125, 0.00877237319946289, 0.009438514709472656, 0.010104656219482422, 0.010770797729492188, 0.011436939239501953, 0.012103080749511719, 0.012769222259521484, 0.01343536376953125, 0.014101505279541016, 0.014767646789550781, 0.015433788299560547, 0.016099929809570312, 0.016766071319580078, 0.017432212829589844, 0.01809835433959961, 0.018764495849609375, 0.01943063735961914, 0.020096778869628906, 0.020762920379638672, 0.021429061889648438, 0.022095203399658203, 0.02276134490966797, 0.023427486419677734, 0.0240936279296875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 3.0, 5.0, 13.0, 10.0, 6.0, 6.0, 15.0, 64.0, 139.0, 278.0, 228.0, 95.0, 26.0, 9.0, 8.0, 12.0, 9.0, 9.0, 4.0, 4.0, 3.0, 5.0, 3.0, 4.0, 1.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00760650634765625, -0.007335662841796875, -0.0070648193359375, -0.006793975830078125, -0.00652313232421875, -0.006252288818359375, -0.0059814453125, -0.005710601806640625, -0.00543975830078125, -0.005168914794921875, -0.0048980712890625, -0.004627227783203125, -0.00435638427734375, -0.004085540771484375, -0.003814697265625, -0.003543853759765625, -0.00327301025390625, -0.003002166748046875, -0.0027313232421875, -0.002460479736328125, -0.00218963623046875, -0.001918792724609375, -0.00164794921875, -0.001377105712890625, -0.00110626220703125, -0.000835418701171875, -0.0005645751953125, -0.000293731689453125, -2.288818359375e-05, 0.000247955322265625, 0.000518798828125, 0.000789642333984375, 0.00106048583984375, 0.001331329345703125, 0.0016021728515625, 0.001873016357421875, 0.00214385986328125, 0.002414703369140625, 0.002685546875, 0.002956390380859375, 0.00322723388671875, 0.003498077392578125, 0.0037689208984375, 0.004039764404296875, 0.00431060791015625, 0.004581451416015625, 0.004852294921875, 0.005123138427734375, 0.00539398193359375, 0.005664825439453125, 0.0059356689453125, 0.006206512451171875, 0.00647735595703125, 0.006748199462890625, 0.00701904296875, 0.007289886474609375, 0.00756072998046875, 0.007831573486328125, 0.0081024169921875, 0.008373260498046875, 0.00864410400390625, 0.008914947509765625, 0.009185791015625, 0.009456634521484375, 0.00972747802734375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 14.0, 9.0, 22.0, 38.0, 109.0, 313.0, 1561.0, 70134.0, 4118719.0, 2561.0, 496.0, 159.0, 62.0, 22.0, 15.0, 12.0, 4.0, 5.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02703857421875, -0.02628946304321289, -0.02554035186767578, -0.024791240692138672, -0.024042129516601562, -0.023293018341064453, -0.022543907165527344, -0.021794795989990234, -0.021045684814453125, -0.020296573638916016, -0.019547462463378906, -0.018798351287841797, -0.018049240112304688, -0.017300128936767578, -0.01655101776123047, -0.01580190658569336, -0.01505279541015625, -0.01430368423461914, -0.013554573059082031, -0.012805461883544922, -0.012056350708007812, -0.011307239532470703, -0.010558128356933594, -0.009809017181396484, -0.009059906005859375, -0.008310794830322266, -0.007561683654785156, -0.006812572479248047, -0.0060634613037109375, -0.005314350128173828, -0.004565238952636719, -0.0038161277770996094, -0.0030670166015625, -0.0023179054260253906, -0.0015687942504882812, -0.0008196830749511719, -7.05718994140625e-05, 0.0006785392761230469, 0.0014276504516601562, 0.0021767616271972656, 0.002925872802734375, 0.0036749839782714844, 0.004424095153808594, 0.005173206329345703, 0.0059223175048828125, 0.006671428680419922, 0.007420539855957031, 0.00816965103149414, 0.00891876220703125, 0.00966787338256836, 0.010416984558105469, 0.011166095733642578, 0.011915206909179688, 0.012664318084716797, 0.013413429260253906, 0.014162540435791016, 0.014911651611328125, 0.015660762786865234, 0.016409873962402344, 0.017158985137939453, 0.017908096313476562, 0.018657207489013672, 0.01940631866455078, 0.02015542984008789, 0.020904541015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 11.0, 27.0, 42.0, 108.0, 3207.0, 506.0, 86.0, 40.0, 18.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005298614501953125, -0.005076348781585693, -0.004854083061218262, -0.00463181734085083, -0.0044095516204833984, -0.004187285900115967, -0.003965020179748535, -0.0037427544593811035, -0.003520488739013672, -0.0032982230186462402, -0.0030759572982788086, -0.002853691577911377, -0.0026314258575439453, -0.0024091601371765137, -0.002186894416809082, -0.0019646286964416504, -0.0017423629760742188, -0.0015200972557067871, -0.0012978315353393555, -0.0010755658149719238, -0.0008533000946044922, -0.0006310343742370605, -0.0004087686538696289, -0.00018650293350219727, 3.5762786865234375e-05, 0.000258028507232666, 0.00048029422760009766, 0.0007025599479675293, 0.0009248256683349609, 0.0011470913887023926, 0.0013693571090698242, 0.0015916228294372559, 0.0018138885498046875, 0.002036154270172119, 0.0022584199905395508, 0.0024806857109069824, 0.002702951431274414, 0.0029252171516418457, 0.0031474828720092773, 0.003369748592376709, 0.0035920143127441406, 0.0038142800331115723, 0.004036545753479004, 0.0042588114738464355, 0.004481077194213867, 0.004703342914581299, 0.0049256086349487305, 0.005147874355316162, 0.005370140075683594, 0.005592405796051025, 0.005814671516418457, 0.006036937236785889, 0.00625920295715332, 0.006481468677520752, 0.006703734397888184, 0.006926000118255615, 0.007148265838623047, 0.0073705315589904785, 0.00759279727935791, 0.007815062999725342, 0.008037328720092773, 0.008259594440460205, 0.008481860160827637, 0.008704125881195068, 0.0089263916015625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 6.0, 724.0, 287.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012417360208928585, -0.01033632643520832, -0.008255291730165482, -0.006174257956445217, -0.004093224182724953, -0.0020121904090046883, 6.884429603815079e-05, 0.0021498780697584152, 0.00423091184347868, 0.006311945617198944, 0.008392980322241783, 0.010474014095962048, 0.012555047869682312, 0.014636081643402576, 0.01671711727976799, 0.01879815012216568, 0.02087918296456337, 0.02296021766960621, 0.0250412505120039, 0.027122285217046738, 0.029203318059444427, 0.031284354627132416, 0.033365387469530106, 0.035446420311927795, 0.037527456879615784, 0.039608489722013474, 0.04168952628970146, 0.04377055913209915, 0.04585159197449684, 0.04793262481689453, 0.05001366138458252, 0.05209469422698021, 0.054175734519958496, 0.056256767362356186, 0.058337803930044174, 0.060418836772441864, 0.062499869614839554, 0.06458090245723724, 0.06666193902492523, 0.06874297559261322, 0.07082400470972061, 0.0729050412774086, 0.07498607039451599, 0.07706710696220398, 0.07914814352989197, 0.08122917264699936, 0.08331020921468735, 0.08539124578237534, 0.08747227489948273, 0.08955331146717072, 0.0916343405842781, 0.0937153771519661, 0.09579641371965408, 0.09787744283676147, 0.09995847940444946, 0.10203951597213745, 0.10412055253982544, 0.10620158910751343, 0.10828261822462082, 0.11036365479230881, 0.1124446913599968, 0.11452572047710419, 0.11660675704479218, 0.11868779361248016, 0.12076882272958755]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 13.0, 18.0, 26.0, 29.0, 41.0, 66.0, 66.0, 82.0, 74.0, 75.0, 90.0, 63.0, 68.0, 70.0, 66.0, 35.0, 37.0, 31.0, 21.0, 9.0, 6.0, 9.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.019170522689819336, -0.018626732751727104, -0.018082942813634872, -0.01753915287554264, -0.01699536293745041, -0.016451572999358177, -0.015907783061265945, -0.015363993123173714, -0.014820203185081482, -0.01427641324698925, -0.013732623308897018, -0.013188833370804787, -0.012645043432712555, -0.012101253494620323, -0.011557463556528091, -0.01101367361843586, -0.010469883680343628, -0.009926093742251396, -0.009382303804159164, -0.008838513866066933, -0.008294723927974701, -0.007750933989882469, -0.007207144051790237, -0.006663354113698006, -0.006119564175605774, -0.005575774237513542, -0.00503198429942131, -0.004488194361329079, -0.003944404423236847, -0.003400614485144615, -0.0028568245470523834, -0.0023130346089601517, -0.00176924467086792, -0.0012254547327756882, -0.0006816647946834564, -0.00013787485659122467, 0.0004059150815010071, 0.0009497050195932388, 0.0014934949576854706, 0.0020372848957777023, 0.002581074833869934, 0.003124864771962166, 0.0036686547100543976, 0.004212444648146629, 0.004756234586238861, 0.005300024524331093, 0.005843814462423325, 0.006387604400515556, 0.006931394338607788, 0.00747518427670002, 0.008018974214792252, 0.008562764152884483, 0.009106554090976715, 0.009650344029068947, 0.010194133967161179, 0.01073792390525341, 0.011281713843345642, 0.011825503781437874, 0.012369293719530106, 0.012913083657622337, 0.013456873595714569, 0.0140006635338068, 0.014544453471899033, 0.015088243409991264, 0.015632033348083496]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 8.0, 11.0, 8.0, 12.0, 15.0, 17.0, 14.0, 24.0, 24.0, 41.0, 46.0, 62.0, 81.0, 91.0, 147.0, 174.0, 277.0, 482.0, 905.0, 1729.0, 3570.0, 7843.0, 21900.0, 704514.0, 273239.0, 19255.0, 6944.0, 3187.0, 1637.0, 867.0, 458.0, 276.0, 188.0, 114.0, 75.0, 69.0, 43.0, 42.0, 42.0, 28.0, 27.0, 16.0, 16.0, 14.0, 5.0, 3.0, 6.0, 2.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.015716552734375, -0.015191793441772461, -0.014667034149169922, -0.014142274856567383, -0.013617515563964844, -0.013092756271362305, -0.012567996978759766, -0.012043237686157227, -0.011518478393554688, -0.010993719100952148, -0.01046895980834961, -0.00994420051574707, -0.009419441223144531, -0.008894681930541992, -0.008369922637939453, -0.007845163345336914, -0.007320404052734375, -0.006795644760131836, -0.006270885467529297, -0.005746126174926758, -0.005221366882324219, -0.00469660758972168, -0.004171848297119141, -0.0036470890045166016, -0.0031223297119140625, -0.0025975704193115234, -0.0020728111267089844, -0.0015480518341064453, -0.0010232925415039062, -0.0004985332489013672, 2.6226043701171875e-05, 0.0005509853363037109, 0.00107574462890625, 0.001600503921508789, 0.002125263214111328, 0.002650022506713867, 0.0031747817993164062, 0.0036995410919189453, 0.004224300384521484, 0.0047490596771240234, 0.0052738189697265625, 0.0057985782623291016, 0.006323337554931641, 0.00684809684753418, 0.007372856140136719, 0.007897615432739258, 0.008422374725341797, 0.008947134017944336, 0.009471893310546875, 0.009996652603149414, 0.010521411895751953, 0.011046171188354492, 0.011570930480957031, 0.01209568977355957, 0.01262044906616211, 0.013145208358764648, 0.013669967651367188, 0.014194726943969727, 0.014719486236572266, 0.015244245529174805, 0.015769004821777344, 0.016293764114379883, 0.016818523406982422, 0.01734328269958496, 0.0178680419921875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 2.0, 5.0, 15.0, 9.0, 6.0, 6.0, 18.0, 67.0, 156.0, 287.0, 209.0, 84.0, 23.0, 10.0, 7.0, 14.0, 8.0, 8.0, 4.0, 5.0, 2.0, 6.0, 2.0, 4.0, 1.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0075836181640625, -0.007312655448913574, -0.0070416927337646484, -0.006770730018615723, -0.006499767303466797, -0.006228804588317871, -0.005957841873168945, -0.0056868791580200195, -0.005415916442871094, -0.005144953727722168, -0.004873991012573242, -0.004603028297424316, -0.004332065582275391, -0.004061102867126465, -0.003790140151977539, -0.0035191774368286133, -0.0032482147216796875, -0.0029772520065307617, -0.002706289291381836, -0.00243532657623291, -0.0021643638610839844, -0.0018934011459350586, -0.0016224384307861328, -0.001351475715637207, -0.0010805130004882812, -0.0008095502853393555, -0.0005385875701904297, -0.0002676248550415039, 3.337860107421875e-06, 0.00027430057525634766, 0.0005452632904052734, 0.0008162260055541992, 0.001087188720703125, 0.0013581514358520508, 0.0016291141510009766, 0.0019000768661499023, 0.002171039581298828, 0.002442002296447754, 0.0027129650115966797, 0.0029839277267456055, 0.0032548904418945312, 0.003525853157043457, 0.003796815872192383, 0.004067778587341309, 0.004338741302490234, 0.00460970401763916, 0.004880666732788086, 0.005151629447937012, 0.0054225921630859375, 0.005693554878234863, 0.005964517593383789, 0.006235480308532715, 0.006506443023681641, 0.006777405738830566, 0.007048368453979492, 0.007319331169128418, 0.007590293884277344, 0.00786125659942627, 0.008132219314575195, 0.008403182029724121, 0.008674144744873047, 0.008945107460021973, 0.009216070175170898, 0.009487032890319824, 0.00975799560546875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 4.0, 2.0, 13.0, 14.0, 17.0, 13.0, 20.0, 23.0, 24.0, 43.0, 58.0, 46.0, 62.0, 78.0, 110.0, 135.0, 180.0, 274.0, 450.0, 787.0, 1824.0, 11462.0, 990311.0, 37465.0, 2469.0, 919.0, 517.0, 311.0, 212.0, 159.0, 110.0, 82.0, 65.0, 52.0, 39.0, 40.0, 32.0, 35.0, 17.0, 24.0, 13.0, 8.0, 10.0, 7.0, 11.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0352783203125, -0.03412675857543945, -0.032975196838378906, -0.03182363510131836, -0.030672073364257812, -0.029520511627197266, -0.02836894989013672, -0.027217388153076172, -0.026065826416015625, -0.024914264678955078, -0.02376270294189453, -0.022611141204833984, -0.021459579467773438, -0.02030801773071289, -0.019156455993652344, -0.018004894256591797, -0.01685333251953125, -0.015701770782470703, -0.014550209045410156, -0.01339864730834961, -0.012247085571289062, -0.011095523834228516, -0.009943962097167969, -0.008792400360107422, -0.007640838623046875, -0.006489276885986328, -0.005337715148925781, -0.004186153411865234, -0.0030345916748046875, -0.0018830299377441406, -0.0007314682006835938, 0.0004200935363769531, 0.0015716552734375, 0.002723217010498047, 0.0038747787475585938, 0.005026340484619141, 0.0061779022216796875, 0.007329463958740234, 0.008481025695800781, 0.009632587432861328, 0.010784149169921875, 0.011935710906982422, 0.013087272644042969, 0.014238834381103516, 0.015390396118164062, 0.01654195785522461, 0.017693519592285156, 0.018845081329345703, 0.01999664306640625, 0.021148204803466797, 0.022299766540527344, 0.02345132827758789, 0.024602890014648438, 0.025754451751708984, 0.02690601348876953, 0.028057575225830078, 0.029209136962890625, 0.030360698699951172, 0.03151226043701172, 0.032663822174072266, 0.03381538391113281, 0.03496694564819336, 0.036118507385253906, 0.03727006912231445, 0.038421630859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 7.0, 5.0, 13.0, 7.0, 10.0, 14.0, 12.0, 15.0, 30.0, 17.0, 23.0, 30.0, 40.0, 37.0, 37.0, 35.0, 26.0, 44.0, 38.0, 46.0, 31.0, 44.0, 33.0, 24.0, 48.0, 37.0, 33.0, 37.0, 38.0, 25.0, 21.0, 15.0, 19.0, 16.0, 15.0, 24.0, 3.0, 14.0, 10.0, 5.0, 6.0, 4.0, 7.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0212554931640625, -0.020560741424560547, -0.019865989685058594, -0.01917123794555664, -0.018476486206054688, -0.017781734466552734, -0.01708698272705078, -0.016392230987548828, -0.015697479248046875, -0.015002727508544922, -0.014307975769042969, -0.013613224029541016, -0.012918472290039062, -0.01222372055053711, -0.011528968811035156, -0.010834217071533203, -0.01013946533203125, -0.009444713592529297, -0.008749961853027344, -0.00805521011352539, -0.0073604583740234375, -0.006665706634521484, -0.005970954895019531, -0.005276203155517578, -0.004581451416015625, -0.003886699676513672, -0.0031919479370117188, -0.0024971961975097656, -0.0018024444580078125, -0.0011076927185058594, -0.00041294097900390625, 0.0002818107604980469, 0.0009765625, 0.0016713142395019531, 0.0023660659790039062, 0.0030608177185058594, 0.0037555694580078125, 0.004450321197509766, 0.005145072937011719, 0.005839824676513672, 0.006534576416015625, 0.007229328155517578, 0.007924079895019531, 0.008618831634521484, 0.009313583374023438, 0.01000833511352539, 0.010703086853027344, 0.011397838592529297, 0.01209259033203125, 0.012787342071533203, 0.013482093811035156, 0.01417684555053711, 0.014871597290039062, 0.015566349029541016, 0.01626110076904297, 0.016955852508544922, 0.017650604248046875, 0.018345355987548828, 0.01904010772705078, 0.019734859466552734, 0.020429611206054688, 0.02112436294555664, 0.021819114685058594, 0.022513866424560547, 0.0232086181640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 2.0, 4.0, 8.0, 10.0, 9.0, 17.0, 20.0, 25.0, 43.0, 46.0, 62.0, 139.0, 244.0, 427.0, 753.0, 2751.0, 13727.0, 133467.0, 860111.0, 29893.0, 4464.0, 1067.0, 534.0, 273.0, 125.0, 119.0, 58.0, 38.0, 25.0, 33.0, 18.0, 3.0, 8.0, 6.0, 2.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.1622905731201172e-05, -1.1282972991466522e-05, -1.0943040251731873e-05, -1.0603107511997223e-05, -1.0263174772262573e-05, -9.923242032527924e-06, -9.583309292793274e-06, -9.243376553058624e-06, -8.903443813323975e-06, -8.563511073589325e-06, -8.223578333854675e-06, -7.883645594120026e-06, -7.543712854385376e-06, -7.203780114650726e-06, -6.863847374916077e-06, -6.523914635181427e-06, -6.183981895446777e-06, -5.844049155712128e-06, -5.504116415977478e-06, -5.164183676242828e-06, -4.824250936508179e-06, -4.484318196773529e-06, -4.144385457038879e-06, -3.8044527173042297e-06, -3.46451997756958e-06, -3.1245872378349304e-06, -2.7846544981002808e-06, -2.444721758365631e-06, -2.1047890186309814e-06, -1.7648562788963318e-06, -1.4249235391616821e-06, -1.0849907994270325e-06, -7.450580596923828e-07, -4.0512531995773315e-07, -6.51925802230835e-08, 2.7474015951156616e-07, 6.146728992462158e-07, 9.546056389808655e-07, 1.2945383787155151e-06, 1.6344711184501648e-06, 1.9744038581848145e-06, 2.314336597919464e-06, 2.6542693376541138e-06, 2.9942020773887634e-06, 3.334134817123413e-06, 3.6740675568580627e-06, 4.014000296592712e-06, 4.353933036327362e-06, 4.693865776062012e-06, 5.033798515796661e-06, 5.373731255531311e-06, 5.713663995265961e-06, 6.05359673500061e-06, 6.39352947473526e-06, 6.73346221446991e-06, 7.073394954204559e-06, 7.413327693939209e-06, 7.753260433673859e-06, 8.093193173408508e-06, 8.433125913143158e-06, 8.773058652877808e-06, 9.112991392612457e-06, 9.452924132347107e-06, 9.792856872081757e-06, 1.0132789611816406e-05]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 7.0, 11.0, 9.0, 13.0, 14.0, 46.0, 31.0, 37.0, 82.0, 68.0, 99.0, 105.0, 117.0, 62.0, 69.0, 73.0, 39.0, 47.0, 18.0, 10.0, 12.0, 11.0, 6.0, 4.0, 2.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.271766662597656e-06, -7.068738341331482e-06, -6.865710020065308e-06, -6.662681698799133e-06, -6.459653377532959e-06, -6.256625056266785e-06, -6.05359673500061e-06, -5.850568413734436e-06, -5.647540092468262e-06, -5.444511771202087e-06, -5.241483449935913e-06, -5.038455128669739e-06, -4.8354268074035645e-06, -4.63239848613739e-06, -4.429370164871216e-06, -4.2263418436050415e-06, -4.023313522338867e-06, -3.820285201072693e-06, -3.6172568798065186e-06, -3.4142285585403442e-06, -3.21120023727417e-06, -3.0081719160079956e-06, -2.8051435947418213e-06, -2.602115273475647e-06, -2.3990869522094727e-06, -2.1960586309432983e-06, -1.993030309677124e-06, -1.7900019884109497e-06, -1.5869736671447754e-06, -1.383945345878601e-06, -1.1809170246124268e-06, -9.778887033462524e-07, -7.748603820800781e-07, -5.718320608139038e-07, -3.688037395477295e-07, -1.6577541828155518e-07, 3.725290298461914e-08, 2.4028122425079346e-07, 4.4330954551696777e-07, 6.463378667831421e-07, 8.493661880493164e-07, 1.0523945093154907e-06, 1.255422830581665e-06, 1.4584511518478394e-06, 1.6614794731140137e-06, 1.864507794380188e-06, 2.0675361156463623e-06, 2.2705644369125366e-06, 2.473592758178711e-06, 2.6766210794448853e-06, 2.8796494007110596e-06, 3.082677721977234e-06, 3.285706043243408e-06, 3.4887343645095825e-06, 3.691762685775757e-06, 3.894791007041931e-06, 4.0978193283081055e-06, 4.30084764957428e-06, 4.503875970840454e-06, 4.706904292106628e-06, 4.909932613372803e-06, 5.112960934638977e-06, 5.315989255905151e-06, 5.519017577171326e-06, 5.7220458984375e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 9.0, 21.0, 19.0, 43.0, 57.0, 94.0, 184.0, 594.0, 3890.0, 1039782.0, 2927.0, 484.0, 193.0, 102.0, 46.0, 27.0, 36.0, 13.0, 8.0, 9.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6835670471191406e-05, -3.5585835576057434e-05, -3.433600068092346e-05, -3.308616578578949e-05, -3.183633089065552e-05, -3.0586495995521545e-05, -2.9336661100387573e-05, -2.80868262052536e-05, -2.683699131011963e-05, -2.5587156414985657e-05, -2.4337321519851685e-05, -2.3087486624717712e-05, -2.183765172958374e-05, -2.0587816834449768e-05, -1.9337981939315796e-05, -1.8088147044181824e-05, -1.683831214904785e-05, -1.558847725391388e-05, -1.4338642358779907e-05, -1.3088807463645935e-05, -1.1838972568511963e-05, -1.058913767337799e-05, -9.339302778244019e-06, -8.089467883110046e-06, -6.839632987976074e-06, -5.589798092842102e-06, -4.33996319770813e-06, -3.0901283025741577e-06, -1.8402934074401855e-06, -5.904585123062134e-07, 6.593763828277588e-07, 1.909211277961731e-06, 3.159046173095703e-06, 4.408881068229675e-06, 5.6587159633636475e-06, 6.90855085849762e-06, 8.158385753631592e-06, 9.408220648765564e-06, 1.0658055543899536e-05, 1.1907890439033508e-05, 1.315772533416748e-05, 1.4407560229301453e-05, 1.5657395124435425e-05, 1.6907230019569397e-05, 1.815706491470337e-05, 1.940689980983734e-05, 2.0656734704971313e-05, 2.1906569600105286e-05, 2.3156404495239258e-05, 2.440623939037323e-05, 2.5656074285507202e-05, 2.6905909180641174e-05, 2.8155744075775146e-05, 2.940557897090912e-05, 3.065541386604309e-05, 3.190524876117706e-05, 3.3155083656311035e-05, 3.440491855144501e-05, 3.565475344657898e-05, 3.690458834171295e-05, 3.8154423236846924e-05, 3.9404258131980896e-05, 4.065409302711487e-05, 4.190392792224884e-05, 4.315376281738281e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 11.0, 7.0, 9.0, 18.0, 31.0, 31.0, 58.0, 124.0, 138.0, 267.0, 118.0, 71.0, 41.0, 21.0, 14.0, 13.0, 15.0, 4.0, 8.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0384788513183594e-05, -1.965835690498352e-05, -1.8931925296783447e-05, -1.8205493688583374e-05, -1.74790620803833e-05, -1.6752630472183228e-05, -1.6026198863983154e-05, -1.529976725578308e-05, -1.4573335647583008e-05, -1.3846904039382935e-05, -1.3120472431182861e-05, -1.2394040822982788e-05, -1.1667609214782715e-05, -1.0941177606582642e-05, -1.0214745998382568e-05, -9.488314390182495e-06, -8.761882781982422e-06, -8.035451173782349e-06, -7.309019565582275e-06, -6.582587957382202e-06, -5.856156349182129e-06, -5.129724740982056e-06, -4.403293132781982e-06, -3.676861524581909e-06, -2.950429916381836e-06, -2.2239983081817627e-06, -1.4975666999816895e-06, -7.711350917816162e-07, -4.470348358154297e-08, 6.817281246185303e-07, 1.4081597328186035e-06, 2.1345913410186768e-06, 2.86102294921875e-06, 3.5874545574188232e-06, 4.3138861656188965e-06, 5.04031777381897e-06, 5.766749382019043e-06, 6.493180990219116e-06, 7.2196125984191895e-06, 7.946044206619263e-06, 8.672475814819336e-06, 9.39890742301941e-06, 1.0125339031219482e-05, 1.0851770639419556e-05, 1.1578202247619629e-05, 1.2304633855819702e-05, 1.3031065464019775e-05, 1.3757497072219849e-05, 1.4483928680419922e-05, 1.5210360288619995e-05, 1.593679189682007e-05, 1.666322350502014e-05, 1.7389655113220215e-05, 1.8116086721420288e-05, 1.884251832962036e-05, 1.9568949937820435e-05, 2.0295381546020508e-05, 2.102181315422058e-05, 2.1748244762420654e-05, 2.2474676370620728e-05, 2.32011079788208e-05, 2.3927539587020874e-05, 2.4653971195220947e-05, 2.538040280342102e-05, 2.6106834411621094e-05]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 8.0, 48.0, 735.0, 200.0, 20.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27395039796829224, -0.2670600414276123, -0.26016965508461, -0.25327929854393005, -0.24638892710208893, -0.2394985556602478, -0.23260819911956787, -0.22571782767772675, -0.21882745623588562, -0.2119370847940445, -0.20504672825336456, -0.19815635681152344, -0.1912659853696823, -0.1843756139278412, -0.17748525738716125, -0.17059488594532013, -0.163704514503479, -0.15681414306163788, -0.14992378652095795, -0.14303341507911682, -0.1361430436372757, -0.12925267219543457, -0.12236231565475464, -0.11547194421291351, -0.10858158767223358, -0.10169122368097305, -0.09480085223913193, -0.0879104882478714, -0.08102011680603027, -0.07412975281476974, -0.06723938882350922, -0.06034901738166809, -0.053458645939826965, -0.04656827822327614, -0.03967791050672531, -0.03278754651546478, -0.025897176936268806, -0.01900681108236313, -0.012116443365812302, -0.005226075649261475, 0.0016642920672893524, 0.00855465978384018, 0.015445026569068432, 0.022335393354296684, 0.02922576107084751, 0.03611612692475319, 0.043006494641304016, 0.04989686235785484, 0.05678723007440567, 0.0636775940656662, 0.07056796550750732, 0.07745832949876785, 0.08434870094060898, 0.0912390649318695, 0.09812943637371063, 0.10501980036497116, 0.11191016435623169, 0.11880052834749222, 0.12569089233875275, 0.13258126378059387, 0.139471635222435, 0.14636200666427612, 0.15325236320495605, 0.16014273464679718, 0.1670331060886383]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 7.0, 3.0, 8.0, 6.0, 5.0, 11.0, 10.0, 13.0, 14.0, 19.0, 28.0, 29.0, 37.0, 42.0, 45.0, 50.0, 57.0, 56.0, 62.0, 51.0, 43.0, 48.0, 40.0, 46.0, 35.0, 41.0, 33.0, 38.0, 23.0, 19.0, 20.0, 15.0, 14.0, 8.0, 6.0, 5.0, 3.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16866850852966309, -0.1637195497751236, -0.1587705910205841, -0.15382163226604462, -0.14887267351150513, -0.14392371475696564, -0.13897475600242615, -0.13402581214904785, -0.12907683849334717, -0.12412787973880768, -0.11917892098426819, -0.1142299622297287, -0.10928100347518921, -0.10433204472064972, -0.09938309341669083, -0.09443413466215134, -0.08948518335819244, -0.08453622460365295, -0.07958726584911346, -0.07463830709457397, -0.06968934834003448, -0.064740389585495, -0.0597914382815361, -0.05484247952699661, -0.04989352077245712, -0.04494456201791763, -0.03999560326337814, -0.03504664823412895, -0.030097689479589462, -0.025148730725049973, -0.020199773833155632, -0.015250816941261292, -0.010301858186721802, -0.005352900363504887, -0.0004039425402879715, 0.004545015282928944, 0.009493973106145859, 0.014442931860685349, 0.01939188875257969, 0.02434084564447403, 0.02928980439901352, 0.03423876315355301, 0.0391877219080925, 0.04413667693734169, 0.04908563569188118, 0.05403459444642067, 0.05898354947566986, 0.06393250823020935, 0.06888146698474884, 0.07383042573928833, 0.07877938449382782, 0.08372834324836731, 0.0886773020029068, 0.09362626075744629, 0.09857521206140518, 0.10352417081594467, 0.10847312957048416, 0.11342208832502365, 0.11837104707956314, 0.12332000583410263, 0.12826895713806152, 0.133217915892601, 0.1381668746471405, 0.14311583340168, 0.14806479215621948]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 2.0, 7.0, 13.0, 7.0, 10.0, 10.0, 25.0, 84.0, 207.0, 4163852.0, 29758.0, 136.0, 42.0, 16.0, 16.0, 12.0, 11.0, 6.0, 4.0, 5.0, 1.0, 6.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 2.0, 5.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09820556640625, -0.09469318389892578, -0.09118080139160156, -0.08766841888427734, -0.08415603637695312, -0.0806436538696289, -0.07713127136230469, -0.07361888885498047, -0.07010650634765625, -0.06659412384033203, -0.06308174133300781, -0.059569358825683594, -0.056056976318359375, -0.052544593811035156, -0.04903221130371094, -0.04551982879638672, -0.0420074462890625, -0.03849506378173828, -0.03498268127441406, -0.031470298767089844, -0.027957916259765625, -0.024445533752441406, -0.020933151245117188, -0.01742076873779297, -0.01390838623046875, -0.010396003723144531, -0.0068836212158203125, -0.0033712387084960938, 0.000141143798828125, 0.0036535263061523438, 0.0071659088134765625, 0.010678291320800781, 0.014190673828125, 0.01770305633544922, 0.021215438842773438, 0.024727821350097656, 0.028240203857421875, 0.031752586364746094, 0.03526496887207031, 0.03877735137939453, 0.04228973388671875, 0.04580211639404297, 0.04931449890136719, 0.052826881408691406, 0.056339263916015625, 0.059851646423339844, 0.06336402893066406, 0.06687641143798828, 0.0703887939453125, 0.07390117645263672, 0.07741355895996094, 0.08092594146728516, 0.08443832397460938, 0.0879507064819336, 0.09146308898925781, 0.09497547149658203, 0.09848785400390625, 0.10200023651123047, 0.10551261901855469, 0.1090250015258789, 0.11253738403320312, 0.11604976654052734, 0.11956214904785156, 0.12307453155517578, 0.1265869140625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 3.0, 5.0, 15.0, 7.0, 9.0, 8.0, 14.0, 70.0, 142.0, 281.0, 209.0, 99.0, 26.0, 8.0, 10.0, 10.0, 10.0, 9.0, 4.0, 5.0, 1.0, 4.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.007396697998046875, -0.007133066654205322, -0.0068694353103637695, -0.006605803966522217, -0.006342172622680664, -0.006078541278839111, -0.005814909934997559, -0.005551278591156006, -0.005287647247314453, -0.0050240159034729, -0.004760384559631348, -0.004496753215789795, -0.004233121871948242, -0.0039694905281066895, -0.0037058591842651367, -0.003442227840423584, -0.0031785964965820312, -0.0029149651527404785, -0.0026513338088989258, -0.002387702465057373, -0.0021240711212158203, -0.0018604397773742676, -0.0015968084335327148, -0.0013331770896911621, -0.0010695457458496094, -0.0008059144020080566, -0.0005422830581665039, -0.00027865171432495117, -1.5020370483398438e-05, 0.0002486109733581543, 0.000512242317199707, 0.0007758736610412598, 0.0010395050048828125, 0.0013031363487243652, 0.001566767692565918, 0.0018303990364074707, 0.0020940303802490234, 0.002357661724090576, 0.002621293067932129, 0.0028849244117736816, 0.0031485557556152344, 0.003412187099456787, 0.00367581844329834, 0.003939449787139893, 0.004203081130981445, 0.004466712474822998, 0.004730343818664551, 0.0049939751625061035, 0.005257606506347656, 0.005521237850189209, 0.005784869194030762, 0.0060485005378723145, 0.006312131881713867, 0.00657576322555542, 0.006839394569396973, 0.007103025913238525, 0.007366657257080078, 0.007630288600921631, 0.007893919944763184, 0.008157551288604736, 0.008421182632446289, 0.008684813976287842, 0.008948445320129395, 0.009212076663970947, 0.0094757080078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 9.0, 13.0, 23.0, 75.0, 202.0, 721.0, 6143.0, 4179271.0, 6784.0, 722.0, 190.0, 62.0, 27.0, 11.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018585205078125, -0.017976045608520508, -0.017366886138916016, -0.016757726669311523, -0.01614856719970703, -0.015539407730102539, -0.014930248260498047, -0.014321088790893555, -0.013711929321289062, -0.01310276985168457, -0.012493610382080078, -0.011884450912475586, -0.011275291442871094, -0.010666131973266602, -0.01005697250366211, -0.009447813034057617, -0.008838653564453125, -0.008229494094848633, -0.007620334625244141, -0.0070111751556396484, -0.006402015686035156, -0.005792856216430664, -0.005183696746826172, -0.00457453727722168, -0.0039653778076171875, -0.0033562183380126953, -0.002747058868408203, -0.002137899398803711, -0.0015287399291992188, -0.0009195804595947266, -0.0003104209899902344, 0.0002987384796142578, 0.00090789794921875, 0.0015170574188232422, 0.0021262168884277344, 0.0027353763580322266, 0.0033445358276367188, 0.003953695297241211, 0.004562854766845703, 0.005172014236450195, 0.0057811737060546875, 0.00639033317565918, 0.006999492645263672, 0.007608652114868164, 0.008217811584472656, 0.008826971054077148, 0.00943613052368164, 0.010045289993286133, 0.010654449462890625, 0.011263608932495117, 0.01187276840209961, 0.012481927871704102, 0.013091087341308594, 0.013700246810913086, 0.014309406280517578, 0.01491856575012207, 0.015527725219726562, 0.016136884689331055, 0.016746044158935547, 0.01735520362854004, 0.01796436309814453, 0.018573522567749023, 0.019182682037353516, 0.019791841506958008, 0.0204010009765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 12.0, 19.0, 37.0, 90.0, 193.0, 2958.0, 528.0, 128.0, 56.0, 29.0, 9.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00806427001953125, -0.007861495018005371, -0.007658720016479492, -0.007455945014953613, -0.007253170013427734, -0.0070503950119018555, -0.0068476200103759766, -0.006644845008850098, -0.006442070007324219, -0.00623929500579834, -0.006036520004272461, -0.005833745002746582, -0.005630970001220703, -0.005428194999694824, -0.005225419998168945, -0.005022644996643066, -0.0048198699951171875, -0.004617094993591309, -0.00441431999206543, -0.004211544990539551, -0.004008769989013672, -0.003805994987487793, -0.003603219985961914, -0.003400444984436035, -0.0031976699829101562, -0.0029948949813842773, -0.0027921199798583984, -0.0025893449783325195, -0.0023865699768066406, -0.0021837949752807617, -0.001981019973754883, -0.001778244972229004, -0.001575469970703125, -0.001372694969177246, -0.0011699199676513672, -0.0009671449661254883, -0.0007643699645996094, -0.0005615949630737305, -0.00035881996154785156, -0.00015604496002197266, 4.673004150390625e-05, 0.00024950504302978516, 0.00045228004455566406, 0.000655055046081543, 0.0008578300476074219, 0.0010606050491333008, 0.0012633800506591797, 0.0014661550521850586, 0.0016689300537109375, 0.0018717050552368164, 0.0020744800567626953, 0.0022772550582885742, 0.002480030059814453, 0.002682805061340332, 0.002885580062866211, 0.00308835506439209, 0.0032911300659179688, 0.0034939050674438477, 0.0036966800689697266, 0.0038994550704956055, 0.004102230072021484, 0.004305005073547363, 0.004507780075073242, 0.004710555076599121, 0.004913330078125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [107.0, 909.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004444257356226444, -0.00020800484344363213, 0.00402824766933918, 0.008264499716460705, 0.012500752694904804, 0.01673700660467148, 0.02097325772047043, 0.02520950883626938, 0.029445763677358627, 0.03368201479315758, 0.037918269634246826, 0.042154520750045776, 0.04639077186584473, 0.050627026706933975, 0.054863277822732925, 0.059099532663822174, 0.06333578377962112, 0.06757203489542007, 0.07180828601121902, 0.07604454457759857, 0.08028079569339752, 0.08451704680919647, 0.08875329792499542, 0.09298954904079437, 0.09722580015659332, 0.10146205127239227, 0.10569830238819122, 0.10993455350399017, 0.11417081207036972, 0.11840706318616867, 0.12264331430196762, 0.12687957286834717, 0.13111580908298492, 0.13535206019878387, 0.13958831131458282, 0.14382456243038177, 0.14806081354618073, 0.15229707956314087, 0.15653333067893982, 0.16076958179473877, 0.16500583291053772, 0.16924208402633667, 0.17347833514213562, 0.17771458625793457, 0.18195083737373352, 0.18618708848953247, 0.19042333960533142, 0.19465960562229156, 0.19889584183692932, 0.20313209295272827, 0.20736834406852722, 0.21160459518432617, 0.21584084630012512, 0.22007709741592407, 0.22431334853172302, 0.22854961454868317, 0.23278586566448212, 0.23702211678028107, 0.24125836789608002, 0.24549461901187897, 0.24973087012767792, 0.25396713614463806, 0.258203387260437, 0.26243963837623596, 0.2666758894920349]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 4.0, 4.0, 2.0, 2.0, 4.0, 7.0, 6.0, 14.0, 13.0, 19.0, 17.0, 21.0, 23.0, 27.0, 40.0, 35.0, 57.0, 44.0, 65.0, 55.0, 45.0, 47.0, 54.0, 50.0, 50.0, 36.0, 37.0, 40.0, 29.0, 26.0, 33.0, 21.0, 10.0, 21.0, 11.0, 9.0, 14.0, 4.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008043885231018066, -0.007724401541054249, -0.007404917851090431, -0.007085434161126614, -0.006765950471162796, -0.006446466781198978, -0.006126983091235161, -0.005807499401271343, -0.005488015711307526, -0.005168532021343708, -0.0048490483313798904, -0.004529564641416073, -0.004210080951452255, -0.0038905972614884377, -0.00357111357152462, -0.0032516298815608025, -0.002932146191596985, -0.0026126625016331673, -0.0022931788116693497, -0.001973695121705532, -0.0016542114317417145, -0.0013347277417778969, -0.0010152440518140793, -0.0006957603618502617, -0.0003762766718864441, -5.6792981922626495e-05, 0.0002626907080411911, 0.0005821743980050087, 0.0009016580879688263, 0.0012211417779326439, 0.0015406254678964615, 0.001860109157860279, 0.0021795928478240967, 0.0024990765377879143, 0.002818560227751732, 0.0031380439177155495, 0.003457527607679367, 0.0037770112976431847, 0.004096494987607002, 0.00441597867757082, 0.0047354623675346375, 0.005054946057498455, 0.005374429747462273, 0.00569391343742609, 0.006013397127389908, 0.006332880817353725, 0.006652364507317543, 0.006971848197281361, 0.007291331887245178, 0.007610815577208996, 0.007930299267172813, 0.008249782957136631, 0.008569266647100449, 0.008888750337064266, 0.009208234027028084, 0.009527717716991901, 0.009847201406955719, 0.010166685096919537, 0.010486168786883354, 0.010805652476847172, 0.01112513616681099, 0.011444619856774807, 0.011764103546738625, 0.012083587236702442, 0.01240307092666626]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 8.0, 9.0, 12.0, 18.0, 24.0, 32.0, 38.0, 42.0, 77.0, 114.0, 156.0, 217.0, 372.0, 547.0, 887.0, 1380.0, 2521.0, 4589.0, 9715.0, 27367.0, 813729.0, 151509.0, 18309.0, 7676.0, 3661.0, 2044.0, 1185.0, 752.0, 508.0, 319.0, 197.0, 176.0, 106.0, 80.0, 40.0, 28.0, 29.0, 19.0, 15.0, 14.0, 6.0, 9.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.01155853271484375, -0.011236071586608887, -0.010913610458374023, -0.01059114933013916, -0.010268688201904297, -0.009946227073669434, -0.00962376594543457, -0.009301304817199707, -0.008978843688964844, -0.00865638256072998, -0.008333921432495117, -0.008011460304260254, -0.007688999176025391, -0.007366538047790527, -0.007044076919555664, -0.006721615791320801, -0.0063991546630859375, -0.006076693534851074, -0.005754232406616211, -0.005431771278381348, -0.005109310150146484, -0.004786849021911621, -0.004464387893676758, -0.0041419267654418945, -0.0038194656372070312, -0.003497004508972168, -0.0031745433807373047, -0.0028520822525024414, -0.002529621124267578, -0.002207159996032715, -0.0018846988677978516, -0.0015622377395629883, -0.001239776611328125, -0.0009173154830932617, -0.0005948543548583984, -0.00027239322662353516, 5.0067901611328125e-05, 0.0003725290298461914, 0.0006949901580810547, 0.001017451286315918, 0.0013399124145507812, 0.0016623735427856445, 0.001984834671020508, 0.002307295799255371, 0.0026297569274902344, 0.0029522180557250977, 0.003274679183959961, 0.0035971403121948242, 0.0039196014404296875, 0.004242062568664551, 0.004564523696899414, 0.004886984825134277, 0.005209445953369141, 0.005531907081604004, 0.005854368209838867, 0.0061768293380737305, 0.006499290466308594, 0.006821751594543457, 0.00714421272277832, 0.007466673851013184, 0.007789134979248047, 0.00811159610748291, 0.008434057235717773, 0.008756518363952637, 0.0090789794921875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 5.0, 3.0, 6.0, 14.0, 7.0, 8.0, 9.0, 14.0, 70.0, 149.0, 278.0, 209.0, 96.0, 25.0, 8.0, 10.0, 11.0, 9.0, 9.0, 4.0, 5.0, 1.0, 4.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00738525390625, -0.0071218013763427734, -0.006858348846435547, -0.00659489631652832, -0.006331443786621094, -0.006067991256713867, -0.005804538726806641, -0.005541086196899414, -0.0052776336669921875, -0.005014181137084961, -0.004750728607177734, -0.004487276077270508, -0.004223823547363281, -0.003960371017456055, -0.003696918487548828, -0.0034334659576416016, -0.003170013427734375, -0.0029065608978271484, -0.002643108367919922, -0.0023796558380126953, -0.0021162033081054688, -0.0018527507781982422, -0.0015892982482910156, -0.001325845718383789, -0.0010623931884765625, -0.0007989406585693359, -0.0005354881286621094, -0.0002720355987548828, -8.58306884765625e-06, 0.0002548694610595703, 0.0005183219909667969, 0.0007817745208740234, 0.00104522705078125, 0.0013086795806884766, 0.0015721321105957031, 0.0018355846405029297, 0.0020990371704101562, 0.002362489700317383, 0.0026259422302246094, 0.002889394760131836, 0.0031528472900390625, 0.003416299819946289, 0.0036797523498535156, 0.003943204879760742, 0.004206657409667969, 0.004470109939575195, 0.004733562469482422, 0.0049970149993896484, 0.005260467529296875, 0.0055239200592041016, 0.005787372589111328, 0.006050825119018555, 0.006314277648925781, 0.006577730178833008, 0.006841182708740234, 0.007104635238647461, 0.0073680877685546875, 0.007631540298461914, 0.00789499282836914, 0.008158445358276367, 0.008421897888183594, 0.00868535041809082, 0.008948802947998047, 0.009212255477905273, 0.0094757080078125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 10.0, 7.0, 14.0, 24.0, 17.0, 17.0, 31.0, 35.0, 32.0, 61.0, 100.0, 118.0, 137.0, 187.0, 308.0, 576.0, 1068.0, 4259.0, 799459.0, 236536.0, 3050.0, 939.0, 471.0, 309.0, 191.0, 151.0, 100.0, 95.0, 63.0, 41.0, 28.0, 29.0, 16.0, 15.0, 17.0, 10.0, 10.0, 6.0, 2.0, 1.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02581787109375, -0.02503371238708496, -0.024249553680419922, -0.023465394973754883, -0.022681236267089844, -0.021897077560424805, -0.021112918853759766, -0.020328760147094727, -0.019544601440429688, -0.01876044273376465, -0.01797628402709961, -0.01719212532043457, -0.01640796661376953, -0.015623807907104492, -0.014839649200439453, -0.014055490493774414, -0.013271331787109375, -0.012487173080444336, -0.011703014373779297, -0.010918855667114258, -0.010134696960449219, -0.00935053825378418, -0.00856637954711914, -0.0077822208404541016, -0.0069980621337890625, -0.0062139034271240234, -0.005429744720458984, -0.004645586013793945, -0.0038614273071289062, -0.003077268600463867, -0.002293109893798828, -0.001508951187133789, -0.00072479248046875, 5.936622619628906e-05, 0.0008435249328613281, 0.0016276836395263672, 0.0024118423461914062, 0.0031960010528564453, 0.003980159759521484, 0.0047643184661865234, 0.0055484771728515625, 0.0063326358795166016, 0.007116794586181641, 0.00790095329284668, 0.008685111999511719, 0.009469270706176758, 0.010253429412841797, 0.011037588119506836, 0.011821746826171875, 0.012605905532836914, 0.013390064239501953, 0.014174222946166992, 0.014958381652832031, 0.01574254035949707, 0.01652669906616211, 0.01731085777282715, 0.018095016479492188, 0.018879175186157227, 0.019663333892822266, 0.020447492599487305, 0.021231651306152344, 0.022015810012817383, 0.022799968719482422, 0.02358412742614746, 0.0243682861328125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 10.0, 6.0, 13.0, 20.0, 13.0, 10.0, 19.0, 21.0, 19.0, 27.0, 40.0, 36.0, 37.0, 26.0, 38.0, 36.0, 44.0, 58.0, 39.0, 43.0, 34.0, 35.0, 38.0, 44.0, 40.0, 50.0, 25.0, 32.0, 24.0, 17.0, 19.0, 19.0, 10.0, 9.0, 15.0, 7.0, 8.0, 5.0, 1.0, 1.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.022247314453125, -0.02157115936279297, -0.020895004272460938, -0.020218849182128906, -0.019542694091796875, -0.018866539001464844, -0.018190383911132812, -0.01751422882080078, -0.01683807373046875, -0.01616191864013672, -0.015485763549804688, -0.014809608459472656, -0.014133453369140625, -0.013457298278808594, -0.012781143188476562, -0.012104988098144531, -0.0114288330078125, -0.010752677917480469, -0.010076522827148438, -0.009400367736816406, -0.008724212646484375, -0.008048057556152344, -0.0073719024658203125, -0.006695747375488281, -0.00601959228515625, -0.005343437194824219, -0.0046672821044921875, -0.003991127014160156, -0.003314971923828125, -0.0026388168334960938, -0.0019626617431640625, -0.0012865066528320312, -0.0006103515625, 6.580352783203125e-05, 0.0007419586181640625, 0.0014181137084960938, 0.002094268798828125, 0.0027704238891601562, 0.0034465789794921875, 0.004122734069824219, 0.00479888916015625, 0.005475044250488281, 0.0061511993408203125, 0.006827354431152344, 0.007503509521484375, 0.008179664611816406, 0.008855819702148438, 0.009531974792480469, 0.0102081298828125, 0.010884284973144531, 0.011560440063476562, 0.012236595153808594, 0.012912750244140625, 0.013588905334472656, 0.014265060424804688, 0.014941215515136719, 0.01561737060546875, 0.01629352569580078, 0.016969680786132812, 0.017645835876464844, 0.018321990966796875, 0.018998146057128906, 0.019674301147460938, 0.02035045623779297, 0.021026611328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 8.0, 4.0, 8.0, 11.0, 23.0, 15.0, 22.0, 42.0, 37.0, 109.0, 86.0, 112.0, 298.0, 323.0, 1054.0, 1839.0, 15046.0, 147643.0, 836544.0, 39231.0, 3178.0, 1544.0, 444.0, 371.0, 175.0, 99.0, 97.0, 46.0, 43.0, 20.0, 17.0, 24.0, 6.0, 4.0, 7.0, 5.0, 7.0, 7.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.649162292480469e-06, -4.50480729341507e-06, -4.36045229434967e-06, -4.216097295284271e-06, -4.071742296218872e-06, -3.927387297153473e-06, -3.7830322980880737e-06, -3.6386772990226746e-06, -3.4943222999572754e-06, -3.3499673008918762e-06, -3.205612301826477e-06, -3.061257302761078e-06, -2.9169023036956787e-06, -2.7725473046302795e-06, -2.6281923055648804e-06, -2.483837306499481e-06, -2.339482307434082e-06, -2.195127308368683e-06, -2.0507723093032837e-06, -1.9064173102378845e-06, -1.7620623111724854e-06, -1.6177073121070862e-06, -1.473352313041687e-06, -1.3289973139762878e-06, -1.1846423149108887e-06, -1.0402873158454895e-06, -8.959323167800903e-07, -7.515773177146912e-07, -6.07222318649292e-07, -4.628673195838928e-07, -3.1851232051849365e-07, -1.7415732145309448e-07, -2.9802322387695312e-08, 1.1455267667770386e-07, 2.5890767574310303e-07, 4.032626748085022e-07, 5.476176738739014e-07, 6.919726729393005e-07, 8.363276720046997e-07, 9.806826710700989e-07, 1.125037670135498e-06, 1.2693926692008972e-06, 1.4137476682662964e-06, 1.5581026673316956e-06, 1.7024576663970947e-06, 1.846812665462494e-06, 1.991167664527893e-06, 2.1355226635932922e-06, 2.2798776626586914e-06, 2.4242326617240906e-06, 2.5685876607894897e-06, 2.712942659854889e-06, 2.857297658920288e-06, 3.0016526579856873e-06, 3.1460076570510864e-06, 3.2903626561164856e-06, 3.4347176551818848e-06, 3.579072654247284e-06, 3.723427653312683e-06, 3.867782652378082e-06, 4.0121376514434814e-06, 4.156492650508881e-06, 4.30084764957428e-06, 4.445202648639679e-06, 4.589557647705078e-06]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 2.0, 4.0, 3.0, 6.0, 9.0, 5.0, 17.0, 9.0, 17.0, 18.0, 28.0, 19.0, 40.0, 17.0, 39.0, 23.0, 61.0, 19.0, 64.0, 34.0, 91.0, 80.0, 38.0, 68.0, 15.0, 47.0, 29.0, 33.0, 18.0, 38.0, 17.0, 19.0, 7.0, 12.0, 6.0, 9.0, 8.0, 1.0, 2.0, 2.0, 7.0, 2.0, 5.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.9206275939941406e-06, -2.8293579816818237e-06, -2.738088369369507e-06, -2.64681875705719e-06, -2.555549144744873e-06, -2.464279532432556e-06, -2.3730099201202393e-06, -2.2817403078079224e-06, -2.1904706954956055e-06, -2.0992010831832886e-06, -2.0079314708709717e-06, -1.9166618585586548e-06, -1.8253922462463379e-06, -1.734122633934021e-06, -1.642853021621704e-06, -1.5515834093093872e-06, -1.4603137969970703e-06, -1.3690441846847534e-06, -1.2777745723724365e-06, -1.1865049600601196e-06, -1.0952353477478027e-06, -1.0039657354354858e-06, -9.126961231231689e-07, -8.21426510810852e-07, -7.301568984985352e-07, -6.388872861862183e-07, -5.476176738739014e-07, -4.5634806156158447e-07, -3.650784492492676e-07, -2.738088369369507e-07, -1.825392246246338e-07, -9.12696123123169e-08, 0.0, 9.12696123123169e-08, 1.825392246246338e-07, 2.738088369369507e-07, 3.650784492492676e-07, 4.5634806156158447e-07, 5.476176738739014e-07, 6.388872861862183e-07, 7.301568984985352e-07, 8.21426510810852e-07, 9.126961231231689e-07, 1.0039657354354858e-06, 1.0952353477478027e-06, 1.1865049600601196e-06, 1.2777745723724365e-06, 1.3690441846847534e-06, 1.4603137969970703e-06, 1.5515834093093872e-06, 1.642853021621704e-06, 1.734122633934021e-06, 1.8253922462463379e-06, 1.9166618585586548e-06, 2.0079314708709717e-06, 2.0992010831832886e-06, 2.1904706954956055e-06, 2.2817403078079224e-06, 2.3730099201202393e-06, 2.464279532432556e-06, 2.555549144744873e-06, 2.64681875705719e-06, 2.738088369369507e-06, 2.8293579816818237e-06, 2.9206275939941406e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 4.0, 15.0, 19.0, 27.0, 51.0, 78.0, 167.0, 415.0, 3803.0, 1040571.0, 2588.0, 452.0, 148.0, 84.0, 45.0, 29.0, 20.0, 7.0, 7.0, 2.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5795230865478516e-05, -1.5174970030784607e-05, -1.4554709196090698e-05, -1.393444836139679e-05, -1.3314187526702881e-05, -1.2693926692008972e-05, -1.2073665857315063e-05, -1.1453405022621155e-05, -1.0833144187927246e-05, -1.0212883353233337e-05, -9.592622518539429e-06, -8.97236168384552e-06, -8.352100849151611e-06, -7.731840014457703e-06, -7.111579179763794e-06, -6.491318345069885e-06, -5.8710575103759766e-06, -5.250796675682068e-06, -4.630535840988159e-06, -4.0102750062942505e-06, -3.390014171600342e-06, -2.769753336906433e-06, -2.1494925022125244e-06, -1.5292316675186157e-06, -9.08970832824707e-07, -2.8870999813079834e-07, 3.3155083656311035e-07, 9.51811671257019e-07, 1.5720725059509277e-06, 2.1923333406448364e-06, 2.812594175338745e-06, 3.432855010032654e-06, 4.0531158447265625e-06, 4.673376679420471e-06, 5.29363751411438e-06, 5.9138983488082886e-06, 6.534159183502197e-06, 7.154420018196106e-06, 7.774680852890015e-06, 8.394941687583923e-06, 9.015202522277832e-06, 9.63546335697174e-06, 1.025572419166565e-05, 1.0875985026359558e-05, 1.1496245861053467e-05, 1.2116506695747375e-05, 1.2736767530441284e-05, 1.3357028365135193e-05, 1.3977289199829102e-05, 1.459755003452301e-05, 1.5217810869216919e-05, 1.5838071703910828e-05, 1.6458332538604736e-05, 1.7078593373298645e-05, 1.7698854207992554e-05, 1.8319115042686462e-05, 1.893937587738037e-05, 1.955963671207428e-05, 2.017989754676819e-05, 2.0800158381462097e-05, 2.1420419216156006e-05, 2.2040680050849915e-05, 2.2660940885543823e-05, 2.3281201720237732e-05, 2.390146255493164e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 4.0, 8.0, 10.0, 9.0, 25.0, 30.0, 42.0, 67.0, 81.0, 481.0, 78.0, 55.0, 32.0, 23.0, 21.0, 6.0, 10.0, 5.0, 5.0, 1.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3589859008789062e-05, -1.3055279850959778e-05, -1.2520700693130493e-05, -1.1986121535301208e-05, -1.1451542377471924e-05, -1.091696321964264e-05, -1.0382384061813354e-05, -9.84780490398407e-06, -9.313225746154785e-06, -8.7786465883255e-06, -8.244067430496216e-06, -7.709488272666931e-06, -7.1749091148376465e-06, -6.640329957008362e-06, -6.105750799179077e-06, -5.5711716413497925e-06, -5.036592483520508e-06, -4.502013325691223e-06, -3.9674341678619385e-06, -3.432855010032654e-06, -2.898275852203369e-06, -2.3636966943740845e-06, -1.8291175365447998e-06, -1.2945383787155151e-06, -7.599592208862305e-07, -2.253800630569458e-07, 3.0919909477233887e-07, 8.437782526016235e-07, 1.3783574104309082e-06, 1.912936568260193e-06, 2.4475157260894775e-06, 2.982094883918762e-06, 3.516674041748047e-06, 4.0512531995773315e-06, 4.585832357406616e-06, 5.120411515235901e-06, 5.6549906730651855e-06, 6.18956983089447e-06, 6.724148988723755e-06, 7.2587281465530396e-06, 7.793307304382324e-06, 8.327886462211609e-06, 8.862465620040894e-06, 9.397044777870178e-06, 9.931623935699463e-06, 1.0466203093528748e-05, 1.1000782251358032e-05, 1.1535361409187317e-05, 1.2069940567016602e-05, 1.2604519724845886e-05, 1.3139098882675171e-05, 1.3673678040504456e-05, 1.420825719833374e-05, 1.4742836356163025e-05, 1.527741551399231e-05, 1.5811994671821594e-05, 1.634657382965088e-05, 1.6881152987480164e-05, 1.7415732145309448e-05, 1.7950311303138733e-05, 1.8484890460968018e-05, 1.9019469618797302e-05, 1.9554048776626587e-05, 2.008862793445587e-05, 2.0623207092285156e-05]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 104.0, 878.0, 27.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07476025819778442, -0.06575579941272736, -0.05675134062767029, -0.04774687811732292, -0.038742419332265854, -0.029737960547208786, -0.02073349803686142, -0.011729039251804352, -0.002724580466747284, 0.0062798792496323586, 0.015284338966012001, 0.024288799613714218, 0.033293258398771286, 0.042297717183828354, 0.05130217969417572, 0.06030663847923279, 0.06931109726428986, 0.07831555604934692, 0.08732001483440399, 0.09632447361946106, 0.10532893240451813, 0.1143333911895752, 0.12333785742521286, 0.13234230875968933, 0.1413467824459076, 0.15035124123096466, 0.15935570001602173, 0.1683601588010788, 0.17736461758613586, 0.18636907637119293, 0.19537353515625, 0.20437800884246826, 0.21338245272636414, 0.2223869115114212, 0.23139137029647827, 0.24039582908153534, 0.2494002878665924, 0.25840476155281067, 0.26740920543670654, 0.2764136791229248, 0.2854181230068207, 0.29442259669303894, 0.3034270405769348, 0.3124315142631531, 0.32143595814704895, 0.3304404318332672, 0.3394448757171631, 0.34844934940338135, 0.3574538230895996, 0.36645829677581787, 0.37546274065971375, 0.384467214345932, 0.3934716582298279, 0.40247613191604614, 0.411480575799942, 0.4204850494861603, 0.42948949337005615, 0.4384939670562744, 0.4474984109401703, 0.45650288462638855, 0.4655073285102844, 0.4745118021965027, 0.48351624608039856, 0.4925207197666168, 0.5015251636505127]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 8.0, 7.0, 6.0, 9.0, 12.0, 10.0, 17.0, 15.0, 14.0, 25.0, 23.0, 31.0, 41.0, 34.0, 40.0, 37.0, 54.0, 56.0, 49.0, 44.0, 54.0, 55.0, 38.0, 41.0, 29.0, 35.0, 23.0, 28.0, 26.0, 24.0, 18.0, 24.0, 13.0, 13.0, 8.0, 9.0, 9.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12279540300369263, -0.11929187923669815, -0.11578836292028427, -0.1122848391532898, -0.10878132283687592, -0.10527779906988144, -0.10177427530288696, -0.09827075898647308, -0.09476723521947861, -0.09126371145248413, -0.08776019513607025, -0.08425667136907578, -0.0807531476020813, -0.07724963128566742, -0.07374610751867294, -0.07024258375167847, -0.06673906743526459, -0.06323554366827011, -0.05973202735185623, -0.056228503584861755, -0.05272498354315758, -0.0492214635014534, -0.04571793973445892, -0.042214419692754745, -0.03871089965105057, -0.03520737960934639, -0.03170385956764221, -0.028200335800647736, -0.024696815758943558, -0.02119329571723938, -0.017689773812890053, -0.014186251908540726, -0.010682731866836548, -0.007179210893809795, -0.003675689920783043, -0.00017216894775629044, 0.003331352025270462, 0.00683487206697464, 0.010338393971323967, 0.013841915875673294, 0.017345435917377472, 0.02084895595908165, 0.024352477863430977, 0.027855999767780304, 0.03135951980948448, 0.03486303985118866, 0.038366563618183136, 0.041870083659887314, 0.04537360370159149, 0.04887712374329567, 0.05238064378499985, 0.055884167551994324, 0.0593876875936985, 0.06289120763540268, 0.06639473140239716, 0.06989824771881104, 0.07340177148580551, 0.07690529525279999, 0.08040881156921387, 0.08391233533620834, 0.08741585910320282, 0.0909193754196167, 0.09442289918661118, 0.09792642295360565, 0.10142993927001953]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 2.0, 4.0, 16.0, 5.0, 11.0, 6.0, 21.0, 88.0, 498.0, 12074.0, 4180730.0, 613.0, 76.0, 27.0, 11.0, 12.0, 12.0, 6.0, 5.0, 6.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0277099609375, -0.026724815368652344, -0.025739669799804688, -0.02475452423095703, -0.023769378662109375, -0.02278423309326172, -0.021799087524414062, -0.020813941955566406, -0.01982879638671875, -0.018843650817871094, -0.017858505249023438, -0.01687335968017578, -0.015888214111328125, -0.014903068542480469, -0.013917922973632812, -0.012932777404785156, -0.0119476318359375, -0.010962486267089844, -0.009977340698242188, -0.008992195129394531, -0.008007049560546875, -0.007021903991699219, -0.0060367584228515625, -0.005051612854003906, -0.00406646728515625, -0.0030813217163085938, -0.0020961761474609375, -0.0011110305786132812, -0.000125885009765625, 0.0008592605590820312, 0.0018444061279296875, 0.0028295516967773438, 0.003814697265625, 0.004799842834472656, 0.0057849884033203125, 0.006770133972167969, 0.007755279541015625, 0.008740425109863281, 0.009725570678710938, 0.010710716247558594, 0.01169586181640625, 0.012681007385253906, 0.013666152954101562, 0.014651298522949219, 0.015636444091796875, 0.01662158966064453, 0.017606735229492188, 0.018591880798339844, 0.0195770263671875, 0.020562171936035156, 0.021547317504882812, 0.02253246307373047, 0.023517608642578125, 0.02450275421142578, 0.025487899780273438, 0.026473045349121094, 0.02745819091796875, 0.028443336486816406, 0.029428482055664062, 0.03041362762451172, 0.031398773193359375, 0.03238391876220703, 0.03336906433105469, 0.034354209899902344, 0.03533935546875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 6.0, 2.0, 3.0, 16.0, 6.0, 10.0, 6.0, 15.0, 54.0, 118.0, 265.0, 233.0, 116.0, 37.0, 14.0, 7.0, 12.0, 10.0, 9.0, 5.0, 6.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007404327392578125, -0.007142364978790283, -0.006880402565002441, -0.0066184401512146, -0.006356477737426758, -0.006094515323638916, -0.005832552909851074, -0.005570590496063232, -0.005308628082275391, -0.005046665668487549, -0.004784703254699707, -0.004522740840911865, -0.0042607784271240234, -0.003998816013336182, -0.00373685359954834, -0.003474891185760498, -0.0032129287719726562, -0.0029509663581848145, -0.0026890039443969727, -0.002427041530609131, -0.002165079116821289, -0.0019031167030334473, -0.0016411542892456055, -0.0013791918754577637, -0.0011172294616699219, -0.0008552670478820801, -0.0005933046340942383, -0.0003313422203063965, -6.937980651855469e-05, 0.0001925826072692871, 0.0004545450210571289, 0.0007165074348449707, 0.0009784698486328125, 0.0012404322624206543, 0.001502394676208496, 0.0017643570899963379, 0.0020263195037841797, 0.0022882819175720215, 0.0025502443313598633, 0.002812206745147705, 0.003074169158935547, 0.0033361315727233887, 0.0035980939865112305, 0.0038600564002990723, 0.004122018814086914, 0.004383981227874756, 0.004645943641662598, 0.0049079060554504395, 0.005169868469238281, 0.005431830883026123, 0.005693793296813965, 0.005955755710601807, 0.0062177181243896484, 0.00647968053817749, 0.006741642951965332, 0.007003605365753174, 0.007265567779541016, 0.007527530193328857, 0.007789492607116699, 0.008051455020904541, 0.008313417434692383, 0.008575379848480225, 0.008837342262268066, 0.009099304676055908, 0.00936126708984375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 9.0, 11.0, 4.0, 22.0, 22.0, 44.0, 56.0, 209.0, 646.0, 2926.0, 27620.0, 4148640.0, 11572.0, 1730.0, 454.0, 136.0, 73.0, 18.0, 22.0, 16.0, 11.0, 8.0, 3.0, 6.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0074310302734375, -0.007214725017547607, -0.006998419761657715, -0.006782114505767822, -0.00656580924987793, -0.006349503993988037, -0.0061331987380981445, -0.005916893482208252, -0.005700588226318359, -0.005484282970428467, -0.005267977714538574, -0.005051672458648682, -0.004835367202758789, -0.0046190619468688965, -0.004402756690979004, -0.004186451435089111, -0.003970146179199219, -0.003753840923309326, -0.0035375356674194336, -0.003321230411529541, -0.0031049251556396484, -0.002888619899749756, -0.0026723146438598633, -0.0024560093879699707, -0.002239704132080078, -0.0020233988761901855, -0.001807093620300293, -0.0015907883644104004, -0.0013744831085205078, -0.0011581778526306152, -0.0009418725967407227, -0.0007255673408508301, -0.0005092620849609375, -0.0002929568290710449, -7.665157318115234e-05, 0.00013965368270874023, 0.0003559589385986328, 0.0005722641944885254, 0.000788569450378418, 0.0010048747062683105, 0.0012211799621582031, 0.0014374852180480957, 0.0016537904739379883, 0.0018700957298278809, 0.0020864009857177734, 0.002302706241607666, 0.0025190114974975586, 0.002735316753387451, 0.0029516220092773438, 0.0031679272651672363, 0.003384232521057129, 0.0036005377769470215, 0.003816843032836914, 0.004033148288726807, 0.004249453544616699, 0.004465758800506592, 0.004682064056396484, 0.004898369312286377, 0.0051146745681762695, 0.005330979824066162, 0.005547285079956055, 0.005763590335845947, 0.00597989559173584, 0.006196200847625732, 0.006412506103515625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 4.0, 7.0, 8.0, 3.0, 7.0, 15.0, 25.0, 36.0, 162.0, 3526.0, 152.0, 43.0, 23.0, 17.0, 11.0, 10.0, 3.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002166748046875, -0.0020933449268341064, -0.002019941806793213, -0.0019465386867523193, -0.0018731355667114258, -0.0017997324466705322, -0.0017263293266296387, -0.0016529262065887451, -0.0015795230865478516, -0.001506119966506958, -0.0014327168464660645, -0.001359313726425171, -0.0012859106063842773, -0.0012125074863433838, -0.0011391043663024902, -0.0010657012462615967, -0.0009922981262207031, -0.0009188950061798096, -0.000845491886138916, -0.0007720887660980225, -0.0006986856460571289, -0.0006252825260162354, -0.0005518794059753418, -0.00047847628593444824, -0.0004050731658935547, -0.00033167004585266113, -0.0002582669258117676, -0.00018486380577087402, -0.00011146068572998047, -3.8057565689086914e-05, 3.534555435180664e-05, 0.0001087486743927002, 0.00018215179443359375, 0.0002555549144744873, 0.00032895803451538086, 0.0004023611545562744, 0.00047576427459716797, 0.0005491673946380615, 0.0006225705146789551, 0.0006959736347198486, 0.0007693767547607422, 0.0008427798748016357, 0.0009161829948425293, 0.0009895861148834229, 0.0010629892349243164, 0.00113639235496521, 0.0012097954750061035, 0.001283198595046997, 0.0013566017150878906, 0.0014300048351287842, 0.0015034079551696777, 0.0015768110752105713, 0.0016502141952514648, 0.0017236173152923584, 0.001797020435333252, 0.0018704235553741455, 0.001943826675415039, 0.0020172297954559326, 0.002090632915496826, 0.0021640360355377197, 0.0022374391555786133, 0.002310842275619507, 0.0023842453956604004, 0.002457648515701294, 0.0025310516357421875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 17.0, 918.0, 72.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.020353326573967934, -0.019935347139835358, -0.01951736770570278, -0.019099388271570206, -0.01868141070008278, -0.018263431265950203, -0.017845451831817627, -0.01742747239768505, -0.017009492963552475, -0.0165915135294199, -0.016173534095287323, -0.015755556523799896, -0.015337576158344746, -0.014919597655534744, -0.014501618221402168, -0.014083638787269592, -0.013665660284459591, -0.013247680850327015, -0.012829702347517014, -0.012411722913384438, -0.011993743479251862, -0.011575764045119286, -0.011157785542309284, -0.010739806108176708, -0.010321827605366707, -0.00990384817123413, -0.00948586966842413, -0.009067890234291553, -0.008649910800158978, -0.008231932297348976, -0.0078139528632164, -0.007395973429083824, -0.006977994926273823, -0.006560015957802534, -0.006142036523669958, -0.005724057555198669, -0.0053060781210660934, -0.004888099152594805, -0.004470120184123516, -0.00405214074999094, -0.0036341617815196514, -0.003216182580217719, -0.0027982033789157867, -0.002380224410444498, -0.0019622452091425657, -0.0015442660078406334, -0.0011262870393693447, -0.0007083078380674124, -0.00029032863676548004, 0.00012765050632879138, 0.0005456296494230628, 0.0009636087343096733, 0.0013815879356116056, 0.001799567136913538, 0.0022175461053848267, 0.002635525306686759, 0.0030535045079886913, 0.0034714837092906237, 0.003889462910592556, 0.004307441879063845, 0.004725420847535133, 0.005143400281667709, 0.005561379250138998, 0.005979358218610287, 0.006397337652742863]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 9.0, 16.0, 14.0, 10.0, 19.0, 22.0, 22.0, 29.0, 30.0, 38.0, 40.0, 39.0, 36.0, 36.0, 56.0, 55.0, 59.0, 51.0, 47.0, 49.0, 41.0, 46.0, 38.0, 37.0, 30.0, 37.0, 16.0, 17.0, 10.0, 12.0, 7.0, 4.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.004937589168548584, -0.0047957561910152435, -0.004653923213481903, -0.004512090235948563, -0.004370257258415222, -0.004228424280881882, -0.004086591303348541, -0.003944758325815201, -0.0038029253482818604, -0.00366109237074852, -0.0035192593932151794, -0.003377426415681839, -0.0032355934381484985, -0.003093760460615158, -0.0029519274830818176, -0.002810094505548477, -0.0026682615280151367, -0.0025264285504817963, -0.002384595572948456, -0.0022427625954151154, -0.002100929617881775, -0.0019590966403484344, -0.001817263662815094, -0.0016754306852817535, -0.001533597707748413, -0.0013917647302150726, -0.0012499317526817322, -0.0011080987751483917, -0.0009662657976150513, -0.0008244328200817108, -0.0006825998425483704, -0.0005407668650150299, -0.00039893388748168945, -0.000257100909948349, -0.00011526793241500854, 2.656504511833191e-05, 0.00016839802265167236, 0.0003102310001850128, 0.00045206397771835327, 0.0005938969552516937, 0.0007357299327850342, 0.0008775629103183746, 0.001019395887851715, 0.0011612288653850555, 0.001303061842918396, 0.0014448948204517365, 0.001586727797985077, 0.0017285607755184174, 0.0018703937530517578, 0.0020122267305850983, 0.0021540597081184387, 0.002295892685651779, 0.0024377256631851196, 0.00257955864071846, 0.0027213916182518005, 0.002863224595785141, 0.0030050575733184814, 0.003146890550851822, 0.0032887235283851624, 0.003430556505918503, 0.0035723894834518433, 0.0037142224609851837, 0.003856055438518524, 0.003997888416051865, 0.004139721393585205]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 9.0, 4.0, 14.0, 9.0, 14.0, 17.0, 37.0, 55.0, 59.0, 93.0, 142.0, 208.0, 322.0, 440.0, 622.0, 988.0, 1604.0, 2544.0, 4350.0, 8113.0, 17370.0, 81866.0, 857292.0, 42220.0, 13513.0, 6741.0, 3664.0, 2117.0, 1370.0, 887.0, 597.0, 394.0, 272.0, 174.0, 110.0, 83.0, 65.0, 54.0, 38.0, 22.0, 16.0, 17.0, 7.0, 4.0, 4.0, 6.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00897216796875, -0.008666515350341797, -0.008360862731933594, -0.00805521011352539, -0.0077495574951171875, -0.007443904876708984, -0.007138252258300781, -0.006832599639892578, -0.006526947021484375, -0.006221294403076172, -0.005915641784667969, -0.005609989166259766, -0.0053043365478515625, -0.004998683929443359, -0.004693031311035156, -0.004387378692626953, -0.00408172607421875, -0.003776073455810547, -0.0034704208374023438, -0.0031647682189941406, -0.0028591156005859375, -0.0025534629821777344, -0.0022478103637695312, -0.0019421577453613281, -0.001636505126953125, -0.0013308525085449219, -0.0010251998901367188, -0.0007195472717285156, -0.0004138946533203125, -0.00010824203491210938, 0.00019741058349609375, 0.0005030632019042969, 0.0008087158203125, 0.0011143684387207031, 0.0014200210571289062, 0.0017256736755371094, 0.0020313262939453125, 0.0023369789123535156, 0.0026426315307617188, 0.002948284149169922, 0.003253936767578125, 0.003559589385986328, 0.0038652420043945312, 0.004170894622802734, 0.0044765472412109375, 0.004782199859619141, 0.005087852478027344, 0.005393505096435547, 0.00569915771484375, 0.006004810333251953, 0.006310462951660156, 0.006616115570068359, 0.0069217681884765625, 0.007227420806884766, 0.007533073425292969, 0.007838726043701172, 0.008144378662109375, 0.008450031280517578, 0.008755683898925781, 0.009061336517333984, 0.009366989135742188, 0.00967264175415039, 0.009978294372558594, 0.010283946990966797, 0.010589599609375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 6.0, 2.0, 4.0, 16.0, 5.0, 10.0, 6.0, 15.0, 56.0, 116.0, 271.0, 227.0, 116.0, 39.0, 12.0, 7.0, 12.0, 10.0, 9.0, 5.0, 6.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007396697998046875, -0.007134854793548584, -0.006873011589050293, -0.006611168384552002, -0.006349325180053711, -0.00608748197555542, -0.005825638771057129, -0.005563795566558838, -0.005301952362060547, -0.005040109157562256, -0.004778265953063965, -0.004516422748565674, -0.004254579544067383, -0.003992736339569092, -0.0037308931350708008, -0.0034690499305725098, -0.0032072067260742188, -0.0029453635215759277, -0.0026835203170776367, -0.0024216771125793457, -0.0021598339080810547, -0.0018979907035827637, -0.0016361474990844727, -0.0013743042945861816, -0.0011124610900878906, -0.0008506178855895996, -0.0005887746810913086, -0.0003269314765930176, -6.508827209472656e-05, 0.00019675493240356445, 0.00045859813690185547, 0.0007204413414001465, 0.0009822845458984375, 0.0012441277503967285, 0.0015059709548950195, 0.0017678141593933105, 0.0020296573638916016, 0.0022915005683898926, 0.0025533437728881836, 0.0028151869773864746, 0.0030770301818847656, 0.0033388733863830566, 0.0036007165908813477, 0.0038625597953796387, 0.00412440299987793, 0.004386246204376221, 0.004648089408874512, 0.004909932613372803, 0.005171775817871094, 0.005433619022369385, 0.005695462226867676, 0.005957305431365967, 0.006219148635864258, 0.006480991840362549, 0.00674283504486084, 0.007004678249359131, 0.007266521453857422, 0.007528364658355713, 0.007790207862854004, 0.008052051067352295, 0.008313894271850586, 0.008575737476348877, 0.008837580680847168, 0.009099423885345459, 0.00936126708984375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 8.0, 6.0, 8.0, 11.0, 12.0, 15.0, 9.0, 27.0, 40.0, 44.0, 48.0, 78.0, 101.0, 130.0, 224.0, 338.0, 583.0, 1389.0, 11482.0, 988220.0, 41750.0, 2018.0, 747.0, 397.0, 245.0, 143.0, 110.0, 95.0, 61.0, 43.0, 36.0, 36.0, 22.0, 17.0, 12.0, 13.0, 9.0, 10.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02239990234375, -0.02158975601196289, -0.02077960968017578, -0.019969463348388672, -0.019159317016601562, -0.018349170684814453, -0.017539024353027344, -0.016728878021240234, -0.015918731689453125, -0.015108585357666016, -0.014298439025878906, -0.013488292694091797, -0.012678146362304688, -0.011868000030517578, -0.011057853698730469, -0.01024770736694336, -0.00943756103515625, -0.00862741470336914, -0.007817268371582031, -0.007007122039794922, -0.0061969757080078125, -0.005386829376220703, -0.004576683044433594, -0.0037665367126464844, -0.002956390380859375, -0.0021462440490722656, -0.0013360977172851562, -0.0005259513854980469, 0.0002841949462890625, 0.0010943412780761719, 0.0019044876098632812, 0.0027146339416503906, 0.0035247802734375, 0.004334926605224609, 0.005145072937011719, 0.005955219268798828, 0.0067653656005859375, 0.007575511932373047, 0.008385658264160156, 0.009195804595947266, 0.010005950927734375, 0.010816097259521484, 0.011626243591308594, 0.012436389923095703, 0.013246536254882812, 0.014056682586669922, 0.014866828918457031, 0.01567697525024414, 0.01648712158203125, 0.01729726791381836, 0.01810741424560547, 0.018917560577392578, 0.019727706909179688, 0.020537853240966797, 0.021347999572753906, 0.022158145904541016, 0.022968292236328125, 0.023778438568115234, 0.024588584899902344, 0.025398731231689453, 0.026208877563476562, 0.027019023895263672, 0.02782917022705078, 0.02863931655883789, 0.029449462890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 8.0, 10.0, 8.0, 11.0, 5.0, 14.0, 24.0, 25.0, 21.0, 32.0, 31.0, 34.0, 53.0, 46.0, 47.0, 42.0, 47.0, 49.0, 41.0, 35.0, 34.0, 42.0, 38.0, 42.0, 41.0, 42.0, 31.0, 28.0, 16.0, 23.0, 16.0, 9.0, 11.0, 11.0, 7.0, 10.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0197296142578125, -0.01901698112487793, -0.01830434799194336, -0.01759171485900879, -0.01687908172607422, -0.01616644859313965, -0.015453815460205078, -0.014741182327270508, -0.014028549194335938, -0.013315916061401367, -0.012603282928466797, -0.011890649795532227, -0.011178016662597656, -0.010465383529663086, -0.009752750396728516, -0.009040117263793945, -0.008327484130859375, -0.007614850997924805, -0.006902217864990234, -0.006189584732055664, -0.005476951599121094, -0.0047643184661865234, -0.004051685333251953, -0.003339052200317383, -0.0026264190673828125, -0.0019137859344482422, -0.0012011528015136719, -0.0004885196685791016, 0.00022411346435546875, 0.0009367465972900391, 0.0016493797302246094, 0.0023620128631591797, 0.00307464599609375, 0.0037872791290283203, 0.004499912261962891, 0.005212545394897461, 0.005925178527832031, 0.0066378116607666016, 0.007350444793701172, 0.008063077926635742, 0.008775711059570312, 0.009488344192504883, 0.010200977325439453, 0.010913610458374023, 0.011626243591308594, 0.012338876724243164, 0.013051509857177734, 0.013764142990112305, 0.014476776123046875, 0.015189409255981445, 0.015902042388916016, 0.016614675521850586, 0.017327308654785156, 0.018039941787719727, 0.018752574920654297, 0.019465208053588867, 0.020177841186523438, 0.020890474319458008, 0.021603107452392578, 0.02231574058532715, 0.02302837371826172, 0.02374100685119629, 0.02445363998413086, 0.02516627311706543, 0.02587890625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 5.0, 4.0, 2.0, 4.0, 4.0, 1.0, 3.0, 7.0, 6.0, 14.0, 12.0, 21.0, 36.0, 32.0, 53.0, 56.0, 87.0, 166.0, 356.0, 865.0, 1357.0, 6704.0, 53288.0, 922044.0, 53612.0, 6699.0, 1347.0, 909.0, 323.0, 172.0, 113.0, 51.0, 54.0, 45.0, 22.0, 18.0, 5.0, 13.0, 8.0, 8.0, 8.0, 9.0, 1.0, 8.0, 2.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.781650543212891e-06, -5.6140124797821045e-06, -5.446374416351318e-06, -5.278736352920532e-06, -5.111098289489746e-06, -4.94346022605896e-06, -4.775822162628174e-06, -4.608184099197388e-06, -4.4405460357666016e-06, -4.2729079723358154e-06, -4.105269908905029e-06, -3.937631845474243e-06, -3.769993782043457e-06, -3.602355718612671e-06, -3.4347176551818848e-06, -3.2670795917510986e-06, -3.0994415283203125e-06, -2.9318034648895264e-06, -2.7641654014587402e-06, -2.596527338027954e-06, -2.428889274597168e-06, -2.261251211166382e-06, -2.0936131477355957e-06, -1.9259750843048096e-06, -1.7583370208740234e-06, -1.5906989574432373e-06, -1.4230608940124512e-06, -1.255422830581665e-06, -1.087784767150879e-06, -9.201467037200928e-07, -7.525086402893066e-07, -5.848705768585205e-07, -4.172325134277344e-07, -2.4959444999694824e-07, -8.195638656616211e-08, 8.568167686462402e-08, 2.5331974029541016e-07, 4.209578037261963e-07, 5.885958671569824e-07, 7.562339305877686e-07, 9.238719940185547e-07, 1.0915100574493408e-06, 1.259148120880127e-06, 1.426786184310913e-06, 1.5944242477416992e-06, 1.7620623111724854e-06, 1.9297003746032715e-06, 2.0973384380340576e-06, 2.2649765014648438e-06, 2.43261456489563e-06, 2.600252628326416e-06, 2.767890691757202e-06, 2.9355287551879883e-06, 3.1031668186187744e-06, 3.2708048820495605e-06, 3.4384429454803467e-06, 3.606081008911133e-06, 3.773719072341919e-06, 3.941357135772705e-06, 4.108995199203491e-06, 4.276633262634277e-06, 4.4442713260650635e-06, 4.61190938949585e-06, 4.779547452926636e-06, 4.947185516357422e-06]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 3.0, 5.0, 7.0, 8.0, 9.0, 16.0, 16.0, 10.0, 17.0, 34.0, 25.0, 31.0, 39.0, 79.0, 51.0, 52.0, 77.0, 95.0, 58.0, 83.0, 44.0, 37.0, 22.0, 33.0, 16.0, 32.0, 17.0, 13.0, 10.0, 8.0, 6.0, 8.0, 4.0, 3.0, 4.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0], "bins": [-4.947185516357422e-06, -4.81773167848587e-06, -4.688277840614319e-06, -4.558824002742767e-06, -4.429370164871216e-06, -4.299916326999664e-06, -4.170462489128113e-06, -4.041008651256561e-06, -3.91155481338501e-06, -3.7821009755134583e-06, -3.6526471376419067e-06, -3.5231932997703552e-06, -3.3937394618988037e-06, -3.264285624027252e-06, -3.1348317861557007e-06, -3.005377948284149e-06, -2.8759241104125977e-06, -2.746470272541046e-06, -2.6170164346694946e-06, -2.487562596797943e-06, -2.3581087589263916e-06, -2.22865492105484e-06, -2.0992010831832886e-06, -1.969747245311737e-06, -1.8402934074401855e-06, -1.710839569568634e-06, -1.5813857316970825e-06, -1.451931893825531e-06, -1.3224780559539795e-06, -1.193024218082428e-06, -1.0635703802108765e-06, -9.34116542339325e-07, -8.046627044677734e-07, -6.752088665962219e-07, -5.457550287246704e-07, -4.163011908531189e-07, -2.868473529815674e-07, -1.5739351511001587e-07, -2.7939677238464355e-08, 1.0151416063308716e-07, 2.3096799850463867e-07, 3.604218363761902e-07, 4.898756742477417e-07, 6.193295121192932e-07, 7.487833499908447e-07, 8.782371878623962e-07, 1.0076910257339478e-06, 1.1371448636054993e-06, 1.2665987014770508e-06, 1.3960525393486023e-06, 1.5255063772201538e-06, 1.6549602150917053e-06, 1.7844140529632568e-06, 1.9138678908348083e-06, 2.04332172870636e-06, 2.1727755665779114e-06, 2.302229404449463e-06, 2.4316832423210144e-06, 2.561137080192566e-06, 2.6905909180641174e-06, 2.820044755935669e-06, 2.9494985938072205e-06, 3.078952431678772e-06, 3.2084062695503235e-06, 3.337860107421875e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 10.0, 15.0, 23.0, 28.0, 36.0, 85.0, 202.0, 820.0, 78333.0, 967444.0, 1094.0, 206.0, 100.0, 42.0, 32.0, 20.0, 12.0, 12.0, 6.0, 1.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.1517276763916016e-05, -2.0920298993587494e-05, -2.0323321223258972e-05, -1.972634345293045e-05, -1.912936568260193e-05, -1.8532387912273407e-05, -1.7935410141944885e-05, -1.7338432371616364e-05, -1.6741454601287842e-05, -1.614447683095932e-05, -1.55474990606308e-05, -1.4950521290302277e-05, -1.4353543519973755e-05, -1.3756565749645233e-05, -1.3159587979316711e-05, -1.256261020898819e-05, -1.1965632438659668e-05, -1.1368654668331146e-05, -1.0771676898002625e-05, -1.0174699127674103e-05, -9.577721357345581e-06, -8.98074358701706e-06, -8.383765816688538e-06, -7.786788046360016e-06, -7.189810276031494e-06, -6.592832505702972e-06, -5.995854735374451e-06, -5.398876965045929e-06, -4.801899194717407e-06, -4.2049214243888855e-06, -3.6079436540603638e-06, -3.010965883731842e-06, -2.4139881134033203e-06, -1.8170103430747986e-06, -1.2200325727462769e-06, -6.230548024177551e-07, -2.60770320892334e-08, 5.709007382392883e-07, 1.16787850856781e-06, 1.7648562788963318e-06, 2.3618340492248535e-06, 2.9588118195533752e-06, 3.555789589881897e-06, 4.152767360210419e-06, 4.7497451305389404e-06, 5.346722900867462e-06, 5.943700671195984e-06, 6.540678441524506e-06, 7.137656211853027e-06, 7.734633982181549e-06, 8.33161175251007e-06, 8.928589522838593e-06, 9.525567293167114e-06, 1.0122545063495636e-05, 1.0719522833824158e-05, 1.131650060415268e-05, 1.1913478374481201e-05, 1.2510456144809723e-05, 1.3107433915138245e-05, 1.3704411685466766e-05, 1.4301389455795288e-05, 1.489836722612381e-05, 1.549534499645233e-05, 1.6092322766780853e-05, 1.6689300537109375e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 10.0, 3.0, 10.0, 25.0, 34.0, 55.0, 103.0, 544.0, 74.0, 47.0, 32.0, 17.0, 9.0, 5.0, 4.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.901388168334961e-05, -1.848861575126648e-05, -1.796334981918335e-05, -1.743808388710022e-05, -1.691281795501709e-05, -1.638755202293396e-05, -1.586228609085083e-05, -1.53370201587677e-05, -1.481175422668457e-05, -1.428648829460144e-05, -1.376122236251831e-05, -1.323595643043518e-05, -1.271069049835205e-05, -1.2185424566268921e-05, -1.1660158634185791e-05, -1.1134892702102661e-05, -1.0609626770019531e-05, -1.0084360837936401e-05, -9.559094905853271e-06, -9.033828973770142e-06, -8.508563041687012e-06, -7.983297109603882e-06, -7.458031177520752e-06, -6.932765245437622e-06, -6.407499313354492e-06, -5.882233381271362e-06, -5.356967449188232e-06, -4.8317015171051025e-06, -4.306435585021973e-06, -3.7811696529388428e-06, -3.255903720855713e-06, -2.730637788772583e-06, -2.205371856689453e-06, -1.6801059246063232e-06, -1.1548399925231934e-06, -6.295740604400635e-07, -1.043081283569336e-07, 4.209578037261963e-07, 9.462237358093262e-07, 1.471489667892456e-06, 1.996755599975586e-06, 2.522021532058716e-06, 3.0472874641418457e-06, 3.5725533962249756e-06, 4.0978193283081055e-06, 4.623085260391235e-06, 5.148351192474365e-06, 5.673617124557495e-06, 6.198883056640625e-06, 6.724148988723755e-06, 7.249414920806885e-06, 7.774680852890015e-06, 8.299946784973145e-06, 8.825212717056274e-06, 9.350478649139404e-06, 9.875744581222534e-06, 1.0401010513305664e-05, 1.0926276445388794e-05, 1.1451542377471924e-05, 1.1976808309555054e-05, 1.2502074241638184e-05, 1.3027340173721313e-05, 1.3552606105804443e-05, 1.4077872037887573e-05, 1.4603137969970703e-05]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 11.0, 35.0, 240.0, 634.0, 78.0, 12.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.20908275246620178, -0.20536312460899353, -0.20164349675178528, -0.19792388379573822, -0.19420425593852997, -0.19048462808132172, -0.18676500022411346, -0.1830453723669052, -0.17932575941085815, -0.1756061315536499, -0.17188650369644165, -0.1681668907403946, -0.16444726288318634, -0.1607276350259781, -0.15700800716876984, -0.15328837931156158, -0.14956875145435333, -0.14584912359714508, -0.14212949573993683, -0.13840988278388977, -0.13469025492668152, -0.13097062706947327, -0.12725099921226501, -0.12353137880563736, -0.1198117583990097, -0.11609213054180145, -0.1123725101351738, -0.10865288227796555, -0.10493326187133789, -0.10121363401412964, -0.09749400615692139, -0.09377438575029373, -0.09005476534366608, -0.08633513748645782, -0.08261551707983017, -0.07889588922262192, -0.07517626881599426, -0.07145664095878601, -0.06773701310157776, -0.0640173926949501, -0.06029776483774185, -0.0565781407058239, -0.052858516573905945, -0.04913888871669769, -0.04541926458477974, -0.041699640452861786, -0.03798001632094383, -0.03426039218902588, -0.030540764331817627, -0.026821140199899673, -0.02310151420533657, -0.019381890073418617, -0.015662264078855515, -0.011942639946937561, -0.008223015815019608, -0.004503389820456505, -0.0007837656885385513, 0.002935859141871333, 0.006655483972281218, 0.010375108569860458, 0.014094733633100986, 0.017814358696341515, 0.021533982828259468, 0.02525360882282257, 0.028973232954740524]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 7.0, 3.0, 5.0, 8.0, 12.0, 14.0, 8.0, 17.0, 20.0, 24.0, 20.0, 37.0, 33.0, 36.0, 38.0, 42.0, 44.0, 39.0, 46.0, 48.0, 44.0, 45.0, 53.0, 35.0, 45.0, 34.0, 37.0, 32.0, 30.0, 31.0, 29.0, 17.0, 21.0, 11.0, 13.0, 5.0, 3.0, 5.0, 6.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1010514497756958, -0.09765557199716568, -0.09425970166921616, -0.09086382389068604, -0.08746795356273651, -0.08407207578420639, -0.08067619800567627, -0.07728032767772675, -0.07388444989919662, -0.0704885721206665, -0.06709270179271698, -0.06369682401418686, -0.06030094996094704, -0.056905075907707214, -0.053509198129177094, -0.05011332407593727, -0.04671745002269745, -0.043321575969457626, -0.039925701916217804, -0.03652982413768768, -0.03313395008444786, -0.02973807603120804, -0.026342200115323067, -0.022946324199438095, -0.019550450146198273, -0.01615457609295845, -0.012758700177073479, -0.009362825192511082, -0.005966950207948685, -0.0025710761547088623, 0.0008247997611761093, 0.004220675677061081, 0.007616549730300903, 0.0110124247148633, 0.014408299699425697, 0.01780417561531067, 0.02120004966855049, 0.024595923721790314, 0.027991799637675285, 0.03138767555356026, 0.03478354960680008, 0.0381794236600399, 0.041575297713279724, 0.044971175491809845, 0.04836704954504967, 0.05176292359828949, 0.05515880137681961, 0.05855467543005943, 0.061950549483299255, 0.06534642726182938, 0.0687422975897789, 0.07213817536830902, 0.07553404569625854, 0.07892992347478867, 0.08232580125331879, 0.08572167158126831, 0.08911754935979843, 0.09251342713832855, 0.09590929746627808, 0.0993051752448082, 0.10270105302333832, 0.10609692335128784, 0.10949280112981796, 0.11288867890834808, 0.11628454923629761]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 2.0, 3.0, 14.0, 9.0, 8.0, 9.0, 18.0, 72.0, 166.0, 1615.0, 4191893.0, 244.0, 84.0, 29.0, 15.0, 14.0, 6.0, 12.0, 5.0, 5.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07489013671875, -0.07224273681640625, -0.0695953369140625, -0.06694793701171875, -0.064300537109375, -0.06165313720703125, -0.0590057373046875, -0.05635833740234375, -0.0537109375, -0.05106353759765625, -0.0484161376953125, -0.04576873779296875, -0.043121337890625, -0.04047393798828125, -0.0378265380859375, -0.03517913818359375, -0.03253173828125, -0.02988433837890625, -0.0272369384765625, -0.02458953857421875, -0.021942138671875, -0.01929473876953125, -0.0166473388671875, -0.01399993896484375, -0.0113525390625, -0.00870513916015625, -0.0060577392578125, -0.00341033935546875, -0.000762939453125, 0.00188446044921875, 0.0045318603515625, 0.00717926025390625, 0.00982666015625, 0.01247406005859375, 0.0151214599609375, 0.01776885986328125, 0.020416259765625, 0.02306365966796875, 0.0257110595703125, 0.02835845947265625, 0.031005859375, 0.03365325927734375, 0.0363006591796875, 0.03894805908203125, 0.041595458984375, 0.04424285888671875, 0.0468902587890625, 0.04953765869140625, 0.05218505859375, 0.05483245849609375, 0.0574798583984375, 0.06012725830078125, 0.062774658203125, 0.06542205810546875, 0.0680694580078125, 0.07071685791015625, 0.0733642578125, 0.07601165771484375, 0.0786590576171875, 0.08130645751953125, 0.083953857421875, 0.08660125732421875, 0.0892486572265625, 0.09189605712890625, 0.09454345703125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 6.0, 1.0, 4.0, 12.0, 10.0, 9.0, 7.0, 15.0, 40.0, 119.0, 228.0, 256.0, 131.0, 47.0, 14.0, 8.0, 11.0, 9.0, 11.0, 5.0, 5.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00737762451171875, -0.0071179866790771484, -0.006858348846435547, -0.006598711013793945, -0.006339073181152344, -0.006079435348510742, -0.005819797515869141, -0.005560159683227539, -0.0053005218505859375, -0.005040884017944336, -0.004781246185302734, -0.004521608352661133, -0.004261970520019531, -0.00400233268737793, -0.003742694854736328, -0.0034830570220947266, -0.003223419189453125, -0.0029637813568115234, -0.002704143524169922, -0.0024445056915283203, -0.0021848678588867188, -0.0019252300262451172, -0.0016655921936035156, -0.001405954360961914, -0.0011463165283203125, -0.0008866786956787109, -0.0006270408630371094, -0.0003674030303955078, -0.00010776519775390625, 0.0001518726348876953, 0.0004115104675292969, 0.0006711483001708984, 0.0009307861328125, 0.0011904239654541016, 0.0014500617980957031, 0.0017096996307373047, 0.0019693374633789062, 0.002228975296020508, 0.0024886131286621094, 0.002748250961303711, 0.0030078887939453125, 0.003267526626586914, 0.0035271644592285156, 0.003786802291870117, 0.004046440124511719, 0.00430607795715332, 0.004565715789794922, 0.0048253536224365234, 0.005084991455078125, 0.0053446292877197266, 0.005604267120361328, 0.00586390495300293, 0.006123542785644531, 0.006383180618286133, 0.006642818450927734, 0.006902456283569336, 0.0071620941162109375, 0.007421731948852539, 0.007681369781494141, 0.007941007614135742, 0.008200645446777344, 0.008460283279418945, 0.008719921112060547, 0.008979558944702148, 0.00923919677734375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 5.0, 13.0, 38.0, 117.0, 422.0, 1267.0, 81219.0, 4109075.0, 1471.0, 421.0, 126.0, 58.0, 21.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0125732421875, -0.01220393180847168, -0.01183462142944336, -0.011465311050415039, -0.011096000671386719, -0.010726690292358398, -0.010357379913330078, -0.009988069534301758, -0.009618759155273438, -0.009249448776245117, -0.008880138397216797, -0.008510828018188477, -0.008141517639160156, -0.007772207260131836, -0.007402896881103516, -0.007033586502075195, -0.006664276123046875, -0.006294965744018555, -0.005925655364990234, -0.005556344985961914, -0.005187034606933594, -0.0048177242279052734, -0.004448413848876953, -0.004079103469848633, -0.0037097930908203125, -0.003340482711791992, -0.002971172332763672, -0.0026018619537353516, -0.0022325515747070312, -0.001863241195678711, -0.0014939308166503906, -0.0011246204376220703, -0.00075531005859375, -0.0003859996795654297, -1.6689300537109375e-05, 0.00035262107849121094, 0.0007219314575195312, 0.0010912418365478516, 0.0014605522155761719, 0.0018298625946044922, 0.0021991729736328125, 0.002568483352661133, 0.002937793731689453, 0.0033071041107177734, 0.0036764144897460938, 0.004045724868774414, 0.004415035247802734, 0.004784345626831055, 0.005153656005859375, 0.005522966384887695, 0.005892276763916016, 0.006261587142944336, 0.006630897521972656, 0.0070002079010009766, 0.007369518280029297, 0.007738828659057617, 0.008108139038085938, 0.008477449417114258, 0.008846759796142578, 0.009216070175170898, 0.009585380554199219, 0.009954690933227539, 0.01032400131225586, 0.01069331169128418, 0.0110626220703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 16.0, 36.0, 155.0, 3775.0, 51.0, 17.0, 5.0, 6.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028514862060546875, -0.002742379903793335, -0.0026332736015319824, -0.00252416729927063, -0.0024150609970092773, -0.002305954694747925, -0.0021968483924865723, -0.0020877420902252197, -0.001978635787963867, -0.0018695294857025146, -0.0017604231834411621, -0.0016513168811798096, -0.001542210578918457, -0.0014331042766571045, -0.001323997974395752, -0.0012148916721343994, -0.0011057853698730469, -0.0009966790676116943, -0.0008875727653503418, -0.0007784664630889893, -0.0006693601608276367, -0.0005602538585662842, -0.00045114755630493164, -0.0003420412540435791, -0.00023293495178222656, -0.00012382864952087402, -1.4722347259521484e-05, 9.438395500183105e-05, 0.0002034902572631836, 0.00031259655952453613, 0.00042170286178588867, 0.0005308091640472412, 0.0006399154663085938, 0.0007490217685699463, 0.0008581280708312988, 0.0009672343730926514, 0.001076340675354004, 0.0011854469776153564, 0.001294553279876709, 0.0014036595821380615, 0.001512765884399414, 0.0016218721866607666, 0.0017309784889221191, 0.0018400847911834717, 0.0019491910934448242, 0.0020582973957061768, 0.0021674036979675293, 0.002276510000228882, 0.0023856163024902344, 0.002494722604751587, 0.0026038289070129395, 0.002712935209274292, 0.0028220415115356445, 0.002931147813796997, 0.0030402541160583496, 0.003149360418319702, 0.0032584667205810547, 0.0033675730228424072, 0.0034766793251037598, 0.0035857856273651123, 0.003694891929626465, 0.0038039982318878174, 0.00391310453414917, 0.0040222108364105225, 0.004131317138671875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1001.0, 17.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001215107156895101, 0.0004822030896320939, 0.002179513219743967, 0.003876823466271162, 0.005574133712798357, 0.007271443959325552, 0.008968754671514034, 0.01066606491804123, 0.012363375164568424, 0.01406068541109562, 0.01575799658894539, 0.01745530590415001, 0.01915261521935463, 0.0208499263972044, 0.02254723757505417, 0.02424454689025879, 0.02594185620546341, 0.02763916552066803, 0.0293364766985178, 0.03103378787636757, 0.03273109719157219, 0.03442840650677681, 0.03612571954727173, 0.03782302886247635, 0.03952033817768097, 0.04121764749288559, 0.04291495680809021, 0.04461226984858513, 0.04630957916378975, 0.04800688847899437, 0.04970420151948929, 0.05140151083469391, 0.05309882014989853, 0.05479612946510315, 0.05649343878030777, 0.05819075182080269, 0.05988806113600731, 0.06158537045121193, 0.06328268349170685, 0.06497999280691147, 0.06667730212211609, 0.06837461143732071, 0.07007192075252533, 0.07176923006772995, 0.07346653938293457, 0.07516385614871979, 0.07686116546392441, 0.07855847477912903, 0.08025578409433365, 0.08195309340953827, 0.08365040272474289, 0.08534771203994751, 0.08704502880573273, 0.08874233812093735, 0.09043964743614197, 0.09213695675134659, 0.09383426606655121, 0.09553157538175583, 0.09722888469696045, 0.09892619401216507, 0.10062350332736969, 0.10232082009315491, 0.10401812940835953, 0.10571543872356415, 0.10741274803876877]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 8.0, 10.0, 14.0, 29.0, 43.0, 63.0, 57.0, 91.0, 90.0, 112.0, 83.0, 92.0, 84.0, 73.0, 52.0, 33.0, 22.0, 19.0, 12.0, 2.0, 5.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006871998310089111, -0.006643389351665974, -0.006414780393242836, -0.006186171434819698, -0.005957562476396561, -0.005728953517973423, -0.005500344559550285, -0.005271735601127148, -0.00504312664270401, -0.004814517684280872, -0.004585908725857735, -0.004357299767434597, -0.004128690809011459, -0.0039000818505883217, -0.003671472892165184, -0.0034428639337420464, -0.0032142549753189087, -0.002985646016895771, -0.0027570370584726334, -0.0025284281000494957, -0.002299819141626358, -0.0020712101832032204, -0.0018426012247800827, -0.001613992266356945, -0.0013853833079338074, -0.0011567743495106697, -0.000928165391087532, -0.0006995564326643944, -0.0004709474742412567, -0.00024233851581811905, -1.3729557394981384e-05, 0.00021487940102815628, 0.00044348835945129395, 0.0006720973178744316, 0.0009007062762975693, 0.001129315234720707, 0.0013579241931438446, 0.0015865331515669823, 0.00181514210999012, 0.0020437510684132576, 0.0022723600268363953, 0.002500968985259533, 0.0027295779436826706, 0.0029581869021058083, 0.003186795860528946, 0.0034154048189520836, 0.0036440137773752213, 0.003872622735798359, 0.004101231694221497, 0.004329840652644634, 0.004558449611067772, 0.00478705856949091, 0.005015667527914047, 0.005244276486337185, 0.005472885444760323, 0.00570149440318346, 0.005930103361606598, 0.0061587123200297356, 0.006387321278452873, 0.006615930236876011, 0.0068445391952991486, 0.007073148153722286, 0.007301757112145424, 0.0075303660705685616, 0.007758975028991699]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 7.0, 13.0, 14.0, 17.0, 27.0, 25.0, 54.0, 69.0, 89.0, 164.0, 229.0, 364.0, 529.0, 855.0, 1397.0, 2572.0, 4858.0, 10688.0, 37155.0, 900380.0, 62487.0, 13481.0, 5897.0, 2922.0, 1634.0, 950.0, 595.0, 356.0, 234.0, 159.0, 104.0, 74.0, 55.0, 25.0, 23.0, 19.0, 7.0, 9.0, 5.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0219573974609375, -0.02134084701538086, -0.02072429656982422, -0.020107746124267578, -0.019491195678710938, -0.018874645233154297, -0.018258094787597656, -0.017641544342041016, -0.017024993896484375, -0.016408443450927734, -0.015791893005371094, -0.015175342559814453, -0.014558792114257812, -0.013942241668701172, -0.013325691223144531, -0.01270914077758789, -0.01209259033203125, -0.01147603988647461, -0.010859489440917969, -0.010242938995361328, -0.009626388549804688, -0.009009838104248047, -0.008393287658691406, -0.007776737213134766, -0.007160186767578125, -0.006543636322021484, -0.005927085876464844, -0.005310535430908203, -0.0046939849853515625, -0.004077434539794922, -0.0034608840942382812, -0.0028443336486816406, -0.002227783203125, -0.0016112327575683594, -0.0009946823120117188, -0.0003781318664550781, 0.0002384185791015625, 0.0008549690246582031, 0.0014715194702148438, 0.0020880699157714844, 0.002704620361328125, 0.0033211708068847656, 0.003937721252441406, 0.004554271697998047, 0.0051708221435546875, 0.005787372589111328, 0.006403923034667969, 0.007020473480224609, 0.00763702392578125, 0.00825357437133789, 0.008870124816894531, 0.009486675262451172, 0.010103225708007812, 0.010719776153564453, 0.011336326599121094, 0.011952877044677734, 0.012569427490234375, 0.013185977935791016, 0.013802528381347656, 0.014419078826904297, 0.015035629272460938, 0.015652179718017578, 0.01626873016357422, 0.01688528060913086, 0.0175018310546875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 6.0, 1.0, 4.0, 12.0, 10.0, 9.0, 7.0, 15.0, 41.0, 118.0, 230.0, 255.0, 131.0, 46.0, 14.0, 8.0, 10.0, 10.0, 11.0, 5.0, 5.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007373809814453125, -0.007114231586456299, -0.006854653358459473, -0.0065950751304626465, -0.00633549690246582, -0.006075918674468994, -0.005816340446472168, -0.005556762218475342, -0.005297183990478516, -0.0050376057624816895, -0.004778027534484863, -0.004518449306488037, -0.004258871078491211, -0.003999292850494385, -0.0037397146224975586, -0.0034801363945007324, -0.0032205581665039062, -0.00296097993850708, -0.002701401710510254, -0.0024418234825134277, -0.0021822452545166016, -0.0019226670265197754, -0.0016630887985229492, -0.001403510570526123, -0.0011439323425292969, -0.0008843541145324707, -0.0006247758865356445, -0.00036519765853881836, -0.00010561943054199219, 0.00015395879745483398, 0.00041353702545166016, 0.0006731152534484863, 0.0009326934814453125, 0.0011922717094421387, 0.0014518499374389648, 0.001711428165435791, 0.001971006393432617, 0.0022305846214294434, 0.0024901628494262695, 0.0027497410774230957, 0.003009319305419922, 0.003268897533416748, 0.0035284757614135742, 0.0037880539894104004, 0.0040476322174072266, 0.004307210445404053, 0.004566788673400879, 0.004826366901397705, 0.005085945129394531, 0.005345523357391357, 0.005605101585388184, 0.00586467981338501, 0.006124258041381836, 0.006383836269378662, 0.006643414497375488, 0.0069029927253723145, 0.007162570953369141, 0.007422149181365967, 0.007681727409362793, 0.00794130563735962, 0.008200883865356445, 0.008460462093353271, 0.008720040321350098, 0.008979618549346924, 0.00923919677734375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 6.0, 3.0, 4.0, 7.0, 11.0, 12.0, 17.0, 23.0, 26.0, 33.0, 27.0, 40.0, 55.0, 63.0, 90.0, 138.0, 244.0, 404.0, 768.0, 1681.0, 9253.0, 1018456.0, 13366.0, 1790.0, 783.0, 422.0, 241.0, 154.0, 104.0, 96.0, 50.0, 33.0, 34.0, 27.0, 20.0, 17.0, 12.0, 10.0, 7.0, 11.0, 2.0, 4.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03839111328125, -0.03721141815185547, -0.03603172302246094, -0.034852027893066406, -0.033672332763671875, -0.032492637634277344, -0.03131294250488281, -0.03013324737548828, -0.02895355224609375, -0.02777385711669922, -0.026594161987304688, -0.025414466857910156, -0.024234771728515625, -0.023055076599121094, -0.021875381469726562, -0.02069568634033203, -0.0195159912109375, -0.01833629608154297, -0.017156600952148438, -0.015976905822753906, -0.014797210693359375, -0.013617515563964844, -0.012437820434570312, -0.011258125305175781, -0.01007843017578125, -0.008898735046386719, -0.0077190399169921875, -0.006539344787597656, -0.005359649658203125, -0.004179954528808594, -0.0030002593994140625, -0.0018205642700195312, -0.000640869140625, 0.0005388259887695312, 0.0017185211181640625, 0.0028982162475585938, 0.004077911376953125, 0.005257606506347656, 0.0064373016357421875, 0.007616996765136719, 0.00879669189453125, 0.009976387023925781, 0.011156082153320312, 0.012335777282714844, 0.013515472412109375, 0.014695167541503906, 0.015874862670898438, 0.01705455780029297, 0.0182342529296875, 0.01941394805908203, 0.020593643188476562, 0.021773338317871094, 0.022953033447265625, 0.024132728576660156, 0.025312423706054688, 0.02649211883544922, 0.02767181396484375, 0.02885150909423828, 0.030031204223632812, 0.031210899353027344, 0.032390594482421875, 0.033570289611816406, 0.03474998474121094, 0.03592967987060547, 0.037109375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 6.0, 3.0, 2.0, 9.0, 11.0, 11.0, 16.0, 23.0, 24.0, 27.0, 21.0, 31.0, 25.0, 34.0, 32.0, 30.0, 35.0, 37.0, 32.0, 39.0, 48.0, 45.0, 29.0, 51.0, 27.0, 41.0, 33.0, 25.0, 37.0, 41.0, 25.0, 25.0, 23.0, 19.0, 15.0, 17.0, 11.0, 8.0, 6.0, 12.0, 2.0, 3.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0205078125, -0.019878387451171875, -0.01924896240234375, -0.018619537353515625, -0.0179901123046875, -0.017360687255859375, -0.01673126220703125, -0.016101837158203125, -0.015472412109375, -0.014842987060546875, -0.01421356201171875, -0.013584136962890625, -0.0129547119140625, -0.012325286865234375, -0.01169586181640625, -0.011066436767578125, -0.01043701171875, -0.009807586669921875, -0.00917816162109375, -0.008548736572265625, -0.0079193115234375, -0.007289886474609375, -0.00666046142578125, -0.006031036376953125, -0.005401611328125, -0.004772186279296875, -0.00414276123046875, -0.003513336181640625, -0.0028839111328125, -0.002254486083984375, -0.00162506103515625, -0.000995635986328125, -0.0003662109375, 0.000263214111328125, 0.00089263916015625, 0.001522064208984375, 0.0021514892578125, 0.002780914306640625, 0.00341033935546875, 0.004039764404296875, 0.004669189453125, 0.005298614501953125, 0.00592803955078125, 0.006557464599609375, 0.0071868896484375, 0.007816314697265625, 0.00844573974609375, 0.009075164794921875, 0.00970458984375, 0.010334014892578125, 0.01096343994140625, 0.011592864990234375, 0.0122222900390625, 0.012851715087890625, 0.01348114013671875, 0.014110565185546875, 0.014739990234375, 0.015369415283203125, 0.01599884033203125, 0.016628265380859375, 0.0172576904296875, 0.017887115478515625, 0.01851654052734375, 0.019145965576171875, 0.019775390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 8.0, 6.0, 8.0, 17.0, 15.0, 26.0, 59.0, 70.0, 137.0, 358.0, 1287.0, 34820.0, 1002748.0, 7744.0, 759.0, 209.0, 120.0, 53.0, 40.0, 17.0, 16.0, 9.0, 10.0, 7.0, 7.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1517276763916016e-05, -2.0829960703849792e-05, -2.014264464378357e-05, -1.9455328583717346e-05, -1.8768012523651123e-05, -1.80806964635849e-05, -1.7393380403518677e-05, -1.6706064343452454e-05, -1.601874828338623e-05, -1.5331432223320007e-05, -1.4644116163253784e-05, -1.3956800103187561e-05, -1.3269484043121338e-05, -1.2582167983055115e-05, -1.1894851922988892e-05, -1.1207535862922668e-05, -1.0520219802856445e-05, -9.832903742790222e-06, -9.145587682723999e-06, -8.458271622657776e-06, -7.770955562591553e-06, -7.08363950252533e-06, -6.3963234424591064e-06, -5.709007382392883e-06, -5.02169132232666e-06, -4.334375262260437e-06, -3.647059202194214e-06, -2.9597431421279907e-06, -2.2724270820617676e-06, -1.5851110219955444e-06, -8.977949619293213e-07, -2.1047890186309814e-07, 4.76837158203125e-07, 1.1641532182693481e-06, 1.8514692783355713e-06, 2.5387853384017944e-06, 3.2261013984680176e-06, 3.913417458534241e-06, 4.600733518600464e-06, 5.288049578666687e-06, 5.97536563873291e-06, 6.662681698799133e-06, 7.3499977588653564e-06, 8.03731381893158e-06, 8.724629878997803e-06, 9.411945939064026e-06, 1.0099261999130249e-05, 1.0786578059196472e-05, 1.1473894119262695e-05, 1.2161210179328918e-05, 1.2848526239395142e-05, 1.3535842299461365e-05, 1.4223158359527588e-05, 1.4910474419593811e-05, 1.5597790479660034e-05, 1.6285106539726257e-05, 1.697242259979248e-05, 1.7659738659858704e-05, 1.8347054719924927e-05, 1.903437077999115e-05, 1.9721686840057373e-05, 2.0409002900123596e-05, 2.109631896018982e-05, 2.1783635020256042e-05, 2.2470951080322266e-05]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 6.0, 6.0, 10.0, 11.0, 16.0, 21.0, 22.0, 30.0, 51.0, 69.0, 111.0, 116.0, 150.0, 116.0, 73.0, 57.0, 32.0, 30.0, 23.0, 15.0, 8.0, 6.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1324882507324219e-05, -1.0973773896694183e-05, -1.0622665286064148e-05, -1.0271556675434113e-05, -9.920448064804077e-06, -9.569339454174042e-06, -9.218230843544006e-06, -8.867122232913971e-06, -8.516013622283936e-06, -8.1649050116539e-06, -7.813796401023865e-06, -7.462687790393829e-06, -7.111579179763794e-06, -6.7604705691337585e-06, -6.409361958503723e-06, -6.058253347873688e-06, -5.707144737243652e-06, -5.356036126613617e-06, -5.0049275159835815e-06, -4.653818905353546e-06, -4.302710294723511e-06, -3.951601684093475e-06, -3.60049307346344e-06, -3.2493844628334045e-06, -2.898275852203369e-06, -2.5471672415733337e-06, -2.1960586309432983e-06, -1.844950020313263e-06, -1.4938414096832275e-06, -1.1427327990531921e-06, -7.916241884231567e-07, -4.4051557779312134e-07, -8.940696716308594e-08, 2.6170164346694946e-07, 6.128102540969849e-07, 9.639188647270203e-07, 1.3150274753570557e-06, 1.666136085987091e-06, 2.0172446966171265e-06, 2.368353307247162e-06, 2.7194619178771973e-06, 3.0705705285072327e-06, 3.421679139137268e-06, 3.7727877497673035e-06, 4.123896360397339e-06, 4.475004971027374e-06, 4.82611358165741e-06, 5.177222192287445e-06, 5.5283308029174805e-06, 5.879439413547516e-06, 6.230548024177551e-06, 6.581656634807587e-06, 6.932765245437622e-06, 7.2838738560676575e-06, 7.634982466697693e-06, 7.986091077327728e-06, 8.337199687957764e-06, 8.688308298587799e-06, 9.039416909217834e-06, 9.39052551984787e-06, 9.741634130477905e-06, 1.009274274110794e-05, 1.0443851351737976e-05, 1.0794959962368011e-05, 1.1146068572998047e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 5.0, 9.0, 7.0, 13.0, 24.0, 36.0, 55.0, 118.0, 333.0, 1906.0, 1043067.0, 2321.0, 365.0, 123.0, 72.0, 34.0, 23.0, 15.0, 8.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9591064453125e-05, -4.791188985109329e-05, -4.6232715249061584e-05, -4.455354064702988e-05, -4.287436604499817e-05, -4.119519144296646e-05, -3.9516016840934753e-05, -3.7836842238903046e-05, -3.615766763687134e-05, -3.447849303483963e-05, -3.279931843280792e-05, -3.1120143830776215e-05, -2.9440969228744507e-05, -2.77617946267128e-05, -2.608262002468109e-05, -2.4403445422649384e-05, -2.2724270820617676e-05, -2.1045096218585968e-05, -1.936592161655426e-05, -1.7686747014522552e-05, -1.6007572412490845e-05, -1.4328397810459137e-05, -1.264922320842743e-05, -1.0970048606395721e-05, -9.290874004364014e-06, -7.611699402332306e-06, -5.932524800300598e-06, -4.25335019826889e-06, -2.5741755962371826e-06, -8.950009942054749e-07, 7.841736078262329e-07, 2.4633482098579407e-06, 4.1425228118896484e-06, 5.821697413921356e-06, 7.500872015953064e-06, 9.180046617984772e-06, 1.085922122001648e-05, 1.2538395822048187e-05, 1.4217570424079895e-05, 1.5896745026111603e-05, 1.757591962814331e-05, 1.925509423017502e-05, 2.0934268832206726e-05, 2.2613443434238434e-05, 2.429261803627014e-05, 2.597179263830185e-05, 2.7650967240333557e-05, 2.9330141842365265e-05, 3.100931644439697e-05, 3.268849104642868e-05, 3.436766564846039e-05, 3.6046840250492096e-05, 3.7726014852523804e-05, 3.940518945455551e-05, 4.108436405658722e-05, 4.276353865861893e-05, 4.4442713260650635e-05, 4.612188786268234e-05, 4.780106246471405e-05, 4.948023706674576e-05, 5.1159411668777466e-05, 5.2838586270809174e-05, 5.451776087284088e-05, 5.619693547487259e-05, 5.78761100769043e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 4.0, 8.0, 4.0, 7.0, 11.0, 13.0, 22.0, 29.0, 55.0, 130.0, 440.0, 107.0, 65.0, 35.0, 28.0, 9.0, 12.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6524066925048828e-05, -2.5626271963119507e-05, -2.4728477001190186e-05, -2.3830682039260864e-05, -2.2932887077331543e-05, -2.203509211540222e-05, -2.11372971534729e-05, -2.023950219154358e-05, -1.9341707229614258e-05, -1.8443912267684937e-05, -1.7546117305755615e-05, -1.6648322343826294e-05, -1.5750527381896973e-05, -1.4852732419967651e-05, -1.395493745803833e-05, -1.3057142496109009e-05, -1.2159347534179688e-05, -1.1261552572250366e-05, -1.0363757610321045e-05, -9.465962648391724e-06, -8.568167686462402e-06, -7.670372724533081e-06, -6.77257776260376e-06, -5.8747828006744385e-06, -4.976987838745117e-06, -4.079192876815796e-06, -3.1813979148864746e-06, -2.2836029529571533e-06, -1.385807991027832e-06, -4.880130290985107e-07, 4.0978193283081055e-07, 1.3075768947601318e-06, 2.205371856689453e-06, 3.1031668186187744e-06, 4.000961780548096e-06, 4.898756742477417e-06, 5.796551704406738e-06, 6.6943466663360596e-06, 7.592141628265381e-06, 8.489936590194702e-06, 9.387731552124023e-06, 1.0285526514053345e-05, 1.1183321475982666e-05, 1.2081116437911987e-05, 1.2978911399841309e-05, 1.387670636177063e-05, 1.4774501323699951e-05, 1.5672296285629272e-05, 1.6570091247558594e-05, 1.7467886209487915e-05, 1.8365681171417236e-05, 1.9263476133346558e-05, 2.016127109527588e-05, 2.10590660572052e-05, 2.195686101913452e-05, 2.2854655981063843e-05, 2.3752450942993164e-05, 2.4650245904922485e-05, 2.5548040866851807e-05, 2.6445835828781128e-05, 2.734363079071045e-05, 2.824142575263977e-05, 2.9139220714569092e-05, 3.0037015676498413e-05, 3.0934810638427734e-05]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0, 121.0, 854.0, 30.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07917436212301254, -0.07066558301448822, -0.062156811356544495, -0.05364803597331047, -0.04513926059007645, -0.03663048520684242, -0.0281217098236084, -0.019612934440374374, -0.01110415905714035, -0.0025953836739063263, 0.005913391709327698, 0.014422167092561722, 0.022930942475795746, 0.03143971785902977, 0.039948493242263794, 0.04845726862549782, 0.05696604400873184, 0.06547482311725616, 0.07398359477519989, 0.08249236643314362, 0.09100114554166794, 0.09950992465019226, 0.10801869630813599, 0.11652746796607971, 0.12503623962402344, 0.13354501128196716, 0.1420537829399109, 0.1505625694990158, 0.15907134115695953, 0.16758011281490326, 0.17608889937400818, 0.1845976710319519, 0.19310647249221802, 0.20161524415016174, 0.21012401580810547, 0.2186328023672104, 0.2271415740251541, 0.23565034568309784, 0.24415913224220276, 0.2526679039001465, 0.2611766755580902, 0.26968544721603394, 0.27819421887397766, 0.2867029905319214, 0.2952117919921875, 0.3037205636501312, 0.31222933530807495, 0.3207381069660187, 0.3292468786239624, 0.33775565028190613, 0.34626442193984985, 0.3547731935977936, 0.3632819652557373, 0.3717907667160034, 0.38029953837394714, 0.38880831003189087, 0.3973170816898346, 0.4058258533477783, 0.41433462500572205, 0.42284339666366577, 0.4313521981239319, 0.4398609697818756, 0.44836974143981934, 0.45687851309776306, 0.4653872847557068]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 10.0, 10.0, 14.0, 11.0, 22.0, 24.0, 27.0, 38.0, 28.0, 39.0, 48.0, 59.0, 65.0, 50.0, 53.0, 48.0, 57.0, 54.0, 48.0, 47.0, 41.0, 36.0, 35.0, 21.0, 23.0, 22.0, 18.0, 17.0, 9.0, 2.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.15125852823257446, -0.14704565703868866, -0.14283278584480286, -0.13861992955207825, -0.13440705835819244, -0.13019418716430664, -0.12598131597042084, -0.12176844477653503, -0.11755558103322983, -0.11334270983934402, -0.10912984609603882, -0.10491697490215302, -0.10070410370826721, -0.096491239964962, -0.0922783687710762, -0.088065505027771, -0.08385263383388519, -0.07963976263999939, -0.07542689889669418, -0.07121402770280838, -0.06700116395950317, -0.06278829276561737, -0.05857542157173157, -0.05436255410313606, -0.05014968663454056, -0.04593681916594505, -0.04172395169734955, -0.037511080503463745, -0.03329821303486824, -0.029085345566272736, -0.02487247623503208, -0.020659606903791428, -0.016446739435195923, -0.012233871035277843, -0.008021002635359764, -0.0038081342354416847, 0.00040473416447639465, 0.004617601633071899, 0.008830470964312553, 0.013043340295553207, 0.017256207764148712, 0.021469075232744217, 0.02568194456398487, 0.029894813895225525, 0.03410768136382103, 0.038320548832416534, 0.04253342002630234, 0.04674628749489784, 0.05095915496349335, 0.05517202243208885, 0.05938488990068436, 0.06359776109457016, 0.06781062483787537, 0.07202349603176117, 0.07623636722564697, 0.08044923841953278, 0.08466210216283798, 0.08887497335672379, 0.09308783710002899, 0.0973007082939148, 0.1015135794878006, 0.1057264432311058, 0.10993931442499161, 0.11415217816829681, 0.11836504936218262]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 2.0, 4.0, 3.0, 9.0, 5.0, 10.0, 7.0, 12.0, 25.0, 23.0, 19.0, 41.0, 44.0, 735.0, 3518.0, 4094215.0, 93020.0, 2069.0, 274.0, 39.0, 35.0, 24.0, 28.0, 16.0, 16.0, 12.0, 10.0, 10.0, 9.0, 4.0, 8.0, 2.0, 10.0, 2.0, 4.0, 3.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0151824951171875, -0.014658451080322266, -0.014134407043457031, -0.013610363006591797, -0.013086318969726562, -0.012562274932861328, -0.012038230895996094, -0.01151418685913086, -0.010990142822265625, -0.01046609878540039, -0.009942054748535156, -0.009418010711669922, -0.008893966674804688, -0.008369922637939453, -0.007845878601074219, -0.007321834564208984, -0.00679779052734375, -0.006273746490478516, -0.005749702453613281, -0.005225658416748047, -0.0047016143798828125, -0.004177570343017578, -0.0036535263061523438, -0.0031294822692871094, -0.002605438232421875, -0.0020813941955566406, -0.0015573501586914062, -0.0010333061218261719, -0.0005092620849609375, 1.4781951904296875e-05, 0.0005388259887695312, 0.0010628700256347656, 0.0015869140625, 0.0021109580993652344, 0.0026350021362304688, 0.003159046173095703, 0.0036830902099609375, 0.004207134246826172, 0.004731178283691406, 0.005255222320556641, 0.005779266357421875, 0.006303310394287109, 0.006827354431152344, 0.007351398468017578, 0.007875442504882812, 0.008399486541748047, 0.008923530578613281, 0.009447574615478516, 0.00997161865234375, 0.010495662689208984, 0.011019706726074219, 0.011543750762939453, 0.012067794799804688, 0.012591838836669922, 0.013115882873535156, 0.01363992691040039, 0.014163970947265625, 0.01468801498413086, 0.015212059020996094, 0.015736103057861328, 0.016260147094726562, 0.016784191131591797, 0.01730823516845703, 0.017832279205322266, 0.0183563232421875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 5.0, 3.0, 5.0, 14.0, 10.0, 10.0, 9.0, 25.0, 89.0, 184.0, 266.0, 184.0, 71.0, 18.0, 9.0, 11.0, 10.0, 11.0, 6.0, 5.0, 4.0, 2.0, 3.0, 5.0, 1.0, 4.0, 3.0, 6.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007389068603515625, -0.007132232189178467, -0.006875395774841309, -0.00661855936050415, -0.006361722946166992, -0.006104886531829834, -0.005848050117492676, -0.005591213703155518, -0.005334377288818359, -0.005077540874481201, -0.004820704460144043, -0.004563868045806885, -0.0043070316314697266, -0.004050195217132568, -0.00379335880279541, -0.003536522388458252, -0.0032796859741210938, -0.0030228495597839355, -0.0027660131454467773, -0.002509176731109619, -0.002252340316772461, -0.0019955039024353027, -0.0017386674880981445, -0.0014818310737609863, -0.0012249946594238281, -0.0009681582450866699, -0.0007113218307495117, -0.0004544854164123535, -0.0001976490020751953, 5.918741226196289e-05, 0.0003160238265991211, 0.0005728602409362793, 0.0008296966552734375, 0.0010865330696105957, 0.001343369483947754, 0.0016002058982849121, 0.0018570423126220703, 0.0021138787269592285, 0.0023707151412963867, 0.002627551555633545, 0.002884387969970703, 0.0031412243843078613, 0.0033980607986450195, 0.0036548972129821777, 0.003911733627319336, 0.004168570041656494, 0.004425406455993652, 0.0046822428703308105, 0.004939079284667969, 0.005195915699005127, 0.005452752113342285, 0.005709588527679443, 0.0059664249420166016, 0.00622326135635376, 0.006480097770690918, 0.006736934185028076, 0.006993770599365234, 0.007250607013702393, 0.007507443428039551, 0.007764279842376709, 0.008021116256713867, 0.008277952671051025, 0.008534789085388184, 0.008791625499725342, 0.0090484619140625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 7.0, 27.0, 97.0, 317.0, 678.0, 2795.0, 4186952.0, 2259.0, 639.0, 334.0, 108.0, 35.0, 11.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0201416015625, -0.019408464431762695, -0.01867532730102539, -0.017942190170288086, -0.01720905303955078, -0.016475915908813477, -0.015742778778076172, -0.015009641647338867, -0.014276504516601562, -0.013543367385864258, -0.012810230255126953, -0.012077093124389648, -0.011343955993652344, -0.010610818862915039, -0.009877681732177734, -0.00914454460144043, -0.008411407470703125, -0.00767827033996582, -0.006945133209228516, -0.006211996078491211, -0.005478858947753906, -0.0047457218170166016, -0.004012584686279297, -0.003279447555541992, -0.0025463104248046875, -0.0018131732940673828, -0.0010800361633300781, -0.00034689903259277344, 0.00038623809814453125, 0.001119375228881836, 0.0018525123596191406, 0.0025856494903564453, 0.00331878662109375, 0.004051923751831055, 0.004785060882568359, 0.005518198013305664, 0.006251335144042969, 0.0069844722747802734, 0.007717609405517578, 0.008450746536254883, 0.009183883666992188, 0.009917020797729492, 0.010650157928466797, 0.011383295059204102, 0.012116432189941406, 0.012849569320678711, 0.013582706451416016, 0.01431584358215332, 0.015048980712890625, 0.01578211784362793, 0.016515254974365234, 0.01724839210510254, 0.017981529235839844, 0.01871466636657715, 0.019447803497314453, 0.020180940628051758, 0.020914077758789062, 0.021647214889526367, 0.022380352020263672, 0.023113489151000977, 0.02384662628173828, 0.024579763412475586, 0.02531290054321289, 0.026046037673950195, 0.0267791748046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 16.0, 24.0, 351.0, 3635.0, 33.0, 11.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0094451904296875, -0.009190082550048828, -0.008934974670410156, -0.008679866790771484, -0.008424758911132812, -0.00816965103149414, -0.007914543151855469, -0.007659435272216797, -0.007404327392578125, -0.007149219512939453, -0.006894111633300781, -0.006639003753662109, -0.0063838958740234375, -0.006128787994384766, -0.005873680114746094, -0.005618572235107422, -0.00536346435546875, -0.005108356475830078, -0.004853248596191406, -0.004598140716552734, -0.0043430328369140625, -0.004087924957275391, -0.0038328170776367188, -0.003577709197998047, -0.003322601318359375, -0.003067493438720703, -0.0028123855590820312, -0.0025572776794433594, -0.0023021697998046875, -0.0020470619201660156, -0.0017919540405273438, -0.0015368461608886719, -0.00128173828125, -0.0010266304016113281, -0.0007715225219726562, -0.0005164146423339844, -0.0002613067626953125, -6.198883056640625e-06, 0.00024890899658203125, 0.0005040168762207031, 0.000759124755859375, 0.0010142326354980469, 0.0012693405151367188, 0.0015244483947753906, 0.0017795562744140625, 0.0020346641540527344, 0.0022897720336914062, 0.002544879913330078, 0.00279998779296875, 0.003055095672607422, 0.0033102035522460938, 0.0035653114318847656, 0.0038204193115234375, 0.004075527191162109, 0.004330635070800781, 0.004585742950439453, 0.004840850830078125, 0.005095958709716797, 0.005351066589355469, 0.005606174468994141, 0.0058612823486328125, 0.006116390228271484, 0.006371498107910156, 0.006626605987548828, 0.0068817138671875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 993.0, 14.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02370830811560154, -0.02196001075208187, -0.02021171525120735, -0.018463417887687683, -0.016715120524168015, -0.01496682409197092, -0.013218527659773827, -0.011470230296254158, -0.009721933864057064, -0.00797363743185997, -0.0062253400683403015, -0.0044770436361432076, -0.0027287467382848263, -0.000980449840426445, 0.000767846591770649, 0.0025161439552903175, 0.0042644403874874115, 0.006012737285345793, 0.007761034183204174, 0.009509330615401268, 0.011257627978920937, 0.01300592441111803, 0.014754220843315125, 0.016502518206834793, 0.01825081557035446, 0.01999911293387413, 0.02174740843474865, 0.023495705798268318, 0.025244003161787987, 0.026992298662662506, 0.028740596026182175, 0.030488893389701843, 0.03223719075322151, 0.03398548811674118, 0.03573378548026085, 0.03748208284378052, 0.03923037648200989, 0.040978673845529556, 0.042726971209049225, 0.04447526857256889, 0.04622356593608856, 0.04797186329960823, 0.0497201606631279, 0.05146845430135727, 0.05321675166487694, 0.054965049028396606, 0.056713346391916275, 0.058461643755435944, 0.060209937393665314, 0.06195823475718498, 0.06370653212070465, 0.06545482575893402, 0.06720312684774399, 0.06895142048597336, 0.07069972157478333, 0.0724480152130127, 0.07419631630182266, 0.07594460994005203, 0.077692911028862, 0.07944120466709137, 0.08118950575590134, 0.0829377993941307, 0.08468610048294067, 0.08643439412117004, 0.08818268775939941]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 12.0, 21.0, 24.0, 43.0, 38.0, 60.0, 80.0, 75.0, 86.0, 106.0, 109.0, 91.0, 67.0, 49.0, 39.0, 33.0, 24.0, 14.0, 5.0, 7.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01140064001083374, -0.011000651866197586, -0.010600663721561432, -0.010200675576925278, -0.009800687432289124, -0.00940069928765297, -0.009000711143016815, -0.008600722998380661, -0.008200734853744507, -0.007800746709108353, -0.0074007585644721985, -0.007000770419836044, -0.00660078227519989, -0.006200794130563736, -0.005800805985927582, -0.005400817841291428, -0.0050008296966552734, -0.004600841552019119, -0.004200853407382965, -0.003800865262746811, -0.0034008771181106567, -0.0030008889734745026, -0.0026009008288383484, -0.002200912684202194, -0.00180092453956604, -0.0014009363949298859, -0.0010009482502937317, -0.0006009601056575775, -0.00020097196102142334, 0.00019901618361473083, 0.000599004328250885, 0.0009989924728870392, 0.0013989806175231934, 0.0017989687621593475, 0.0021989569067955017, 0.002598945051431656, 0.00299893319606781, 0.0033989213407039642, 0.0037989094853401184, 0.004198897629976273, 0.004598885774612427, 0.004998873919248581, 0.005398862063884735, 0.005798850208520889, 0.0061988383531570435, 0.006598826497793198, 0.006998814642429352, 0.007398802787065506, 0.00779879093170166, 0.008198779076337814, 0.008598767220973969, 0.008998755365610123, 0.009398743510246277, 0.009798731654882431, 0.010198719799518585, 0.01059870794415474, 0.010998696088790894, 0.011398684233427048, 0.011798672378063202, 0.012198660522699356, 0.01259864866733551, 0.012998636811971664, 0.013398624956607819, 0.013798613101243973, 0.014198601245880127]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 8.0, 8.0, 6.0, 14.0, 18.0, 26.0, 33.0, 46.0, 89.0, 143.0, 269.0, 466.0, 864.0, 1899.0, 4055.0, 11287.0, 63361.0, 927677.0, 25599.0, 6909.0, 2770.0, 1331.0, 721.0, 359.0, 198.0, 130.0, 93.0, 59.0, 34.0, 27.0, 17.0, 7.0, 5.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0181427001953125, -0.017628788948059082, -0.017114877700805664, -0.016600966453552246, -0.016087055206298828, -0.01557314395904541, -0.015059232711791992, -0.014545321464538574, -0.014031410217285156, -0.013517498970031738, -0.01300358772277832, -0.012489676475524902, -0.011975765228271484, -0.011461853981018066, -0.010947942733764648, -0.01043403148651123, -0.009920120239257812, -0.009406208992004395, -0.008892297744750977, -0.008378386497497559, -0.00786447525024414, -0.007350564002990723, -0.006836652755737305, -0.006322741508483887, -0.005808830261230469, -0.005294919013977051, -0.004781007766723633, -0.004267096519470215, -0.003753185272216797, -0.003239274024963379, -0.002725362777709961, -0.002211451530456543, -0.001697540283203125, -0.001183629035949707, -0.0006697177886962891, -0.0001558065414428711, 0.0003581047058105469, 0.0008720159530639648, 0.0013859272003173828, 0.0018998384475708008, 0.0024137496948242188, 0.0029276609420776367, 0.0034415721893310547, 0.003955483436584473, 0.004469394683837891, 0.004983305931091309, 0.0054972171783447266, 0.0060111284255981445, 0.0065250396728515625, 0.0070389509201049805, 0.0075528621673583984, 0.008066773414611816, 0.008580684661865234, 0.009094595909118652, 0.00960850715637207, 0.010122418403625488, 0.010636329650878906, 0.011150240898132324, 0.011664152145385742, 0.01217806339263916, 0.012691974639892578, 0.013205885887145996, 0.013719797134399414, 0.014233708381652832, 0.01474761962890625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 6.0, 2.0, 6.0, 3.0, 5.0, 14.0, 10.0, 10.0, 9.0, 25.0, 88.0, 182.0, 265.0, 188.0, 69.0, 20.0, 9.0, 11.0, 10.0, 11.0, 6.0, 5.0, 4.0, 2.0, 3.0, 5.0, 1.0, 4.0, 4.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007396697998046875, -0.007139742374420166, -0.006882786750793457, -0.006625831127166748, -0.006368875503540039, -0.00611191987991333, -0.005854964256286621, -0.005598008632659912, -0.005341053009033203, -0.005084097385406494, -0.004827141761779785, -0.004570186138153076, -0.004313230514526367, -0.004056274890899658, -0.0037993192672729492, -0.0035423636436462402, -0.0032854080200195312, -0.0030284523963928223, -0.0027714967727661133, -0.0025145411491394043, -0.0022575855255126953, -0.0020006299018859863, -0.0017436742782592773, -0.0014867186546325684, -0.0012297630310058594, -0.0009728074073791504, -0.0007158517837524414, -0.0004588961601257324, -0.00020194053649902344, 5.501508712768555e-05, 0.00031197071075439453, 0.0005689263343811035, 0.0008258819580078125, 0.0010828375816345215, 0.0013397932052612305, 0.0015967488288879395, 0.0018537044525146484, 0.0021106600761413574, 0.0023676156997680664, 0.0026245713233947754, 0.0028815269470214844, 0.0031384825706481934, 0.0033954381942749023, 0.0036523938179016113, 0.00390934944152832, 0.004166305065155029, 0.004423260688781738, 0.004680216312408447, 0.004937171936035156, 0.005194127559661865, 0.005451083183288574, 0.005708038806915283, 0.005964994430541992, 0.006221950054168701, 0.00647890567779541, 0.006735861301422119, 0.006992816925048828, 0.007249772548675537, 0.007506728172302246, 0.007763683795928955, 0.008020639419555664, 0.008277595043182373, 0.008534550666809082, 0.008791506290435791, 0.0090484619140625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 8.0, 8.0, 2.0, 10.0, 11.0, 11.0, 13.0, 20.0, 25.0, 31.0, 26.0, 44.0, 45.0, 71.0, 91.0, 131.0, 190.0, 343.0, 767.0, 2016.0, 31238.0, 1004130.0, 6436.0, 1385.0, 563.0, 241.0, 190.0, 115.0, 89.0, 60.0, 52.0, 40.0, 25.0, 24.0, 19.0, 21.0, 9.0, 13.0, 11.0, 6.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0275421142578125, -0.026662826538085938, -0.025783538818359375, -0.024904251098632812, -0.02402496337890625, -0.023145675659179688, -0.022266387939453125, -0.021387100219726562, -0.0205078125, -0.019628524780273438, -0.018749237060546875, -0.017869949340820312, -0.01699066162109375, -0.016111373901367188, -0.015232086181640625, -0.014352798461914062, -0.0134735107421875, -0.012594223022460938, -0.011714935302734375, -0.010835647583007812, -0.00995635986328125, -0.009077072143554688, -0.008197784423828125, -0.0073184967041015625, -0.006439208984375, -0.0055599212646484375, -0.004680633544921875, -0.0038013458251953125, -0.00292205810546875, -0.0020427703857421875, -0.001163482666015625, -0.0002841949462890625, 0.0005950927734375, 0.0014743804931640625, 0.002353668212890625, 0.0032329559326171875, 0.00411224365234375, 0.0049915313720703125, 0.005870819091796875, 0.0067501068115234375, 0.00762939453125, 0.008508682250976562, 0.009387969970703125, 0.010267257690429688, 0.01114654541015625, 0.012025833129882812, 0.012905120849609375, 0.013784408569335938, 0.0146636962890625, 0.015542984008789062, 0.016422271728515625, 0.017301559448242188, 0.01818084716796875, 0.019060134887695312, 0.019939422607421875, 0.020818710327148438, 0.021697998046875, 0.022577285766601562, 0.023456573486328125, 0.024335861206054688, 0.02521514892578125, 0.026094436645507812, 0.026973724365234375, 0.027853012084960938, 0.0287322998046875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 8.0, 7.0, 2.0, 10.0, 11.0, 11.0, 12.0, 15.0, 22.0, 23.0, 20.0, 21.0, 23.0, 35.0, 28.0, 35.0, 38.0, 36.0, 39.0, 29.0, 55.0, 43.0, 39.0, 51.0, 31.0, 27.0, 44.0, 37.0, 35.0, 27.0, 30.0, 26.0, 21.0, 17.0, 16.0, 17.0, 7.0, 12.0, 11.0, 6.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.01953125, -0.01890707015991211, -0.01828289031982422, -0.017658710479736328, -0.017034530639648438, -0.016410350799560547, -0.015786170959472656, -0.015161991119384766, -0.014537811279296875, -0.013913631439208984, -0.013289451599121094, -0.012665271759033203, -0.012041091918945312, -0.011416912078857422, -0.010792732238769531, -0.01016855239868164, -0.00954437255859375, -0.00892019271850586, -0.008296012878417969, -0.007671833038330078, -0.0070476531982421875, -0.006423473358154297, -0.005799293518066406, -0.005175113677978516, -0.004550933837890625, -0.003926753997802734, -0.0033025741577148438, -0.002678394317626953, -0.0020542144775390625, -0.0014300346374511719, -0.0008058547973632812, -0.00018167495727539062, 0.0004425048828125, 0.0010666847229003906, 0.0016908645629882812, 0.002315044403076172, 0.0029392242431640625, 0.003563404083251953, 0.004187583923339844, 0.004811763763427734, 0.005435943603515625, 0.006060123443603516, 0.006684303283691406, 0.007308483123779297, 0.007932662963867188, 0.008556842803955078, 0.009181022644042969, 0.00980520248413086, 0.01042938232421875, 0.01105356216430664, 0.011677742004394531, 0.012301921844482422, 0.012926101684570312, 0.013550281524658203, 0.014174461364746094, 0.014798641204833984, 0.015422821044921875, 0.016047000885009766, 0.016671180725097656, 0.017295360565185547, 0.017919540405273438, 0.018543720245361328, 0.01916790008544922, 0.01979207992553711, 0.020416259765625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 6.0, 1.0, 7.0, 9.0, 18.0, 20.0, 18.0, 45.0, 45.0, 66.0, 185.0, 246.0, 851.0, 2367.0, 27037.0, 951864.0, 58576.0, 5323.0, 972.0, 451.0, 149.0, 104.0, 69.0, 37.0, 24.0, 10.0, 14.0, 15.0, 5.0, 5.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-1.0192394256591797e-05, -9.928829967975616e-06, -9.665265679359436e-06, -9.401701390743256e-06, -9.138137102127075e-06, -8.874572813510895e-06, -8.611008524894714e-06, -8.347444236278534e-06, -8.083879947662354e-06, -7.820315659046173e-06, -7.556751370429993e-06, -7.293187081813812e-06, -7.029622793197632e-06, -6.766058504581451e-06, -6.502494215965271e-06, -6.2389299273490906e-06, -5.97536563873291e-06, -5.71180135011673e-06, -5.448237061500549e-06, -5.184672772884369e-06, -4.9211084842681885e-06, -4.657544195652008e-06, -4.393979907035828e-06, -4.130415618419647e-06, -3.866851329803467e-06, -3.6032870411872864e-06, -3.339722752571106e-06, -3.0761584639549255e-06, -2.812594175338745e-06, -2.5490298867225647e-06, -2.2854655981063843e-06, -2.021901309490204e-06, -1.7583370208740234e-06, -1.494772732257843e-06, -1.2312084436416626e-06, -9.676441550254822e-07, -7.040798664093018e-07, -4.4051557779312134e-07, -1.7695128917694092e-07, 8.66129994392395e-08, 3.501772880554199e-07, 6.137415766716003e-07, 8.773058652877808e-07, 1.1408701539039612e-06, 1.4044344425201416e-06, 1.667998731136322e-06, 1.9315630197525024e-06, 2.195127308368683e-06, 2.4586915969848633e-06, 2.7222558856010437e-06, 2.985820174217224e-06, 3.2493844628334045e-06, 3.512948751449585e-06, 3.7765130400657654e-06, 4.040077328681946e-06, 4.303641617298126e-06, 4.567205905914307e-06, 4.830770194530487e-06, 5.0943344831466675e-06, 5.357898771762848e-06, 5.621463060379028e-06, 5.885027348995209e-06, 6.148591637611389e-06, 6.41215592622757e-06, 6.67572021484375e-06]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 6.0, 5.0, 14.0, 10.0, 13.0, 14.0, 21.0, 24.0, 55.0, 59.0, 83.0, 86.0, 204.0, 99.0, 77.0, 65.0, 62.0, 21.0, 15.0, 12.0, 12.0, 2.0, 5.0, 9.0, 7.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.450580596923828e-06, -7.257796823978424e-06, -7.06501305103302e-06, -6.872229278087616e-06, -6.679445505142212e-06, -6.486661732196808e-06, -6.293877959251404e-06, -6.101094186306e-06, -5.908310413360596e-06, -5.715526640415192e-06, -5.522742867469788e-06, -5.3299590945243835e-06, -5.1371753215789795e-06, -4.9443915486335754e-06, -4.751607775688171e-06, -4.558824002742767e-06, -4.366040229797363e-06, -4.173256456851959e-06, -3.980472683906555e-06, -3.787688910961151e-06, -3.594905138015747e-06, -3.402121365070343e-06, -3.209337592124939e-06, -3.016553819179535e-06, -2.823770046234131e-06, -2.630986273288727e-06, -2.4382025003433228e-06, -2.2454187273979187e-06, -2.0526349544525146e-06, -1.8598511815071106e-06, -1.6670674085617065e-06, -1.4742836356163025e-06, -1.2814998626708984e-06, -1.0887160897254944e-06, -8.959323167800903e-07, -7.031485438346863e-07, -5.103647708892822e-07, -3.175809979438782e-07, -1.2479722499847412e-07, 6.798654794692993e-08, 2.60770320892334e-07, 4.5355409383773804e-07, 6.463378667831421e-07, 8.391216397285461e-07, 1.0319054126739502e-06, 1.2246891856193542e-06, 1.4174729585647583e-06, 1.6102567315101624e-06, 1.8030405044555664e-06, 1.9958242774009705e-06, 2.1886080503463745e-06, 2.3813918232917786e-06, 2.5741755962371826e-06, 2.7669593691825867e-06, 2.9597431421279907e-06, 3.1525269150733948e-06, 3.345310688018799e-06, 3.538094460964203e-06, 3.730878233909607e-06, 3.923662006855011e-06, 4.116445779800415e-06, 4.309229552745819e-06, 4.502013325691223e-06, 4.694797098636627e-06, 4.887580871582031e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 6.0, 8.0, 14.0, 14.0, 22.0, 39.0, 66.0, 113.0, 194.0, 647.0, 23591.0, 1022085.0, 1133.0, 314.0, 126.0, 63.0, 32.0, 21.0, 20.0, 8.0, 7.0, 5.0, 2.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8298625946044922e-05, -1.7710961401462555e-05, -1.7123296856880188e-05, -1.653563231229782e-05, -1.5947967767715454e-05, -1.5360303223133087e-05, -1.477263867855072e-05, -1.4184974133968353e-05, -1.3597309589385986e-05, -1.300964504480362e-05, -1.2421980500221252e-05, -1.1834315955638885e-05, -1.1246651411056519e-05, -1.0658986866474152e-05, -1.0071322321891785e-05, -9.483657777309418e-06, -8.89599323272705e-06, -8.308328688144684e-06, -7.720664143562317e-06, -7.13299959897995e-06, -6.545335054397583e-06, -5.957670509815216e-06, -5.370005965232849e-06, -4.782341420650482e-06, -4.194676876068115e-06, -3.6070123314857483e-06, -3.0193477869033813e-06, -2.4316832423210144e-06, -1.8440186977386475e-06, -1.2563541531562805e-06, -6.686896085739136e-07, -8.102506399154663e-08, 5.066394805908203e-07, 1.0943040251731873e-06, 1.6819685697555542e-06, 2.269633114337921e-06, 2.857297658920288e-06, 3.444962203502655e-06, 4.032626748085022e-06, 4.620291292667389e-06, 5.207955837249756e-06, 5.795620381832123e-06, 6.38328492641449e-06, 6.970949470996857e-06, 7.558614015579224e-06, 8.14627856016159e-06, 8.733943104743958e-06, 9.321607649326324e-06, 9.909272193908691e-06, 1.0496936738491058e-05, 1.1084601283073425e-05, 1.1672265827655792e-05, 1.225993037223816e-05, 1.2847594916820526e-05, 1.3435259461402893e-05, 1.402292400598526e-05, 1.4610588550567627e-05, 1.5198253095149994e-05, 1.578591763973236e-05, 1.6373582184314728e-05, 1.6961246728897095e-05, 1.754891127347946e-05, 1.813657581806183e-05, 1.8724240362644196e-05, 1.9311904907226562e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 8.0, 10.0, 14.0, 21.0, 31.0, 28.0, 46.0, 72.0, 95.0, 386.0, 70.0, 71.0, 47.0, 34.0, 10.0, 13.0, 10.0, 3.0, 4.0, 2.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3053417205810547e-05, -1.2635253369808197e-05, -1.2217089533805847e-05, -1.1798925697803497e-05, -1.1380761861801147e-05, -1.0962598025798798e-05, -1.0544434189796448e-05, -1.0126270353794098e-05, -9.708106517791748e-06, -9.289942681789398e-06, -8.871778845787048e-06, -8.453615009784698e-06, -8.035451173782349e-06, -7.617287337779999e-06, -7.199123501777649e-06, -6.780959665775299e-06, -6.362795829772949e-06, -5.944631993770599e-06, -5.5264681577682495e-06, -5.1083043217659e-06, -4.69014048576355e-06, -4.2719766497612e-06, -3.85381281375885e-06, -3.4356489777565002e-06, -3.0174851417541504e-06, -2.5993213057518005e-06, -2.1811574697494507e-06, -1.7629936337471008e-06, -1.344829797744751e-06, -9.266659617424011e-07, -5.085021257400513e-07, -9.033828973770142e-08, 3.2782554626464844e-07, 7.459893822669983e-07, 1.1641532182693481e-06, 1.582317054271698e-06, 2.000480890274048e-06, 2.4186447262763977e-06, 2.8368085622787476e-06, 3.2549723982810974e-06, 3.6731362342834473e-06, 4.091300070285797e-06, 4.509463906288147e-06, 4.927627742290497e-06, 5.345791578292847e-06, 5.7639554142951965e-06, 6.182119250297546e-06, 6.600283086299896e-06, 7.018446922302246e-06, 7.436610758304596e-06, 7.854774594306946e-06, 8.272938430309296e-06, 8.691102266311646e-06, 9.109266102313995e-06, 9.527429938316345e-06, 9.945593774318695e-06, 1.0363757610321045e-05, 1.0781921446323395e-05, 1.1200085282325745e-05, 1.1618249118328094e-05, 1.2036412954330444e-05, 1.2454576790332794e-05, 1.2872740626335144e-05, 1.3290904462337494e-05, 1.3709068298339844e-05]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 40.0, 599.0, 346.0, 21.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10943986475467682, -0.10366286337375641, -0.0978858694434166, -0.09210887551307678, -0.08633187413215637, -0.08055487275123596, -0.07477787882089615, -0.06900088489055634, -0.06322388350963593, -0.057446885854005814, -0.0516698881983757, -0.04589289054274559, -0.04011589288711548, -0.03433889523148537, -0.028561897575855255, -0.022784899920225143, -0.017007902264595032, -0.01123090460896492, -0.005453906953334808, 0.00032309070229530334, 0.006100088357925415, 0.011877086013555527, 0.01765408366918564, 0.02343108132481575, 0.029208078980445862, 0.034985076636075974, 0.040762074291706085, 0.0465390719473362, 0.05231606960296631, 0.05809306725859642, 0.06387006491422653, 0.06964705884456635, 0.07542404532432556, 0.08120104670524597, 0.08697804063558578, 0.0927550345659256, 0.09853203594684601, 0.10430903732776642, 0.11008603125810623, 0.11586302518844604, 0.12164002656936646, 0.12741702795028687, 0.13319402933120728, 0.1389710158109665, 0.1447480171918869, 0.1505250185728073, 0.15630200505256653, 0.16207900643348694, 0.16785600781440735, 0.17363300919532776, 0.17941001057624817, 0.18518699705600739, 0.1909639984369278, 0.1967409998178482, 0.20251798629760742, 0.20829498767852783, 0.21407198905944824, 0.21984899044036865, 0.22562599182128906, 0.23140297830104828, 0.2371799796819687, 0.2429569810628891, 0.24873396754264832, 0.2545109689235687, 0.26028797030448914]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 5.0, 9.0, 8.0, 16.0, 7.0, 12.0, 14.0, 18.0, 16.0, 10.0, 21.0, 22.0, 26.0, 35.0, 37.0, 35.0, 36.0, 49.0, 47.0, 46.0, 50.0, 41.0, 38.0, 38.0, 56.0, 37.0, 35.0, 23.0, 29.0, 29.0, 38.0, 17.0, 28.0, 10.0, 13.0, 7.0, 10.0, 9.0, 7.0, 9.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11164200305938721, -0.10829945653676987, -0.10495691001415253, -0.10161437094211578, -0.09827182441949844, -0.0949292778968811, -0.09158673882484436, -0.08824419230222702, -0.08490164577960968, -0.08155909925699234, -0.078216552734375, -0.07487401366233826, -0.07153146713972092, -0.06818892061710358, -0.06484638154506683, -0.06150383502244949, -0.05816128849983215, -0.05481874197721481, -0.05147619917988777, -0.04813365638256073, -0.04479110985994339, -0.04144856333732605, -0.03810602053999901, -0.03476347774267197, -0.031420931220054626, -0.028078386560082436, -0.024735841900110245, -0.021393297240138054, -0.018050752580165863, -0.014708207920193672, -0.011365663260221481, -0.00802311860024929, -0.0046805739402771, -0.0013380292803049088, 0.002004515379667282, 0.005347060039639473, 0.008689604699611664, 0.012032149359583855, 0.015374694019556046, 0.018717238679528236, 0.022059783339500427, 0.025402327999472618, 0.02874487265944481, 0.03208741545677185, 0.03542996197938919, 0.03877250850200653, 0.04211505129933357, 0.045457594096660614, 0.048800140619277954, 0.052142687141895294, 0.055485229939222336, 0.05882777273654938, 0.06217031925916672, 0.06551286578178406, 0.0688554048538208, 0.07219795137643814, 0.07554049789905548, 0.07888304442167282, 0.08222559094429016, 0.0855681300163269, 0.08891067653894424, 0.09225322306156158, 0.09559576213359833, 0.09893830865621567, 0.10228085517883301]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 6.0, 2.0, 4.0, 2.0, 5.0, 4.0, 2.0, 4.0, 7.0, 12.0, 12.0, 11.0, 6.0, 22.0, 72.0, 195.0, 4193549.0, 181.0, 79.0, 21.0, 10.0, 9.0, 7.0, 16.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0014276504516601562, -0.001387074589729309, -0.001346498727798462, -0.0013059228658676147, -0.0012653470039367676, -0.0012247711420059204, -0.0011841952800750732, -0.001143619418144226, -0.001103043556213379, -0.0010624676942825317, -0.0010218918323516846, -0.0009813159704208374, -0.0009407401084899902, -0.0009001642465591431, -0.0008595883846282959, -0.0008190125226974487, -0.0007784366607666016, -0.0007378607988357544, -0.0006972849369049072, -0.0006567090749740601, -0.0006161332130432129, -0.0005755573511123657, -0.0005349814891815186, -0.0004944056272506714, -0.0004538297653198242, -0.00041325390338897705, -0.0003726780414581299, -0.0003321021795272827, -0.00029152631759643555, -0.0002509504556655884, -0.0002103745937347412, -0.00016979873180389404, -0.00012922286987304688, -8.864700794219971e-05, -4.807114601135254e-05, -7.495284080505371e-06, 3.30805778503418e-05, 7.365643978118896e-05, 0.00011423230171203613, 0.0001548081636428833, 0.00019538402557373047, 0.00023595988750457764, 0.0002765357494354248, 0.00031711161136627197, 0.00035768747329711914, 0.0003982633352279663, 0.0004388391971588135, 0.00047941505908966064, 0.0005199909210205078, 0.000560566782951355, 0.0006011426448822021, 0.0006417185068130493, 0.0006822943687438965, 0.0007228702306747437, 0.0007634460926055908, 0.000804021954536438, 0.0008445978164672852, 0.0008851736783981323, 0.0009257495403289795, 0.0009663254022598267, 0.0010069012641906738, 0.001047477126121521, 0.0010880529880523682, 0.0011286288499832153, 0.0011692047119140625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 1.0, 5.0, 15.0, 11.0, 6.0, 11.0, 17.0, 66.0, 153.0, 264.0, 210.0, 100.0, 24.0, 11.0, 9.0, 13.0, 8.0, 8.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007415771484375, -0.007160305976867676, -0.0069048404693603516, -0.006649374961853027, -0.006393909454345703, -0.006138443946838379, -0.005882978439331055, -0.0056275129318237305, -0.005372047424316406, -0.005116581916809082, -0.004861116409301758, -0.004605650901794434, -0.004350185394287109, -0.004094719886779785, -0.003839254379272461, -0.0035837888717651367, -0.0033283233642578125, -0.0030728578567504883, -0.002817392349243164, -0.00256192684173584, -0.0023064613342285156, -0.0020509958267211914, -0.0017955303192138672, -0.001540064811706543, -0.0012845993041992188, -0.0010291337966918945, -0.0007736682891845703, -0.0005182027816772461, -0.0002627372741699219, -7.271766662597656e-06, 0.00024819374084472656, 0.0005036592483520508, 0.000759124755859375, 0.0010145902633666992, 0.0012700557708740234, 0.0015255212783813477, 0.0017809867858886719, 0.002036452293395996, 0.0022919178009033203, 0.0025473833084106445, 0.0028028488159179688, 0.003058314323425293, 0.003313779830932617, 0.0035692453384399414, 0.0038247108459472656, 0.00408017635345459, 0.004335641860961914, 0.004591107368469238, 0.0048465728759765625, 0.005102038383483887, 0.005357503890991211, 0.005612969398498535, 0.005868434906005859, 0.006123900413513184, 0.006379365921020508, 0.006634831428527832, 0.006890296936035156, 0.0071457624435424805, 0.007401227951049805, 0.007656693458557129, 0.007912158966064453, 0.008167624473571777, 0.008423089981079102, 0.008678555488586426, 0.00893402099609375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 17.0, 29.0, 43.0, 69.0, 81.0, 104.0, 88.0, 4193366.0, 105.0, 116.0, 80.0, 85.0, 43.0, 31.0, 17.0, 11.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.375810623168945e-05, -9.08728688955307e-05, -8.798763155937195e-05, -8.51023942232132e-05, -8.221715688705444e-05, -7.933191955089569e-05, -7.644668221473694e-05, -7.356144487857819e-05, -7.067620754241943e-05, -6.779097020626068e-05, -6.490573287010193e-05, -6.202049553394318e-05, -5.9135258197784424e-05, -5.625002086162567e-05, -5.336478352546692e-05, -5.0479546189308167e-05, -4.7594308853149414e-05, -4.470907151699066e-05, -4.182383418083191e-05, -3.893859684467316e-05, -3.6053359508514404e-05, -3.316812217235565e-05, -3.02828848361969e-05, -2.7397647500038147e-05, -2.4512410163879395e-05, -2.1627172827720642e-05, -1.874193549156189e-05, -1.5856698155403137e-05, -1.2971460819244385e-05, -1.0086223483085632e-05, -7.20098614692688e-06, -4.3157488107681274e-06, -1.430511474609375e-06, 1.4547258615493774e-06, 4.33996319770813e-06, 7.225200533866882e-06, 1.0110437870025635e-05, 1.2995675206184387e-05, 1.588091254234314e-05, 1.8766149878501892e-05, 2.1651387214660645e-05, 2.4536624550819397e-05, 2.742186188697815e-05, 3.0307099223136902e-05, 3.3192336559295654e-05, 3.607757389545441e-05, 3.896281123161316e-05, 4.184804856777191e-05, 4.4733285903930664e-05, 4.7618523240089417e-05, 5.050376057624817e-05, 5.338899791240692e-05, 5.6274235248565674e-05, 5.9159472584724426e-05, 6.204470992088318e-05, 6.492994725704193e-05, 6.781518459320068e-05, 7.070042192935944e-05, 7.358565926551819e-05, 7.647089660167694e-05, 7.93561339378357e-05, 8.224137127399445e-05, 8.51266086101532e-05, 8.801184594631195e-05, 9.08970832824707e-05]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4095.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 4.0046870708465576e-07, 8.009374141693115e-07, 1.2014061212539673e-06, 1.601874828338623e-06, 2.002343535423279e-06, 2.4028122425079346e-06, 2.8032809495925903e-06, 3.203749656677246e-06, 3.604218363761902e-06, 4.004687070846558e-06, 4.405155777931213e-06, 4.805624485015869e-06, 5.206093192100525e-06, 5.606561899185181e-06, 6.0070306062698364e-06, 6.407499313354492e-06, 6.807968020439148e-06, 7.208436727523804e-06, 7.6089054346084595e-06, 8.009374141693115e-06, 8.409842848777771e-06, 8.810311555862427e-06, 9.210780262947083e-06, 9.611248970031738e-06, 1.0011717677116394e-05, 1.041218638420105e-05, 1.0812655091285706e-05, 1.1213123798370361e-05, 1.1613592505455017e-05, 1.2014061212539673e-05, 1.2414529919624329e-05, 1.2814998626708984e-05, 1.321546733379364e-05, 1.3615936040878296e-05, 1.4016404747962952e-05, 1.4416873455047607e-05, 1.4817342162132263e-05, 1.5217810869216919e-05, 1.5618279576301575e-05, 1.601874828338623e-05, 1.6419216990470886e-05, 1.6819685697555542e-05, 1.7220154404640198e-05, 1.7620623111724854e-05, 1.802109181880951e-05, 1.8421560525894165e-05, 1.882202923297882e-05, 1.9222497940063477e-05, 1.9622966647148132e-05, 2.0023435354232788e-05, 2.0423904061317444e-05, 2.08243727684021e-05, 2.1224841475486755e-05, 2.162531018257141e-05, 2.2025778889656067e-05, 2.2426247596740723e-05, 2.282671630382538e-05, 2.3227185010910034e-05, 2.362765371799469e-05, 2.4028122425079346e-05, 2.4428591132164e-05, 2.4829059839248657e-05, 2.5229528546333313e-05, 2.562999725341797e-05]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 39.0, 971.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014892354374751449, -0.00014188833301886916, -0.00013485312229022384, -0.0001278179115615785, -0.00012078269355697557, -0.00011374748282833025, -0.00010671226482372731, -9.967705409508198e-05, -9.264184336643666e-05, -8.560663263779134e-05, -7.857142190914601e-05, -7.153620390454307e-05, -6.450099317589775e-05, -5.746578244725242e-05, -5.043056808062829e-05, -4.339535371400416e-05, -3.6360142985358834e-05, -2.9324930437724106e-05, -2.2289717890089378e-05, -1.525450534245465e-05, -8.219292794819921e-06, -1.1840820661745965e-06, 5.851132300449535e-06, 1.2886346667073667e-05, 1.9921557395718992e-05, 2.695676994335372e-05, 3.399198249098845e-05, 4.102719685761258e-05, 4.8062407586257905e-05, 5.509761831490323e-05, 6.213283631950617e-05, 6.916804704815149e-05, 7.620325777679682e-05, 8.323846850544214e-05, 9.027367923408747e-05, 9.73088972386904e-05, 0.00010434410796733573, 0.00011137931869598106, 0.000118414536700584, 0.00012544974742922932, 0.00013248495815787464, 0.00013952016888651997, 0.0001465553796151653, 0.00015359059034381062, 0.00016062581562437117, 0.0001676610263530165, 0.00017469623708166182, 0.00018173144781030715, 0.00018876665853895247, 0.0001958018692675978, 0.00020283707999624312, 0.00020987229072488844, 0.00021690750145353377, 0.0002239427121821791, 0.00023097793746273965, 0.00023801314819138497, 0.0002450483734719455, 0.00025208358420059085, 0.0002591187949292362, 0.0002661540056578815, 0.0002731892163865268, 0.00028022442711517215, 0.00028725963784381747, 0.0002942948485724628, 0.0003013300593011081]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 8.0, 7.0, 10.0, 48.0, 28.0, 92.0, 227.0, 99.0, 127.0, 182.0, 60.0, 43.0, 51.0, 4.0, 11.0, 0.0, 2.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2351741790771484e-05, -2.1179206669330597e-05, -2.000667154788971e-05, -1.8834136426448822e-05, -1.7661601305007935e-05, -1.6489066183567047e-05, -1.531653106212616e-05, -1.4143995940685272e-05, -1.2971460819244385e-05, -1.1798925697803497e-05, -1.062639057636261e-05, -9.453855454921722e-06, -8.281320333480835e-06, -7.1087852120399475e-06, -5.93625009059906e-06, -4.763714969158173e-06, -3.591179847717285e-06, -2.4186447262763977e-06, -1.2461096048355103e-06, -7.35744833946228e-08, 1.0989606380462646e-06, 2.271495759487152e-06, 3.4440308809280396e-06, 4.616566002368927e-06, 5.7891011238098145e-06, 6.961636245250702e-06, 8.13417136669159e-06, 9.306706488132477e-06, 1.0479241609573364e-05, 1.1651776731014252e-05, 1.282431185245514e-05, 1.3996846973896027e-05, 1.5169382095336914e-05, 1.63419172167778e-05, 1.751445233821869e-05, 1.8686987459659576e-05, 1.9859522581100464e-05, 2.103205770254135e-05, 2.220459282398224e-05, 2.3377127945423126e-05, 2.4549663066864014e-05, 2.57221981883049e-05, 2.689473330974579e-05, 2.8067268431186676e-05, 2.9239803552627563e-05, 3.041233867406845e-05, 3.158487379550934e-05, 3.2757408916950226e-05, 3.392994403839111e-05, 3.5102479159832e-05, 3.627501428127289e-05, 3.7447549402713776e-05, 3.862008452415466e-05, 3.979261964559555e-05, 4.096515476703644e-05, 4.2137689888477325e-05, 4.331022500991821e-05, 4.44827601313591e-05, 4.565529525279999e-05, 4.6827830374240875e-05, 4.800036549568176e-05, 4.917290061712265e-05, 5.034543573856354e-05, 5.1517970860004425e-05, 5.269050598144531e-05]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 10.0, 5.0, 10.0, 8.0, 16.0, 17.0, 22.0, 25.0, 38.0, 49.0, 66.0, 80.0, 136.0, 205.0, 344.0, 504.0, 840.0, 1540.0, 3387.0, 9820.0, 64883.0, 933796.0, 21672.0, 5688.0, 2219.0, 1169.0, 684.0, 440.0, 278.0, 178.0, 114.0, 84.0, 59.0, 41.0, 31.0, 20.0, 19.0, 14.0, 11.0, 10.0, 5.0, 8.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.020721435546875, -0.020058870315551758, -0.019396305084228516, -0.018733739852905273, -0.01807117462158203, -0.01740860939025879, -0.016746044158935547, -0.016083478927612305, -0.015420913696289062, -0.01475834846496582, -0.014095783233642578, -0.013433218002319336, -0.012770652770996094, -0.012108087539672852, -0.01144552230834961, -0.010782957077026367, -0.010120391845703125, -0.009457826614379883, -0.00879526138305664, -0.008132696151733398, -0.007470130920410156, -0.006807565689086914, -0.006145000457763672, -0.00548243522644043, -0.0048198699951171875, -0.004157304763793945, -0.003494739532470703, -0.002832174301147461, -0.0021696090698242188, -0.0015070438385009766, -0.0008444786071777344, -0.0001819133758544922, 0.00048065185546875, 0.0011432170867919922, 0.0018057823181152344, 0.0024683475494384766, 0.0031309127807617188, 0.003793478012084961, 0.004456043243408203, 0.005118608474731445, 0.0057811737060546875, 0.00644373893737793, 0.007106304168701172, 0.007768869400024414, 0.008431434631347656, 0.009093999862670898, 0.00975656509399414, 0.010419130325317383, 0.011081695556640625, 0.011744260787963867, 0.01240682601928711, 0.013069391250610352, 0.013731956481933594, 0.014394521713256836, 0.015057086944580078, 0.01571965217590332, 0.016382217407226562, 0.017044782638549805, 0.017707347869873047, 0.01836991310119629, 0.01903247833251953, 0.019695043563842773, 0.020357608795166016, 0.021020174026489258, 0.0216827392578125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 1.0, 5.0, 15.0, 11.0, 6.0, 11.0, 17.0, 66.0, 153.0, 263.0, 211.0, 100.0, 24.0, 11.0, 9.0, 13.0, 8.0, 8.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007415771484375, -0.007160305976867676, -0.0069048404693603516, -0.006649374961853027, -0.006393909454345703, -0.006138443946838379, -0.005882978439331055, -0.0056275129318237305, -0.005372047424316406, -0.005116581916809082, -0.004861116409301758, -0.004605650901794434, -0.004350185394287109, -0.004094719886779785, -0.003839254379272461, -0.0035837888717651367, -0.0033283233642578125, -0.0030728578567504883, -0.002817392349243164, -0.00256192684173584, -0.0023064613342285156, -0.0020509958267211914, -0.0017955303192138672, -0.001540064811706543, -0.0012845993041992188, -0.0010291337966918945, -0.0007736682891845703, -0.0005182027816772461, -0.0002627372741699219, -7.271766662597656e-06, 0.00024819374084472656, 0.0005036592483520508, 0.000759124755859375, 0.0010145902633666992, 0.0012700557708740234, 0.0015255212783813477, 0.0017809867858886719, 0.002036452293395996, 0.0022919178009033203, 0.0025473833084106445, 0.0028028488159179688, 0.003058314323425293, 0.003313779830932617, 0.0035692453384399414, 0.0038247108459472656, 0.00408017635345459, 0.004335641860961914, 0.004591107368469238, 0.0048465728759765625, 0.005102038383483887, 0.005357503890991211, 0.005612969398498535, 0.005868434906005859, 0.006123900413513184, 0.006379365921020508, 0.006634831428527832, 0.006890296936035156, 0.0071457624435424805, 0.007401227951049805, 0.007656693458557129, 0.007912158966064453, 0.008167624473571777, 0.008423089981079102, 0.008678555488586426, 0.00893402099609375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 5.0, 3.0, 13.0, 11.0, 10.0, 11.0, 11.0, 24.0, 23.0, 31.0, 34.0, 52.0, 71.0, 83.0, 109.0, 151.0, 212.0, 352.0, 686.0, 1449.0, 8627.0, 1021664.0, 11448.0, 1540.0, 689.0, 377.0, 219.0, 139.0, 127.0, 81.0, 64.0, 46.0, 43.0, 32.0, 18.0, 25.0, 12.0, 12.0, 13.0, 4.0, 8.0, 5.0, 4.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.0306854248046875, -0.029796838760375977, -0.028908252716064453, -0.02801966667175293, -0.027131080627441406, -0.026242494583129883, -0.02535390853881836, -0.024465322494506836, -0.023576736450195312, -0.02268815040588379, -0.021799564361572266, -0.020910978317260742, -0.02002239227294922, -0.019133806228637695, -0.018245220184326172, -0.01735663414001465, -0.016468048095703125, -0.015579462051391602, -0.014690876007080078, -0.013802289962768555, -0.012913703918457031, -0.012025117874145508, -0.011136531829833984, -0.010247945785522461, -0.009359359741210938, -0.008470773696899414, -0.007582187652587891, -0.006693601608276367, -0.005805015563964844, -0.00491642951965332, -0.004027843475341797, -0.0031392574310302734, -0.00225067138671875, -0.0013620853424072266, -0.0004734992980957031, 0.0004150867462158203, 0.0013036727905273438, 0.002192258834838867, 0.0030808448791503906, 0.003969430923461914, 0.0048580169677734375, 0.005746603012084961, 0.006635189056396484, 0.007523775100708008, 0.008412361145019531, 0.009300947189331055, 0.010189533233642578, 0.011078119277954102, 0.011966705322265625, 0.012855291366577148, 0.013743877410888672, 0.014632463455200195, 0.015521049499511719, 0.016409635543823242, 0.017298221588134766, 0.01818680763244629, 0.019075393676757812, 0.019963979721069336, 0.02085256576538086, 0.021741151809692383, 0.022629737854003906, 0.02351832389831543, 0.024406909942626953, 0.025295495986938477, 0.02618408203125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 12.0, 12.0, 10.0, 10.0, 7.0, 20.0, 16.0, 17.0, 22.0, 29.0, 27.0, 29.0, 29.0, 35.0, 38.0, 45.0, 47.0, 42.0, 37.0, 31.0, 38.0, 44.0, 38.0, 30.0, 40.0, 28.0, 35.0, 34.0, 26.0, 18.0, 25.0, 20.0, 12.0, 18.0, 13.0, 12.0, 12.0, 3.0, 8.0, 5.0, 4.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.02099609375, -0.020388364791870117, -0.019780635833740234, -0.01917290687561035, -0.01856517791748047, -0.017957448959350586, -0.017349720001220703, -0.01674199104309082, -0.016134262084960938, -0.015526533126831055, -0.014918804168701172, -0.014311075210571289, -0.013703346252441406, -0.013095617294311523, -0.01248788833618164, -0.011880159378051758, -0.011272430419921875, -0.010664701461791992, -0.01005697250366211, -0.009449243545532227, -0.008841514587402344, -0.008233785629272461, -0.007626056671142578, -0.007018327713012695, -0.0064105987548828125, -0.00580286979675293, -0.005195140838623047, -0.004587411880493164, -0.003979682922363281, -0.0033719539642333984, -0.0027642250061035156, -0.002156496047973633, -0.00154876708984375, -0.0009410381317138672, -0.0003333091735839844, 0.00027441978454589844, 0.0008821487426757812, 0.001489877700805664, 0.002097606658935547, 0.0027053356170654297, 0.0033130645751953125, 0.003920793533325195, 0.004528522491455078, 0.005136251449584961, 0.005743980407714844, 0.0063517093658447266, 0.006959438323974609, 0.007567167282104492, 0.008174896240234375, 0.008782625198364258, 0.00939035415649414, 0.009998083114624023, 0.010605812072753906, 0.011213541030883789, 0.011821269989013672, 0.012428998947143555, 0.013036727905273438, 0.01364445686340332, 0.014252185821533203, 0.014859914779663086, 0.015467643737792969, 0.01607537269592285, 0.016683101654052734, 0.017290830612182617, 0.0178985595703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 1.0, 7.0, 7.0, 8.0, 8.0, 6.0, 20.0, 20.0, 24.0, 57.0, 99.0, 135.0, 329.0, 930.0, 9798.0, 976438.0, 56504.0, 3079.0, 566.0, 215.0, 98.0, 67.0, 44.0, 25.0, 17.0, 18.0, 5.0, 6.0, 5.0, 1.0, 8.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.1861324310302734e-05, -1.1487863957881927e-05, -1.111440360546112e-05, -1.0740943253040314e-05, -1.0367482900619507e-05, -9.9940225481987e-06, -9.620562195777893e-06, -9.247101843357086e-06, -8.87364149093628e-06, -8.500181138515472e-06, -8.126720786094666e-06, -7.753260433673859e-06, -7.379800081253052e-06, -7.006339728832245e-06, -6.632879376411438e-06, -6.259419023990631e-06, -5.885958671569824e-06, -5.512498319149017e-06, -5.1390379667282104e-06, -4.7655776143074036e-06, -4.392117261886597e-06, -4.01865690946579e-06, -3.645196557044983e-06, -3.271736204624176e-06, -2.898275852203369e-06, -2.5248154997825623e-06, -2.1513551473617554e-06, -1.7778947949409485e-06, -1.4044344425201416e-06, -1.0309740900993347e-06, -6.575137376785278e-07, -2.8405338525772095e-07, 8.940696716308594e-08, 4.628673195838928e-07, 8.363276720046997e-07, 1.2097880244255066e-06, 1.5832483768463135e-06, 1.9567087292671204e-06, 2.3301690816879272e-06, 2.703629434108734e-06, 3.077089786529541e-06, 3.450550138950348e-06, 3.824010491371155e-06, 4.197470843791962e-06, 4.5709311962127686e-06, 4.9443915486335754e-06, 5.317851901054382e-06, 5.691312253475189e-06, 6.064772605895996e-06, 6.438232958316803e-06, 6.81169331073761e-06, 7.185153663158417e-06, 7.558614015579224e-06, 7.93207436800003e-06, 8.305534720420837e-06, 8.678995072841644e-06, 9.052455425262451e-06, 9.425915777683258e-06, 9.799376130104065e-06, 1.0172836482524872e-05, 1.0546296834945679e-05, 1.0919757187366486e-05, 1.1293217539787292e-05, 1.16666778922081e-05, 1.2040138244628906e-05]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 6.0, 8.0, 3.0, 4.0, 3.0, 7.0, 10.0, 19.0, 16.0, 40.0, 42.0, 52.0, 86.0, 80.0, 143.0, 104.0, 102.0, 75.0, 53.0, 37.0, 26.0, 23.0, 20.0, 13.0, 7.0, 5.0, 3.0, 3.0, 3.0, 6.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.331371307373047e-06, -7.101334631443024e-06, -6.8712979555130005e-06, -6.641261279582977e-06, -6.411224603652954e-06, -6.181187927722931e-06, -5.951151251792908e-06, -5.7211145758628845e-06, -5.491077899932861e-06, -5.261041224002838e-06, -5.031004548072815e-06, -4.800967872142792e-06, -4.5709311962127686e-06, -4.340894520282745e-06, -4.110857844352722e-06, -3.880821168422699e-06, -3.6507844924926758e-06, -3.4207478165626526e-06, -3.1907111406326294e-06, -2.960674464702606e-06, -2.730637788772583e-06, -2.50060111284256e-06, -2.2705644369125366e-06, -2.0405277609825134e-06, -1.8104910850524902e-06, -1.580454409122467e-06, -1.3504177331924438e-06, -1.1203810572624207e-06, -8.903443813323975e-07, -6.603077054023743e-07, -4.302710294723511e-07, -2.0023435354232788e-07, 2.9802322387695312e-08, 2.598389983177185e-07, 4.898756742477417e-07, 7.199123501777649e-07, 9.499490261077881e-07, 1.1799857020378113e-06, 1.4100223779678345e-06, 1.6400590538978577e-06, 1.8700957298278809e-06, 2.100132405757904e-06, 2.3301690816879272e-06, 2.5602057576179504e-06, 2.7902424335479736e-06, 3.020279109477997e-06, 3.25031578540802e-06, 3.4803524613380432e-06, 3.7103891372680664e-06, 3.94042581319809e-06, 4.170462489128113e-06, 4.400499165058136e-06, 4.630535840988159e-06, 4.860572516918182e-06, 5.0906091928482056e-06, 5.320645868778229e-06, 5.550682544708252e-06, 5.780719220638275e-06, 6.010755896568298e-06, 6.2407925724983215e-06, 6.470829248428345e-06, 6.700865924358368e-06, 6.930902600288391e-06, 7.160939276218414e-06, 7.3909759521484375e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 7.0, 11.0, 8.0, 11.0, 7.0, 23.0, 40.0, 55.0, 86.0, 191.0, 538.0, 5902.0, 1039334.0, 1630.0, 321.0, 156.0, 92.0, 41.0, 34.0, 17.0, 15.0, 7.0, 4.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4020671844482422e-05, -2.317223697900772e-05, -2.232380211353302e-05, -2.147536724805832e-05, -2.0626932382583618e-05, -1.9778497517108917e-05, -1.8930062651634216e-05, -1.8081627786159515e-05, -1.7233192920684814e-05, -1.6384758055210114e-05, -1.5536323189735413e-05, -1.4687888324260712e-05, -1.383945345878601e-05, -1.299101859331131e-05, -1.2142583727836609e-05, -1.1294148862361908e-05, -1.0445713996887207e-05, -9.597279131412506e-06, -8.748844265937805e-06, -7.900409400463104e-06, -7.051974534988403e-06, -6.203539669513702e-06, -5.3551048040390015e-06, -4.5066699385643005e-06, -3.6582350730895996e-06, -2.8098002076148987e-06, -1.9613653421401978e-06, -1.1129304766654968e-06, -2.644956111907959e-07, 5.83939254283905e-07, 1.432374119758606e-06, 2.280808985233307e-06, 3.129243850708008e-06, 3.977678716182709e-06, 4.82611358165741e-06, 5.674548447132111e-06, 6.5229833126068115e-06, 7.3714181780815125e-06, 8.219853043556213e-06, 9.068287909030914e-06, 9.916722774505615e-06, 1.0765157639980316e-05, 1.1613592505455017e-05, 1.2462027370929718e-05, 1.3310462236404419e-05, 1.415889710187912e-05, 1.500733196735382e-05, 1.5855766832828522e-05, 1.6704201698303223e-05, 1.7552636563777924e-05, 1.8401071429252625e-05, 1.9249506294727325e-05, 2.0097941160202026e-05, 2.0946376025676727e-05, 2.1794810891151428e-05, 2.264324575662613e-05, 2.349168062210083e-05, 2.434011548757553e-05, 2.5188550353050232e-05, 2.6036985218524933e-05, 2.6885420083999634e-05, 2.7733854949474335e-05, 2.8582289814949036e-05, 2.9430724680423737e-05, 3.0279159545898438e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 10.0, 4.0, 6.0, 5.0, 13.0, 17.0, 22.0, 22.0, 39.0, 70.0, 83.0, 414.0, 94.0, 58.0, 44.0, 28.0, 15.0, 17.0, 12.0, 8.0, 6.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6391277313232422e-05, -1.5811994671821594e-05, -1.5232712030410767e-05, -1.4653429388999939e-05, -1.4074146747589111e-05, -1.3494864106178284e-05, -1.2915581464767456e-05, -1.2336298823356628e-05, -1.17570161819458e-05, -1.1177733540534973e-05, -1.0598450899124146e-05, -1.0019168257713318e-05, -9.43988561630249e-06, -8.860602974891663e-06, -8.281320333480835e-06, -7.702037692070007e-06, -7.12275505065918e-06, -6.543472409248352e-06, -5.964189767837524e-06, -5.384907126426697e-06, -4.805624485015869e-06, -4.2263418436050415e-06, -3.647059202194214e-06, -3.0677765607833862e-06, -2.4884939193725586e-06, -1.909211277961731e-06, -1.3299286365509033e-06, -7.506459951400757e-07, -1.7136335372924805e-07, 4.079192876815796e-07, 9.872019290924072e-07, 1.5664845705032349e-06, 2.1457672119140625e-06, 2.72504985332489e-06, 3.3043324947357178e-06, 3.883615136146545e-06, 4.462897777557373e-06, 5.042180418968201e-06, 5.621463060379028e-06, 6.200745701789856e-06, 6.780028343200684e-06, 7.359310984611511e-06, 7.938593626022339e-06, 8.517876267433167e-06, 9.097158908843994e-06, 9.676441550254822e-06, 1.025572419166565e-05, 1.0835006833076477e-05, 1.1414289474487305e-05, 1.1993572115898132e-05, 1.257285475730896e-05, 1.3152137398719788e-05, 1.3731420040130615e-05, 1.4310702681541443e-05, 1.488998532295227e-05, 1.5469267964363098e-05, 1.6048550605773926e-05, 1.6627833247184753e-05, 1.720711588859558e-05, 1.778639853000641e-05, 1.8365681171417236e-05, 1.8944963812828064e-05, 1.952424645423889e-05, 2.010352909564972e-05, 2.0682811737060547e-05]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 82.0, 928.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39565974473953247, -0.3821330964565277, -0.36860647797584534, -0.3550798296928406, -0.3415532112121582, -0.32802656292915344, -0.3144999146461487, -0.3009732961654663, -0.28744664788246155, -0.2739199995994568, -0.2603933811187744, -0.24686673283576965, -0.2333400994539261, -0.21981346607208252, -0.20628683269023895, -0.19276019930839539, -0.17923356592655182, -0.16570693254470825, -0.15218029916286469, -0.13865366578102112, -0.12512701749801636, -0.11160038411617279, -0.09807375073432922, -0.08454710990190506, -0.07102047652006149, -0.05749383941292763, -0.04396720230579376, -0.030440568923950195, -0.01691393181681633, -0.0033872947096824646, 0.010139338672161102, 0.023665979504585266, 0.03719261288642883, 0.0507192499935627, 0.06424588710069656, 0.07777252048254013, 0.0912991613149643, 0.10482579469680786, 0.11835242807865143, 0.131879061460495, 0.14540570974349976, 0.15893234312534332, 0.1724589765071869, 0.18598562479019165, 0.19951225817203522, 0.21303889155387878, 0.22656552493572235, 0.24009215831756592, 0.2536187767982483, 0.26714542508125305, 0.2806720435619354, 0.2941986918449402, 0.30772531032562256, 0.3212519586086273, 0.3347786068916321, 0.34830522537231445, 0.3618318736553192, 0.375358521938324, 0.38888514041900635, 0.4024117887020111, 0.4159384071826935, 0.42946505546569824, 0.4429916739463806, 0.4565183222293854, 0.47004497051239014]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 7.0, 8.0, 7.0, 8.0, 8.0, 16.0, 13.0, 22.0, 16.0, 21.0, 19.0, 34.0, 36.0, 31.0, 40.0, 51.0, 36.0, 45.0, 41.0, 68.0, 49.0, 43.0, 40.0, 40.0, 37.0, 30.0, 23.0, 32.0, 24.0, 29.0, 21.0, 13.0, 12.0, 16.0, 13.0, 4.0, 11.0, 11.0, 3.0, 11.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.09758031368255615, -0.09430770576000214, -0.09103509783744812, -0.0877624899148941, -0.08448988199234009, -0.08121727406978607, -0.07794466614723206, -0.07467205822467804, -0.07139945030212402, -0.06812684237957001, -0.06485423445701599, -0.061581626534461975, -0.05830901861190796, -0.05503641068935394, -0.05176380276679993, -0.04849119484424591, -0.045218586921691895, -0.04194597899913788, -0.03867337107658386, -0.035400763154029846, -0.03212815523147583, -0.028855547308921814, -0.025582939386367798, -0.022310331463813782, -0.019037723541259766, -0.01576511561870575, -0.012492507696151733, -0.009219899773597717, -0.005947291851043701, -0.002674683928489685, 0.0005979239940643311, 0.003870531916618347, 0.007143139839172363, 0.01041574776172638, 0.013688355684280396, 0.01696096360683441, 0.020233571529388428, 0.023506179451942444, 0.02677878737449646, 0.030051395297050476, 0.03332400321960449, 0.03659661114215851, 0.039869219064712524, 0.04314182698726654, 0.04641443490982056, 0.04968704283237457, 0.05295965075492859, 0.056232258677482605, 0.05950486660003662, 0.06277747452259064, 0.06605008244514465, 0.06932269036769867, 0.07259529829025269, 0.0758679062128067, 0.07914051413536072, 0.08241312205791473, 0.08568572998046875, 0.08895833790302277, 0.09223094582557678, 0.0955035537481308, 0.09877616167068481, 0.10204876959323883, 0.10532137751579285, 0.10859398543834686, 0.11186659336090088]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 3.0, 1.0, 12.0, 9.0, 5.0, 4.0, 8.0, 8.0, 6.0, 8.0, 14.0, 11.0, 24.0, 21.0, 22.0, 23.0, 65.0, 225.0, 4192602.0, 610.0, 276.0, 112.0, 35.0, 16.0, 19.0, 22.0, 25.0, 10.0, 5.0, 7.0, 6.0, 10.0, 2.0, 4.0, 2.0, 4.0, 6.0, 2.0, 6.0, 0.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0], "bins": [-0.0014333724975585938, -0.0013922303915023804, -0.001351088285446167, -0.0013099461793899536, -0.0012688040733337402, -0.0012276619672775269, -0.0011865198612213135, -0.0011453777551651, -0.0011042356491088867, -0.0010630935430526733, -0.00102195143699646, -0.0009808093309402466, -0.0009396672248840332, -0.0008985251188278198, -0.0008573830127716064, -0.0008162409067153931, -0.0007750988006591797, -0.0007339566946029663, -0.0006928145885467529, -0.0006516724824905396, -0.0006105303764343262, -0.0005693882703781128, -0.0005282461643218994, -0.00048710405826568604, -0.00044596195220947266, -0.0004048198461532593, -0.0003636777400970459, -0.0003225356340408325, -0.00028139352798461914, -0.00024025142192840576, -0.00019910931587219238, -0.000157967209815979, -0.00011682510375976562, -7.568299770355225e-05, -3.454089164733887e-05, 6.601214408874512e-06, 4.774332046508789e-05, 8.888542652130127e-05, 0.00013002753257751465, 0.00017116963863372803, 0.0002123117446899414, 0.0002534538507461548, 0.00029459595680236816, 0.00033573806285858154, 0.0003768801689147949, 0.0004180222749710083, 0.0004591643810272217, 0.0005003064870834351, 0.0005414485931396484, 0.0005825906991958618, 0.0006237328052520752, 0.0006648749113082886, 0.000706017017364502, 0.0007471591234207153, 0.0007883012294769287, 0.0008294433355331421, 0.0008705854415893555, 0.0009117275476455688, 0.0009528696537017822, 0.0009940117597579956, 0.001035153865814209, 0.0010762959718704224, 0.0011174380779266357, 0.0011585801839828491, 0.0011997222900390625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 13.0, 11.0, 9.0, 9.0, 16.0, 57.0, 136.0, 257.0, 229.0, 109.0, 29.0, 12.0, 9.0, 12.0, 11.0, 7.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 7.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007161378860473633, -0.006906986236572266, -0.0066525936126708984, -0.006398200988769531, -0.006143808364868164, -0.005889415740966797, -0.00563502311706543, -0.0053806304931640625, -0.005126237869262695, -0.004871845245361328, -0.004617452621459961, -0.004363059997558594, -0.0041086673736572266, -0.0038542747497558594, -0.003599882125854492, -0.003345489501953125, -0.003091096878051758, -0.0028367042541503906, -0.0025823116302490234, -0.0023279190063476562, -0.002073526382446289, -0.0018191337585449219, -0.0015647411346435547, -0.0013103485107421875, -0.0010559558868408203, -0.0008015632629394531, -0.0005471706390380859, -0.00029277801513671875, -3.838539123535156e-05, 0.00021600723266601562, 0.0004703998565673828, 0.00072479248046875, 0.0009791851043701172, 0.0012335777282714844, 0.0014879703521728516, 0.0017423629760742188, 0.001996755599975586, 0.002251148223876953, 0.0025055408477783203, 0.0027599334716796875, 0.0030143260955810547, 0.003268718719482422, 0.003523111343383789, 0.0037775039672851562, 0.0040318965911865234, 0.004286289215087891, 0.004540681838989258, 0.004795074462890625, 0.005049467086791992, 0.005303859710693359, 0.0055582523345947266, 0.005812644958496094, 0.006067037582397461, 0.006321430206298828, 0.006575822830200195, 0.0068302154541015625, 0.00708460807800293, 0.007339000701904297, 0.007593393325805664, 0.007847785949707031, 0.008102178573608398, 0.008356571197509766, 0.008610963821411133, 0.0088653564453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 12.0, 35.0, 56.0, 82.0, 77.0, 170.0, 4191054.0, 2308.0, 143.0, 126.0, 103.0, 69.0, 23.0, 13.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004024505615234375, -0.0003880411386489868, -0.00037363171577453613, -0.00035922229290008545, -0.00034481287002563477, -0.0003304034471511841, -0.0003159940242767334, -0.0003015846014022827, -0.00028717517852783203, -0.00027276575565338135, -0.00025835633277893066, -0.00024394690990447998, -0.0002295374870300293, -0.0002151280641555786, -0.00020071864128112793, -0.00018630921840667725, -0.00017189979553222656, -0.00015749037265777588, -0.0001430809497833252, -0.0001286715269088745, -0.00011426210403442383, -9.985268115997314e-05, -8.544325828552246e-05, -7.103383541107178e-05, -5.6624412536621094e-05, -4.221498966217041e-05, -2.7805566787719727e-05, -1.3396143913269043e-05, 1.0132789611816406e-06, 1.5422701835632324e-05, 2.9832124710083008e-05, 4.424154758453369e-05, 5.8650970458984375e-05, 7.306039333343506e-05, 8.746981620788574e-05, 0.00010187923908233643, 0.00011628866195678711, 0.0001306980848312378, 0.00014510750770568848, 0.00015951693058013916, 0.00017392635345458984, 0.00018833577632904053, 0.0002027451992034912, 0.0002171546220779419, 0.00023156404495239258, 0.00024597346782684326, 0.00026038289070129395, 0.00027479231357574463, 0.0002892017364501953, 0.000303611159324646, 0.0003180205821990967, 0.00033243000507354736, 0.00034683942794799805, 0.00036124885082244873, 0.0003756582736968994, 0.0003900676965713501, 0.0004044771194458008, 0.00041888654232025146, 0.00043329596519470215, 0.00044770538806915283, 0.0004621148109436035, 0.0004765242338180542, 0.0004909336566925049, 0.0005053430795669556, 0.0005197525024414062]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4088.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014591217041015625, -0.00014322157949209213, -0.00014053098857402802, -0.0001378403976559639, -0.00013514980673789978, -0.00013245921581983566, -0.00012976862490177155, -0.00012707803398370743, -0.0001243874430656433, -0.00012169685214757919, -0.00011900626122951508, -0.00011631567031145096, -0.00011362507939338684, -0.00011093448847532272, -0.0001082438975572586, -0.00010555330663919449, -0.00010286271572113037, -0.00010017212480306625, -9.748153388500214e-05, -9.479094296693802e-05, -9.21003520488739e-05, -8.940976113080978e-05, -8.671917021274567e-05, -8.402857929468155e-05, -8.133798837661743e-05, -7.864739745855331e-05, -7.59568065404892e-05, -7.326621562242508e-05, -7.057562470436096e-05, -6.788503378629684e-05, -6.519444286823273e-05, -6.250385195016861e-05, -5.981326103210449e-05, -5.7122670114040375e-05, -5.443207919597626e-05, -5.174148827791214e-05, -4.905089735984802e-05, -4.6360306441783905e-05, -4.366971552371979e-05, -4.097912460565567e-05, -3.828853368759155e-05, -3.5597942769527435e-05, -3.290735185146332e-05, -3.02167609333992e-05, -2.7526170015335083e-05, -2.4835579097270966e-05, -2.2144988179206848e-05, -1.945439726114273e-05, -1.6763806343078613e-05, -1.4073215425014496e-05, -1.1382624506950378e-05, -8.692033588886261e-06, -6.0014426708221436e-06, -3.310851752758026e-06, -6.202608346939087e-07, 2.0703300833702087e-06, 4.760921001434326e-06, 7.451511919498444e-06, 1.0142102837562561e-05, 1.2832693755626678e-05, 1.5523284673690796e-05, 1.8213875591754913e-05, 2.090446650981903e-05, 2.3595057427883148e-05, 2.6285648345947266e-05]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 10.0, 864.0, 135.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002853727783076465, -0.0002710241242311895, -0.00025667547015473247, -0.00024232680152636021, -0.00022797813289798796, -0.00021362947882153094, -0.00019928082474507391, -0.0001849321706686169, -0.00017058350204024464, -0.00015623484796378762, -0.00014188617933541536, -0.00012753752525895834, -0.0001131888639065437, -9.884020255412906e-05, -8.449154847767204e-05, -7.01428871252574e-05, -5.5794225772842765e-05, -4.144556442042813e-05, -2.7096906705992296e-05, -1.2748248991556466e-05, 1.6004123608581722e-06, 1.594907371327281e-05, 3.0297727789729834e-05, 4.464638914214447e-05, 5.899505049455911e-05, 7.334371184697375e-05, 8.769237319938838e-05, 0.00010204102727584541, 0.00011638968862826005, 0.00013073834998067468, 0.0001450870040571317, 0.00015943567268550396, 0.00017378432676196098, 0.000188132980838418, 0.00020248164946679026, 0.00021683030354324728, 0.00023117897217161953, 0.00024552762624807656, 0.0002598762803245336, 0.0002742249344009906, 0.0002885736175812781, 0.0003029222716577351, 0.00031727092573419213, 0.00033161957981064916, 0.00034596826299093664, 0.00036031691706739366, 0.0003746655711438507, 0.0003890142252203077, 0.00040336287929676473, 0.00041771153337322176, 0.0004320601874496788, 0.00044640887062996626, 0.0004607575247064233, 0.0004751061787828803, 0.0004894548328593373, 0.0005038034869357944, 0.0005181521410122514, 0.0005325007950887084, 0.0005468494491651654, 0.0005611981032416224, 0.0005755467573180795, 0.0005898954113945365, 0.0006042440654709935, 0.0006185927777551115, 0.0006329414318315685]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 12.0, 25.0, 46.0, 97.0, 140.0, 181.0, 137.0, 177.0, 99.0, 48.0, 14.0, 10.0, 5.0, 4.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00029224157333374023, -0.00028496887534856796, -0.0002776961773633957, -0.0002704234793782234, -0.00026315078139305115, -0.0002558780834078789, -0.0002486053854227066, -0.00024133268743753433, -0.00023405998945236206, -0.0002267872914671898, -0.00021951459348201752, -0.00021224189549684525, -0.00020496919751167297, -0.0001976964995265007, -0.00019042380154132843, -0.00018315110355615616, -0.0001758784055709839, -0.00016860570758581161, -0.00016133300960063934, -0.00015406031161546707, -0.0001467876136302948, -0.00013951491564512253, -0.00013224221765995026, -0.00012496951967477798, -0.00011769682168960571, -0.00011042412370443344, -0.00010315142571926117, -9.58787277340889e-05, -8.860602974891663e-05, -8.133333176374435e-05, -7.406063377857208e-05, -6.678793579339981e-05, -5.951523780822754e-05, -5.224253982305527e-05, -4.4969841837882996e-05, -3.7697143852710724e-05, -3.0424445867538452e-05, -2.315174788236618e-05, -1.587904989719391e-05, -8.606351912021637e-06, -1.3336539268493652e-06, 5.9390440583229065e-06, 1.3211742043495178e-05, 2.048444002866745e-05, 2.775713801383972e-05, 3.5029835999011993e-05, 4.2302533984184265e-05, 4.957523196935654e-05, 5.684792995452881e-05, 6.412062793970108e-05, 7.139332592487335e-05, 7.866602391004562e-05, 8.59387218952179e-05, 9.321141988039017e-05, 0.00010048411786556244, 0.00010775681585073471, 0.00011502951383590698, 0.00012230221182107925, 0.00012957490980625153, 0.0001368476077914238, 0.00014412030577659607, 0.00015139300376176834, 0.0001586657017469406, 0.00016593839973211288, 0.00017321109771728516]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 8.0, 2.0, 8.0, 10.0, 16.0, 17.0, 26.0, 29.0, 35.0, 67.0, 88.0, 111.0, 170.0, 242.0, 373.0, 534.0, 909.0, 1455.0, 2649.0, 5553.0, 15080.0, 153695.0, 833031.0, 20151.0, 6659.0, 3032.0, 1639.0, 976.0, 608.0, 430.0, 258.0, 200.0, 135.0, 84.0, 79.0, 50.0, 30.0, 27.0, 34.0, 12.0, 11.0, 8.0, 8.0, 7.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.020172119140625, -0.01947927474975586, -0.01878643035888672, -0.018093585968017578, -0.017400741577148438, -0.016707897186279297, -0.016015052795410156, -0.015322208404541016, -0.014629364013671875, -0.013936519622802734, -0.013243675231933594, -0.012550830841064453, -0.011857986450195312, -0.011165142059326172, -0.010472297668457031, -0.00977945327758789, -0.00908660888671875, -0.00839376449584961, -0.007700920104980469, -0.007008075714111328, -0.0063152313232421875, -0.005622386932373047, -0.004929542541503906, -0.004236698150634766, -0.003543853759765625, -0.0028510093688964844, -0.0021581649780273438, -0.0014653205871582031, -0.0007724761962890625, -7.963180541992188e-05, 0.0006132125854492188, 0.0013060569763183594, 0.0019989013671875, 0.0026917457580566406, 0.0033845901489257812, 0.004077434539794922, 0.0047702789306640625, 0.005463123321533203, 0.006155967712402344, 0.006848812103271484, 0.007541656494140625, 0.008234500885009766, 0.008927345275878906, 0.009620189666748047, 0.010313034057617188, 0.011005878448486328, 0.011698722839355469, 0.01239156723022461, 0.01308441162109375, 0.01377725601196289, 0.014470100402832031, 0.015162944793701172, 0.015855789184570312, 0.016548633575439453, 0.017241477966308594, 0.017934322357177734, 0.018627166748046875, 0.019320011138916016, 0.020012855529785156, 0.020705699920654297, 0.021398544311523438, 0.022091388702392578, 0.02278423309326172, 0.02347707748413086, 0.024169921875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 13.0, 11.0, 9.0, 9.0, 16.0, 57.0, 136.0, 257.0, 229.0, 109.0, 29.0, 12.0, 9.0, 12.0, 11.0, 7.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 7.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007161378860473633, -0.006906986236572266, -0.0066525936126708984, -0.006398200988769531, -0.006143808364868164, -0.005889415740966797, -0.00563502311706543, -0.0053806304931640625, -0.005126237869262695, -0.004871845245361328, -0.004617452621459961, -0.004363059997558594, -0.0041086673736572266, -0.0038542747497558594, -0.003599882125854492, -0.003345489501953125, -0.003091096878051758, -0.0028367042541503906, -0.0025823116302490234, -0.0023279190063476562, -0.002073526382446289, -0.0018191337585449219, -0.0015647411346435547, -0.0013103485107421875, -0.0010559558868408203, -0.0008015632629394531, -0.0005471706390380859, -0.00029277801513671875, -3.838539123535156e-05, 0.00021600723266601562, 0.0004703998565673828, 0.00072479248046875, 0.0009791851043701172, 0.0012335777282714844, 0.0014879703521728516, 0.0017423629760742188, 0.001996755599975586, 0.002251148223876953, 0.0025055408477783203, 0.0027599334716796875, 0.0030143260955810547, 0.003268718719482422, 0.003523111343383789, 0.0037775039672851562, 0.0040318965911865234, 0.004286289215087891, 0.004540681838989258, 0.004795074462890625, 0.005049467086791992, 0.005303859710693359, 0.0055582523345947266, 0.005812644958496094, 0.006067037582397461, 0.006321430206298828, 0.006575822830200195, 0.0068302154541015625, 0.00708460807800293, 0.007339000701904297, 0.007593393325805664, 0.007847785949707031, 0.008102178573608398, 0.008356571197509766, 0.008610963821411133, 0.0088653564453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 5.0, 9.0, 12.0, 14.0, 17.0, 22.0, 17.0, 19.0, 19.0, 24.0, 27.0, 32.0, 48.0, 77.0, 114.0, 233.0, 436.0, 1037.0, 2405.0, 170034.0, 868522.0, 3086.0, 1038.0, 534.0, 261.0, 149.0, 76.0, 48.0, 35.0, 38.0, 33.0, 15.0, 13.0, 14.0, 10.0, 18.0, 5.0, 8.0, 11.0, 9.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0293121337890625, -0.02836894989013672, -0.027425765991210938, -0.026482582092285156, -0.025539398193359375, -0.024596214294433594, -0.023653030395507812, -0.02270984649658203, -0.02176666259765625, -0.02082347869873047, -0.019880294799804688, -0.018937110900878906, -0.017993927001953125, -0.017050743103027344, -0.016107559204101562, -0.015164375305175781, -0.01422119140625, -0.013278007507324219, -0.012334823608398438, -0.011391639709472656, -0.010448455810546875, -0.009505271911621094, -0.008562088012695312, -0.007618904113769531, -0.00667572021484375, -0.005732536315917969, -0.0047893524169921875, -0.0038461685180664062, -0.002902984619140625, -0.0019598007202148438, -0.0010166168212890625, -7.343292236328125e-05, 0.0008697509765625, 0.0018129348754882812, 0.0027561187744140625, 0.0036993026733398438, 0.004642486572265625, 0.005585670471191406, 0.0065288543701171875, 0.007472038269042969, 0.00841522216796875, 0.009358406066894531, 0.010301589965820312, 0.011244773864746094, 0.012187957763671875, 0.013131141662597656, 0.014074325561523438, 0.015017509460449219, 0.015960693359375, 0.01690387725830078, 0.017847061157226562, 0.018790245056152344, 0.019733428955078125, 0.020676612854003906, 0.021619796752929688, 0.02256298065185547, 0.02350616455078125, 0.02444934844970703, 0.025392532348632812, 0.026335716247558594, 0.027278900146484375, 0.028222084045410156, 0.029165267944335938, 0.03010845184326172, 0.0310516357421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 5.0, 9.0, 12.0, 14.0, 17.0, 22.0, 16.0, 20.0, 17.0, 22.0, 24.0, 25.0, 28.0, 30.0, 29.0, 41.0, 35.0, 42.0, 36.0, 32.0, 47.0, 45.0, 34.0, 36.0, 42.0, 36.0, 32.0, 31.0, 29.0, 31.0, 30.0, 15.0, 13.0, 14.0, 10.0, 19.0, 4.0, 8.0, 11.0, 9.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0174102783203125, -0.016849994659423828, -0.016289710998535156, -0.015729427337646484, -0.015169143676757812, -0.01460886001586914, -0.014048576354980469, -0.013488292694091797, -0.012928009033203125, -0.012367725372314453, -0.011807441711425781, -0.01124715805053711, -0.010686874389648438, -0.010126590728759766, -0.009566307067871094, -0.009006023406982422, -0.00844573974609375, -0.007885456085205078, -0.007325172424316406, -0.006764888763427734, -0.0062046051025390625, -0.005644321441650391, -0.005084037780761719, -0.004523754119873047, -0.003963470458984375, -0.003403186798095703, -0.0028429031372070312, -0.0022826194763183594, -0.0017223358154296875, -0.0011620521545410156, -0.0006017684936523438, -4.1484832763671875e-05, 0.000518798828125, 0.0010790824890136719, 0.0016393661499023438, 0.0021996498107910156, 0.0027599334716796875, 0.0033202171325683594, 0.0038805007934570312, 0.004440784454345703, 0.005001068115234375, 0.005561351776123047, 0.006121635437011719, 0.006681919097900391, 0.0072422027587890625, 0.007802486419677734, 0.008362770080566406, 0.008923053741455078, 0.00948333740234375, 0.010043621063232422, 0.010603904724121094, 0.011164188385009766, 0.011724472045898438, 0.01228475570678711, 0.012845039367675781, 0.013405323028564453, 0.013965606689453125, 0.014525890350341797, 0.015086174011230469, 0.01564645767211914, 0.016206741333007812, 0.016767024993896484, 0.017327308654785156, 0.017887592315673828, 0.0184478759765625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 1.0, 7.0, 5.0, 4.0, 4.0, 7.0, 10.0, 24.0, 35.0, 44.0, 86.0, 196.0, 344.0, 1235.0, 44626.0, 997557.0, 3239.0, 567.0, 241.0, 117.0, 63.0, 38.0, 25.0, 18.0, 11.0, 6.0, 8.0, 3.0, 7.0, 4.0, 4.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4007091522216797e-05, -1.3597309589385986e-05, -1.3187527656555176e-05, -1.2777745723724365e-05, -1.2367963790893555e-05, -1.1958181858062744e-05, -1.1548399925231934e-05, -1.1138617992401123e-05, -1.0728836059570312e-05, -1.0319054126739502e-05, -9.909272193908691e-06, -9.499490261077881e-06, -9.08970832824707e-06, -8.67992639541626e-06, -8.27014446258545e-06, -7.860362529754639e-06, -7.450580596923828e-06, -7.040798664093018e-06, -6.631016731262207e-06, -6.2212347984313965e-06, -5.811452865600586e-06, -5.401670932769775e-06, -4.991888999938965e-06, -4.582107067108154e-06, -4.172325134277344e-06, -3.762543201446533e-06, -3.3527612686157227e-06, -2.942979335784912e-06, -2.5331974029541016e-06, -2.123415470123291e-06, -1.7136335372924805e-06, -1.30385160446167e-06, -8.940696716308594e-07, -4.842877388000488e-07, -7.450580596923828e-08, 3.3527612686157227e-07, 7.450580596923828e-07, 1.1548399925231934e-06, 1.564621925354004e-06, 1.9744038581848145e-06, 2.384185791015625e-06, 2.7939677238464355e-06, 3.203749656677246e-06, 3.6135315895080566e-06, 4.023313522338867e-06, 4.433095455169678e-06, 4.842877388000488e-06, 5.252659320831299e-06, 5.662441253662109e-06, 6.07222318649292e-06, 6.4820051193237305e-06, 6.891787052154541e-06, 7.3015689849853516e-06, 7.711350917816162e-06, 8.121132850646973e-06, 8.530914783477783e-06, 8.940696716308594e-06, 9.350478649139404e-06, 9.760260581970215e-06, 1.0170042514801025e-05, 1.0579824447631836e-05, 1.0989606380462646e-05, 1.1399388313293457e-05, 1.1809170246124268e-05, 1.2218952178955078e-05]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 7.0, 4.0, 3.0, 4.0, 4.0, 7.0, 4.0, 6.0, 5.0, 18.0, 23.0, 29.0, 31.0, 56.0, 64.0, 69.0, 102.0, 146.0, 84.0, 74.0, 75.0, 40.0, 34.0, 30.0, 20.0, 14.0, 10.0, 7.0, 4.0, 5.0, 8.0, 4.0, 4.0, 5.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.165836334228516e-06, -7.927417755126953e-06, -7.68899917602539e-06, -7.450580596923828e-06, -7.212162017822266e-06, -6.973743438720703e-06, -6.735324859619141e-06, -6.496906280517578e-06, -6.258487701416016e-06, -6.020069122314453e-06, -5.781650543212891e-06, -5.543231964111328e-06, -5.304813385009766e-06, -5.066394805908203e-06, -4.827976226806641e-06, -4.589557647705078e-06, -4.351139068603516e-06, -4.112720489501953e-06, -3.874301910400391e-06, -3.635883331298828e-06, -3.3974647521972656e-06, -3.159046173095703e-06, -2.9206275939941406e-06, -2.682209014892578e-06, -2.4437904357910156e-06, -2.205371856689453e-06, -1.9669532775878906e-06, -1.7285346984863281e-06, -1.4901161193847656e-06, -1.2516975402832031e-06, -1.0132789611816406e-06, -7.748603820800781e-07, -5.364418029785156e-07, -2.980232238769531e-07, -5.960464477539063e-08, 1.7881393432617188e-07, 4.172325134277344e-07, 6.556510925292969e-07, 8.940696716308594e-07, 1.1324882507324219e-06, 1.3709068298339844e-06, 1.6093254089355469e-06, 1.8477439880371094e-06, 2.086162567138672e-06, 2.3245811462402344e-06, 2.562999725341797e-06, 2.8014183044433594e-06, 3.039836883544922e-06, 3.2782554626464844e-06, 3.516674041748047e-06, 3.7550926208496094e-06, 3.993511199951172e-06, 4.231929779052734e-06, 4.470348358154297e-06, 4.708766937255859e-06, 4.947185516357422e-06, 5.185604095458984e-06, 5.424022674560547e-06, 5.662441253662109e-06, 5.900859832763672e-06, 6.139278411865234e-06, 6.377696990966797e-06, 6.616115570068359e-06, 6.854534149169922e-06, 7.092952728271484e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 6.0, 4.0, 3.0, 7.0, 5.0, 16.0, 20.0, 41.0, 92.0, 232.0, 632.0, 1028564.0, 18057.0, 510.0, 178.0, 78.0, 36.0, 17.0, 16.0, 7.0, 9.0, 5.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.6133995056152344e-05, -4.497729241847992e-05, -4.3820589780807495e-05, -4.266388714313507e-05, -4.1507184505462646e-05, -4.035048186779022e-05, -3.91937792301178e-05, -3.8037076592445374e-05, -3.688037395477295e-05, -3.5723671317100525e-05, -3.45669686794281e-05, -3.3410266041755676e-05, -3.225356340408325e-05, -3.109686076641083e-05, -2.9940158128738403e-05, -2.878345549106598e-05, -2.7626752853393555e-05, -2.647005021572113e-05, -2.5313347578048706e-05, -2.4156644940376282e-05, -2.2999942302703857e-05, -2.1843239665031433e-05, -2.068653702735901e-05, -1.9529834389686584e-05, -1.837313175201416e-05, -1.7216429114341736e-05, -1.605972647666931e-05, -1.4903023838996887e-05, -1.3746321201324463e-05, -1.2589618563652039e-05, -1.1432915925979614e-05, -1.027621328830719e-05, -9.119510650634766e-06, -7.962808012962341e-06, -6.806105375289917e-06, -5.649402737617493e-06, -4.492700099945068e-06, -3.335997462272644e-06, -2.1792948246002197e-06, -1.0225921869277954e-06, 1.341104507446289e-07, 1.2908130884170532e-06, 2.4475157260894775e-06, 3.604218363761902e-06, 4.760921001434326e-06, 5.9176236391067505e-06, 7.074326276779175e-06, 8.231028914451599e-06, 9.387731552124023e-06, 1.0544434189796448e-05, 1.1701136827468872e-05, 1.2857839465141296e-05, 1.401454210281372e-05, 1.5171244740486145e-05, 1.632794737815857e-05, 1.7484650015830994e-05, 1.8641352653503418e-05, 1.9798055291175842e-05, 2.0954757928848267e-05, 2.211146056652069e-05, 2.3268163204193115e-05, 2.442486584186554e-05, 2.5581568479537964e-05, 2.6738271117210388e-05, 2.7894973754882812e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 6.0, 2.0, 8.0, 10.0, 12.0, 21.0, 36.0, 83.0, 463.0, 146.0, 71.0, 46.0, 17.0, 11.0, 7.0, 13.0, 7.0, 9.0, 3.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7358531951904297e-05, -2.6673078536987305e-05, -2.5987625122070312e-05, -2.530217170715332e-05, -2.4616718292236328e-05, -2.3931264877319336e-05, -2.3245811462402344e-05, -2.256035804748535e-05, -2.187490463256836e-05, -2.1189451217651367e-05, -2.0503997802734375e-05, -1.9818544387817383e-05, -1.913309097290039e-05, -1.84476375579834e-05, -1.7762184143066406e-05, -1.7076730728149414e-05, -1.6391277313232422e-05, -1.570582389831543e-05, -1.5020370483398438e-05, -1.4334917068481445e-05, -1.3649463653564453e-05, -1.2964010238647461e-05, -1.2278556823730469e-05, -1.1593103408813477e-05, -1.0907649993896484e-05, -1.0222196578979492e-05, -9.5367431640625e-06, -8.851289749145508e-06, -8.165836334228516e-06, -7.4803829193115234e-06, -6.794929504394531e-06, -6.109476089477539e-06, -5.424022674560547e-06, -4.738569259643555e-06, -4.0531158447265625e-06, -3.3676624298095703e-06, -2.682209014892578e-06, -1.996755599975586e-06, -1.3113021850585938e-06, -6.258487701416016e-07, 5.960464477539063e-08, 7.450580596923828e-07, 1.430511474609375e-06, 2.115964889526367e-06, 2.8014183044433594e-06, 3.4868717193603516e-06, 4.172325134277344e-06, 4.857778549194336e-06, 5.543231964111328e-06, 6.22868537902832e-06, 6.9141387939453125e-06, 7.599592208862305e-06, 8.285045623779297e-06, 8.970499038696289e-06, 9.655952453613281e-06, 1.0341405868530273e-05, 1.1026859283447266e-05, 1.1712312698364258e-05, 1.239776611328125e-05, 1.3083219528198242e-05, 1.3768672943115234e-05, 1.4454126358032227e-05, 1.5139579772949219e-05, 1.582503318786621e-05, 1.6510486602783203e-05]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 15.0, 833.0, 164.0, 3.0, 2.0, 2.0], "bins": [-0.5653712749481201, -0.5559164881706238, -0.5464617013931274, -0.5370069146156311, -0.5275521278381348, -0.5180974006652832, -0.5086426138877869, -0.49918779730796814, -0.4897330403327942, -0.48027825355529785, -0.4708234667778015, -0.46136870980262756, -0.4519139230251312, -0.4424591362476349, -0.43300434947013855, -0.4235495626926422, -0.4140947759151459, -0.40463998913764954, -0.3951852023601532, -0.38573044538497925, -0.3762756586074829, -0.3668208718299866, -0.35736608505249023, -0.3479112982749939, -0.33845651149749756, -0.3290017247200012, -0.3195469379425049, -0.31009218096733093, -0.3006373941898346, -0.29118260741233826, -0.2817278206348419, -0.2722730338573456, -0.26281827688217163, -0.2533634901046753, -0.24390871822834015, -0.2344539314508438, -0.22499915957450867, -0.21554437279701233, -0.206089586019516, -0.19663479924201965, -0.18718001246452332, -0.17772522568702698, -0.16827045381069183, -0.1588156670331955, -0.14936089515686035, -0.139906108379364, -0.13045132160186768, -0.12099654227495193, -0.11154177039861679, -0.10208699107170105, -0.09263220429420471, -0.08317742496728897, -0.07372264564037323, -0.06426786631345749, -0.05481308326125145, -0.04535830020904541, -0.03590352088212967, -0.02644873969256878, -0.01699395850300789, -0.007539177313446999, 0.0019156038761138916, 0.011370383203029633, 0.020825166255235672, 0.03027994930744171, 0.03973472863435745]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 6.0, 8.0, 9.0, 4.0, 11.0, 12.0, 15.0, 17.0, 21.0, 19.0, 21.0, 29.0, 29.0, 50.0, 43.0, 43.0, 44.0, 47.0, 48.0, 52.0, 58.0, 37.0, 58.0, 39.0, 31.0, 39.0, 28.0, 31.0, 32.0, 20.0, 16.0, 14.0, 9.0, 7.0, 8.0, 13.0, 4.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0904165506362915, -0.08730985969305038, -0.08420316874980927, -0.08109647780656815, -0.07798978686332703, -0.0748831033706665, -0.07177641242742538, -0.06866972148418427, -0.06556303054094315, -0.062456339597702026, -0.05934964865446091, -0.056242961436510086, -0.05313627049326897, -0.05002957955002785, -0.046922892332077026, -0.04381620138883591, -0.04070951044559479, -0.03760281950235367, -0.03449612855911255, -0.03138944134116173, -0.02828275039792061, -0.02517605945467949, -0.02206937037408352, -0.01896268129348755, -0.01585599035024643, -0.012749300338327885, -0.00964261032640934, -0.006535920314490795, -0.0034292303025722504, -0.0003225402906537056, 0.002784149721264839, 0.005890838801860809, 0.008997529745101929, 0.012104219757020473, 0.015210909768939018, 0.01831759884953499, 0.021424289792776108, 0.024530980736017227, 0.027637669816613197, 0.030744358897209167, 0.03385104984045029, 0.036957740783691406, 0.040064431726932526, 0.04317111894488335, 0.046277809888124466, 0.049384500831365585, 0.052491188049316406, 0.055597878992557526, 0.058704569935798645, 0.061811260879039764, 0.06491795182228088, 0.068024642765522, 0.07113133370876312, 0.07423801720142365, 0.07734470814466476, 0.08045139908790588, 0.083558090031147, 0.08666478097438812, 0.08977147191762924, 0.09287816286087036, 0.09598484635353088, 0.099091537296772, 0.10219822824001312, 0.10530491918325424, 0.10841161012649536]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 8.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 8.0, 7.0, 7.0, 14.0, 9.0, 13.0, 26.0, 85.0, 2331.0, 4191427.0, 152.0, 74.0, 19.0, 10.0, 9.0, 12.0, 13.0, 3.0, 4.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0007352828979492188, -0.0007142797112464905, -0.0006932765245437622, -0.0006722733378410339, -0.0006512701511383057, -0.0006302669644355774, -0.0006092637777328491, -0.0005882605910301208, -0.0005672574043273926, -0.0005462542176246643, -0.000525251030921936, -0.0005042478442192078, -0.0004832446575164795, -0.0004622414708137512, -0.00044123828411102295, -0.0004202350974082947, -0.0003992319107055664, -0.00037822872400283813, -0.00035722553730010986, -0.0003362223505973816, -0.0003152191638946533, -0.00029421597719192505, -0.0002732127904891968, -0.0002522096037864685, -0.00023120641708374023, -0.00021020323038101196, -0.0001892000436782837, -0.00016819685697555542, -0.00014719367027282715, -0.00012619048357009888, -0.0001051872968673706, -8.418411016464233e-05, -6.318092346191406e-05, -4.217773675918579e-05, -2.117455005645752e-05, -1.7136335372924805e-07, 2.0831823348999023e-05, 4.1835010051727295e-05, 6.283819675445557e-05, 8.384138345718384e-05, 0.00010484457015991211, 0.00012584775686264038, 0.00014685094356536865, 0.00016785413026809692, 0.0001888573169708252, 0.00020986050367355347, 0.00023086369037628174, 0.00025186687707901, 0.0002728700637817383, 0.00029387325048446655, 0.0003148764371871948, 0.0003358796238899231, 0.00035688281059265137, 0.00037788599729537964, 0.0003988891839981079, 0.0004198923707008362, 0.00044089555740356445, 0.0004618987441062927, 0.000482901930809021, 0.0005039051175117493, 0.0005249083042144775, 0.0005459114909172058, 0.0005669146776199341, 0.0005879178643226624, 0.0006089210510253906]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 12.0, 13.0, 9.0, 9.0, 16.0, 55.0, 129.0, 264.0, 225.0, 113.0, 31.0, 12.0, 9.0, 13.0, 10.0, 7.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007161617279052734, -0.006907463073730469, -0.006653308868408203, -0.0063991546630859375, -0.006145000457763672, -0.005890846252441406, -0.005636692047119141, -0.005382537841796875, -0.005128383636474609, -0.004874229431152344, -0.004620075225830078, -0.0043659210205078125, -0.004111766815185547, -0.0038576126098632812, -0.0036034584045410156, -0.00334930419921875, -0.0030951499938964844, -0.0028409957885742188, -0.002586841583251953, -0.0023326873779296875, -0.002078533172607422, -0.0018243789672851562, -0.0015702247619628906, -0.001316070556640625, -0.0010619163513183594, -0.0008077621459960938, -0.0005536079406738281, -0.0002994537353515625, -4.5299530029296875e-05, 0.00020885467529296875, 0.0004630088806152344, 0.0007171630859375, 0.0009713172912597656, 0.0012254714965820312, 0.0014796257019042969, 0.0017337799072265625, 0.001987934112548828, 0.0022420883178710938, 0.0024962425231933594, 0.002750396728515625, 0.0030045509338378906, 0.0032587051391601562, 0.003512859344482422, 0.0037670135498046875, 0.004021167755126953, 0.004275321960449219, 0.004529476165771484, 0.00478363037109375, 0.005037784576416016, 0.005291938781738281, 0.005546092987060547, 0.0058002471923828125, 0.006054401397705078, 0.006308555603027344, 0.006562709808349609, 0.006816864013671875, 0.007071018218994141, 0.007325172424316406, 0.007579326629638672, 0.007833480834960938, 0.008087635040283203, 0.008341789245605469, 0.008595943450927734, 0.00885009765625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 8.0, 35.0, 45.0, 97.0, 128.0, 126.0, 4193410.0, 134.0, 105.0, 84.0, 53.0, 31.0, 18.0, 7.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008306503295898438, -0.0008111335337162018, -0.0007916167378425598, -0.0007720999419689178, -0.0007525831460952759, -0.0007330663502216339, -0.0007135495543479919, -0.00069403275847435, -0.000674515962600708, -0.000654999166727066, -0.0006354823708534241, -0.0006159655749797821, -0.0005964487791061401, -0.0005769319832324982, -0.0005574151873588562, -0.0005378983914852142, -0.0005183815956115723, -0.0004988647997379303, -0.00047934800386428833, -0.00045983120799064636, -0.0004403144121170044, -0.0004207976162433624, -0.00040128082036972046, -0.0003817640244960785, -0.0003622472286224365, -0.00034273043274879456, -0.0003232136368751526, -0.0003036968410015106, -0.00028418004512786865, -0.0002646632492542267, -0.0002451464533805847, -0.00022562965750694275, -0.00020611286163330078, -0.0001865960657596588, -0.00016707926988601685, -0.00014756247401237488, -0.0001280456781387329, -0.00010852888226509094, -8.901208639144897e-05, -6.949529051780701e-05, -4.997849464416504e-05, -3.046169877052307e-05, -1.0944902896881104e-05, 8.571892976760864e-06, 2.8088688850402832e-05, 4.76054847240448e-05, 6.712228059768677e-05, 8.663907647132874e-05, 0.0001061558723449707, 0.00012567266821861267, 0.00014518946409225464, 0.0001647062599658966, 0.00018422305583953857, 0.00020373985171318054, 0.0002232566475868225, 0.00024277344346046448, 0.00026229023933410645, 0.0002818070352077484, 0.0003013238310813904, 0.00032084062695503235, 0.0003403574228286743, 0.0003598742187023163, 0.00037939101457595825, 0.0003989078104496002, 0.0004184246063232422]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4093.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.854534149169922e-06, -3.998167812824249e-06, -1.1418014764785767e-06, 1.714564859867096e-06, 4.5709311962127686e-06, 7.427297532558441e-06, 1.0283663868904114e-05, 1.3140030205249786e-05, 1.599639654159546e-05, 1.885276287794113e-05, 2.1709129214286804e-05, 2.4565495550632477e-05, 2.742186188697815e-05, 3.0278228223323822e-05, 3.3134594559669495e-05, 3.599096089601517e-05, 3.884732723236084e-05, 4.170369356870651e-05, 4.4560059905052185e-05, 4.741642624139786e-05, 5.027279257774353e-05, 5.31291589140892e-05, 5.5985525250434875e-05, 5.884189158678055e-05, 6.169825792312622e-05, 6.45546242594719e-05, 6.741099059581757e-05, 7.026735693216324e-05, 7.312372326850891e-05, 7.598008960485458e-05, 7.883645594120026e-05, 8.169282227754593e-05, 8.45491886138916e-05, 8.740555495023727e-05, 9.026192128658295e-05, 9.311828762292862e-05, 9.597465395927429e-05, 9.883102029561996e-05, 0.00010168738663196564, 0.00010454375296831131, 0.00010740011930465698, 0.00011025648564100266, 0.00011311285197734833, 0.000115969218313694, 0.00011882558465003967, 0.00012168195098638535, 0.00012453831732273102, 0.0001273946836590767, 0.00013025104999542236, 0.00013310741633176804, 0.0001359637826681137, 0.00013882014900445938, 0.00014167651534080505, 0.00014453288167715073, 0.0001473892480134964, 0.00015024561434984207, 0.00015310198068618774, 0.00015595834702253342, 0.0001588147133588791, 0.00016167107969522476, 0.00016452744603157043, 0.0001673838123679161, 0.00017024017870426178, 0.00017309654504060745, 0.00017595291137695312]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 980.0, 26.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007240754785016179, -0.0007026340463198721, -0.0006811925559304655, -0.0006597511237487197, -0.000638309633359313, -0.0006168682011775672, -0.0005954267689958215, -0.0005739852786064148, -0.000552543846424669, -0.0005311024142429233, -0.0005096609238535166, -0.0004882194916717708, -0.0004667780303861946, -0.00044533656910061836, -0.0004238951369188726, -0.00040245367563329637, -0.00038101221434772015, -0.0003595707530621439, -0.0003381292917765677, -0.00031668785959482193, -0.0002952463983092457, -0.0002738049370236695, -0.0002523635048419237, -0.0002309220435563475, -0.00020948058227077127, -0.00018803912098519504, -0.00016659767425153404, -0.00014515622751787305, -0.00012371476623229682, -0.00010227331222267821, -8.08318582130596e-05, -5.939041147939861e-05, -3.7948950193822384e-05, -1.6507496184203774e-05, 4.933957825414836e-06, 2.6375411835033447e-05, 4.781686584465206e-05, 6.925831985427067e-05, 9.069977386388928e-05, 0.00011214122059755027, 0.0001335826818831265, 0.00015502414316870272, 0.00017646558990236372, 0.0001979070366360247, 0.00021934849792160094, 0.00024078995920717716, 0.00026223139138892293, 0.00028367285267449915, 0.0003051143139600754, 0.0003265557752456516, 0.0003479972365312278, 0.0003694386687129736, 0.0003908801299985498, 0.00041232159128412604, 0.0004337630234658718, 0.00045520448475144804, 0.00047664594603702426, 0.00049808737821877, 0.0005195288686081767, 0.0005409703007899225, 0.0005624117329716682, 0.0005838532233610749, 0.0006052946555428207, 0.0006267360877245665, 0.0006481775781139731]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 10.0, 2.0, 14.0, 27.0, 84.0, 106.0, 222.0, 159.0, 192.0, 91.0, 64.0, 13.0, 7.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014632940292358398, -0.00013832375407218933, -0.00013031810522079468, -0.00012231245636940002, -0.00011430680751800537, -0.00010630115866661072, -9.829550981521606e-05, -9.028986096382141e-05, -8.228421211242676e-05, -7.42785632610321e-05, -6.627291440963745e-05, -5.82672655582428e-05, -5.0261616706848145e-05, -4.225596785545349e-05, -3.425031900405884e-05, -2.6244670152664185e-05, -1.823902130126953e-05, -1.0233372449874878e-05, -2.2277235984802246e-06, 5.777925252914429e-06, 1.3783574104309082e-05, 2.1789222955703735e-05, 2.979487180709839e-05, 3.780052065849304e-05, 4.5806169509887695e-05, 5.381181836128235e-05, 6.1817467212677e-05, 6.982311606407166e-05, 7.782876491546631e-05, 8.583441376686096e-05, 9.384006261825562e-05, 0.00010184571146965027, 0.00010985136032104492, 0.00011785700917243958, 0.00012586265802383423, 0.00013386830687522888, 0.00014187395572662354, 0.0001498796045780182, 0.00015788525342941284, 0.0001658909022808075, 0.00017389655113220215, 0.0001819021999835968, 0.00018990784883499146, 0.0001979134976863861, 0.00020591914653778076, 0.00021392479538917542, 0.00022193044424057007, 0.00022993609309196472, 0.00023794174194335938, 0.00024594739079475403, 0.0002539530396461487, 0.00026195868849754333, 0.000269964337348938, 0.00027796998620033264, 0.0002859756350517273, 0.00029398128390312195, 0.0003019869327545166, 0.00030999258160591125, 0.0003179982304573059, 0.00032600387930870056, 0.0003340095281600952, 0.00034201517701148987, 0.0003500208258628845, 0.0003580264747142792, 0.00036603212356567383]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 3.0, 7.0, 10.0, 4.0, 8.0, 9.0, 14.0, 10.0, 19.0, 35.0, 63.0, 108.0, 239.0, 488.0, 1033.0, 2908.0, 12267.0, 890052.0, 128634.0, 8578.0, 2330.0, 852.0, 402.0, 190.0, 99.0, 58.0, 26.0, 22.0, 14.0, 13.0, 10.0, 7.0, 5.0, 6.0, 6.0, 4.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.03643798828125, -0.03539395332336426, -0.034349918365478516, -0.03330588340759277, -0.03226184844970703, -0.03121781349182129, -0.030173778533935547, -0.029129743576049805, -0.028085708618164062, -0.02704167366027832, -0.025997638702392578, -0.024953603744506836, -0.023909568786621094, -0.02286553382873535, -0.02182149887084961, -0.020777463912963867, -0.019733428955078125, -0.018689393997192383, -0.01764535903930664, -0.0166013240814209, -0.015557289123535156, -0.014513254165649414, -0.013469219207763672, -0.01242518424987793, -0.011381149291992188, -0.010337114334106445, -0.009293079376220703, -0.008249044418334961, -0.007205009460449219, -0.0061609745025634766, -0.005116939544677734, -0.004072904586791992, -0.00302886962890625, -0.001984834671020508, -0.0009407997131347656, 0.00010323524475097656, 0.0011472702026367188, 0.002191305160522461, 0.003235340118408203, 0.004279375076293945, 0.0053234100341796875, 0.00636744499206543, 0.007411479949951172, 0.008455514907836914, 0.009499549865722656, 0.010543584823608398, 0.01158761978149414, 0.012631654739379883, 0.013675689697265625, 0.014719724655151367, 0.01576375961303711, 0.01680779457092285, 0.017851829528808594, 0.018895864486694336, 0.019939899444580078, 0.02098393440246582, 0.022027969360351562, 0.023072004318237305, 0.024116039276123047, 0.02516007423400879, 0.02620410919189453, 0.027248144149780273, 0.028292179107666016, 0.029336214065551758, 0.0303802490234375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 12.0, 13.0, 9.0, 9.0, 16.0, 55.0, 129.0, 264.0, 225.0, 113.0, 31.0, 12.0, 9.0, 13.0, 10.0, 7.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007161617279052734, -0.006907463073730469, -0.006653308868408203, -0.0063991546630859375, -0.006145000457763672, -0.005890846252441406, -0.005636692047119141, -0.005382537841796875, -0.005128383636474609, -0.004874229431152344, -0.004620075225830078, -0.0043659210205078125, -0.004111766815185547, -0.0038576126098632812, -0.0036034584045410156, -0.00334930419921875, -0.0030951499938964844, -0.0028409957885742188, -0.002586841583251953, -0.0023326873779296875, -0.002078533172607422, -0.0018243789672851562, -0.0015702247619628906, -0.001316070556640625, -0.0010619163513183594, -0.0008077621459960938, -0.0005536079406738281, -0.0002994537353515625, -4.5299530029296875e-05, 0.00020885467529296875, 0.0004630088806152344, 0.0007171630859375, 0.0009713172912597656, 0.0012254714965820312, 0.0014796257019042969, 0.0017337799072265625, 0.001987934112548828, 0.0022420883178710938, 0.0024962425231933594, 0.002750396728515625, 0.0030045509338378906, 0.0032587051391601562, 0.003512859344482422, 0.0037670135498046875, 0.004021167755126953, 0.004275321960449219, 0.004529476165771484, 0.00478363037109375, 0.005037784576416016, 0.005291938781738281, 0.005546092987060547, 0.0058002471923828125, 0.006054401397705078, 0.006308555603027344, 0.006562709808349609, 0.006816864013671875, 0.007071018218994141, 0.007325172424316406, 0.007579326629638672, 0.007833480834960938, 0.008087635040283203, 0.008341789245605469, 0.008595943450927734, 0.00885009765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 2.0, 6.0, 3.0, 6.0, 10.0, 7.0, 8.0, 12.0, 14.0, 26.0, 17.0, 28.0, 23.0, 34.0, 34.0, 56.0, 92.0, 180.0, 391.0, 876.0, 3224.0, 964860.0, 75165.0, 1939.0, 724.0, 286.0, 142.0, 70.0, 52.0, 33.0, 37.0, 24.0, 18.0, 23.0, 15.0, 24.0, 14.0, 14.0, 16.0, 9.0, 5.0, 6.0, 4.0, 6.0, 3.0, 4.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0262908935546875, -0.025438547134399414, -0.024586200714111328, -0.023733854293823242, -0.022881507873535156, -0.02202916145324707, -0.021176815032958984, -0.0203244686126709, -0.019472122192382812, -0.018619775772094727, -0.01776742935180664, -0.016915082931518555, -0.01606273651123047, -0.015210390090942383, -0.014358043670654297, -0.013505697250366211, -0.012653350830078125, -0.011801004409790039, -0.010948657989501953, -0.010096311569213867, -0.009243965148925781, -0.008391618728637695, -0.007539272308349609, -0.0066869258880615234, -0.0058345794677734375, -0.0049822330474853516, -0.004129886627197266, -0.0032775402069091797, -0.0024251937866210938, -0.0015728473663330078, -0.0007205009460449219, 0.00013184547424316406, 0.00098419189453125, 0.001836538314819336, 0.002688884735107422, 0.003541231155395508, 0.004393577575683594, 0.00524592399597168, 0.006098270416259766, 0.0069506168365478516, 0.0078029632568359375, 0.008655309677124023, 0.00950765609741211, 0.010360002517700195, 0.011212348937988281, 0.012064695358276367, 0.012917041778564453, 0.013769388198852539, 0.014621734619140625, 0.015474081039428711, 0.016326427459716797, 0.017178773880004883, 0.01803112030029297, 0.018883466720581055, 0.01973581314086914, 0.020588159561157227, 0.021440505981445312, 0.0222928524017334, 0.023145198822021484, 0.02399754524230957, 0.024849891662597656, 0.025702238082885742, 0.026554584503173828, 0.027406930923461914, 0.02825927734375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 2.0, 6.0, 3.0, 6.0, 10.0, 7.0, 9.0, 12.0, 15.0, 25.0, 16.0, 28.0, 23.0, 31.0, 29.0, 31.0, 36.0, 40.0, 36.0, 36.0, 46.0, 42.0, 42.0, 31.0, 42.0, 29.0, 38.0, 30.0, 38.0, 30.0, 36.0, 25.0, 17.0, 24.0, 14.0, 25.0, 14.0, 16.0, 13.0, 9.0, 5.0, 6.0, 4.0, 6.0, 3.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.016326904296875, -0.015796899795532227, -0.015266895294189453, -0.01473689079284668, -0.014206886291503906, -0.013676881790161133, -0.01314687728881836, -0.012616872787475586, -0.012086868286132812, -0.011556863784790039, -0.011026859283447266, -0.010496854782104492, -0.009966850280761719, -0.009436845779418945, -0.008906841278076172, -0.008376836776733398, -0.007846832275390625, -0.0073168277740478516, -0.006786823272705078, -0.006256818771362305, -0.005726814270019531, -0.005196809768676758, -0.004666805267333984, -0.004136800765991211, -0.0036067962646484375, -0.003076791763305664, -0.0025467872619628906, -0.002016782760620117, -0.0014867782592773438, -0.0009567737579345703, -0.0004267692565917969, 0.00010323524475097656, 0.00063323974609375, 0.0011632442474365234, 0.0016932487487792969, 0.0022232532501220703, 0.0027532577514648438, 0.003283262252807617, 0.0038132667541503906, 0.004343271255493164, 0.0048732757568359375, 0.005403280258178711, 0.005933284759521484, 0.006463289260864258, 0.006993293762207031, 0.007523298263549805, 0.008053302764892578, 0.008583307266235352, 0.009113311767578125, 0.009643316268920898, 0.010173320770263672, 0.010703325271606445, 0.011233329772949219, 0.011763334274291992, 0.012293338775634766, 0.012823343276977539, 0.013353347778320312, 0.013883352279663086, 0.01441335678100586, 0.014943361282348633, 0.015473365783691406, 0.01600337028503418, 0.016533374786376953, 0.017063379287719727, 0.0175933837890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 8.0, 17.0, 9.0, 15.0, 18.0, 23.0, 20.0, 25.0, 32.0, 72.0, 93.0, 250.0, 414.0, 1661.0, 6416.0, 899259.0, 131110.0, 7112.0, 1013.0, 472.0, 150.0, 115.0, 45.0, 37.0, 19.0, 34.0, 16.0, 20.0, 17.0, 14.0, 6.0, 9.0, 3.0, 7.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.602836608886719e-06, -5.3942203521728516e-06, -5.185604095458984e-06, -4.976987838745117e-06, -4.76837158203125e-06, -4.559755325317383e-06, -4.351139068603516e-06, -4.1425228118896484e-06, -3.933906555175781e-06, -3.725290298461914e-06, -3.516674041748047e-06, -3.3080577850341797e-06, -3.0994415283203125e-06, -2.8908252716064453e-06, -2.682209014892578e-06, -2.473592758178711e-06, -2.2649765014648438e-06, -2.0563602447509766e-06, -1.8477439880371094e-06, -1.6391277313232422e-06, -1.430511474609375e-06, -1.2218952178955078e-06, -1.0132789611816406e-06, -8.046627044677734e-07, -5.960464477539062e-07, -3.8743019104003906e-07, -1.7881393432617188e-07, 2.9802322387695312e-08, 2.384185791015625e-07, 4.470348358154297e-07, 6.556510925292969e-07, 8.642673492431641e-07, 1.0728836059570312e-06, 1.2814998626708984e-06, 1.4901161193847656e-06, 1.6987323760986328e-06, 1.9073486328125e-06, 2.115964889526367e-06, 2.3245811462402344e-06, 2.5331974029541016e-06, 2.7418136596679688e-06, 2.950429916381836e-06, 3.159046173095703e-06, 3.3676624298095703e-06, 3.5762786865234375e-06, 3.7848949432373047e-06, 3.993511199951172e-06, 4.202127456665039e-06, 4.410743713378906e-06, 4.6193599700927734e-06, 4.827976226806641e-06, 5.036592483520508e-06, 5.245208740234375e-06, 5.453824996948242e-06, 5.662441253662109e-06, 5.8710575103759766e-06, 6.079673767089844e-06, 6.288290023803711e-06, 6.496906280517578e-06, 6.705522537231445e-06, 6.9141387939453125e-06, 7.12275505065918e-06, 7.331371307373047e-06, 7.539987564086914e-06, 7.748603820800781e-06]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 8.0, 5.0, 12.0, 10.0, 10.0, 10.0, 22.0, 9.0, 10.0, 17.0, 20.0, 43.0, 30.0, 50.0, 61.0, 53.0, 50.0, 113.0, 69.0, 59.0, 54.0, 43.0, 41.0, 27.0, 24.0, 15.0, 24.0, 11.0, 16.0, 15.0, 14.0, 9.0, 15.0, 8.0, 5.0, 1.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.3974647521972656e-06, -3.275461494922638e-06, -3.1534582376480103e-06, -3.0314549803733826e-06, -2.909451723098755e-06, -2.787448465824127e-06, -2.6654452085494995e-06, -2.543441951274872e-06, -2.421438694000244e-06, -2.2994354367256165e-06, -2.1774321794509888e-06, -2.055428922176361e-06, -1.9334256649017334e-06, -1.8114224076271057e-06, -1.689419150352478e-06, -1.5674158930778503e-06, -1.4454126358032227e-06, -1.323409378528595e-06, -1.2014061212539673e-06, -1.0794028639793396e-06, -9.57399606704712e-07, -8.353963494300842e-07, -7.133930921554565e-07, -5.913898348808289e-07, -4.6938657760620117e-07, -3.473833203315735e-07, -2.253800630569458e-07, -1.0337680578231812e-07, 1.862645149230957e-08, 1.4062970876693726e-07, 2.6263296604156494e-07, 3.8463622331619263e-07, 5.066394805908203e-07, 6.28642737865448e-07, 7.506459951400757e-07, 8.726492524147034e-07, 9.94652509689331e-07, 1.1166557669639587e-06, 1.2386590242385864e-06, 1.3606622815132141e-06, 1.4826655387878418e-06, 1.6046687960624695e-06, 1.7266720533370972e-06, 1.8486753106117249e-06, 1.9706785678863525e-06, 2.0926818251609802e-06, 2.214685082435608e-06, 2.3366883397102356e-06, 2.4586915969848633e-06, 2.580694854259491e-06, 2.7026981115341187e-06, 2.8247013688087463e-06, 2.946704626083374e-06, 3.0687078833580017e-06, 3.1907111406326294e-06, 3.312714397907257e-06, 3.4347176551818848e-06, 3.5567209124565125e-06, 3.67872416973114e-06, 3.800727427005768e-06, 3.9227306842803955e-06, 4.044733941555023e-06, 4.166737198829651e-06, 4.2887404561042786e-06, 4.410743713378906e-06]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 7.0, 10.0, 13.0, 21.0, 28.0, 76.0, 225.0, 1763.0, 1044655.0, 1365.0, 213.0, 77.0, 36.0, 16.0, 7.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.504753112792969e-05, -3.418140113353729e-05, -3.33152711391449e-05, -3.24491411447525e-05, -3.158301115036011e-05, -3.071688115596771e-05, -2.9850751161575317e-05, -2.8984621167182922e-05, -2.8118491172790527e-05, -2.7252361178398132e-05, -2.6386231184005737e-05, -2.5520101189613342e-05, -2.4653971195220947e-05, -2.3787841200828552e-05, -2.2921711206436157e-05, -2.2055581212043762e-05, -2.1189451217651367e-05, -2.0323321223258972e-05, -1.9457191228866577e-05, -1.8591061234474182e-05, -1.7724931240081787e-05, -1.6858801245689392e-05, -1.5992671251296997e-05, -1.5126541256904602e-05, -1.4260411262512207e-05, -1.3394281268119812e-05, -1.2528151273727417e-05, -1.1662021279335022e-05, -1.0795891284942627e-05, -9.929761290550232e-06, -9.063631296157837e-06, -8.197501301765442e-06, -7.331371307373047e-06, -6.465241312980652e-06, -5.599111318588257e-06, -4.732981324195862e-06, -3.866851329803467e-06, -3.0007213354110718e-06, -2.1345913410186768e-06, -1.2684613466262817e-06, -4.023313522338867e-07, 4.637986421585083e-07, 1.3299286365509033e-06, 2.1960586309432983e-06, 3.0621886253356934e-06, 3.928318619728088e-06, 4.794448614120483e-06, 5.660578608512878e-06, 6.5267086029052734e-06, 7.3928385972976685e-06, 8.258968591690063e-06, 9.125098586082458e-06, 9.991228580474854e-06, 1.0857358574867249e-05, 1.1723488569259644e-05, 1.2589618563652039e-05, 1.3455748558044434e-05, 1.4321878552436829e-05, 1.5188008546829224e-05, 1.605413854122162e-05, 1.6920268535614014e-05, 1.778639853000641e-05, 1.8652528524398804e-05, 1.95186585187912e-05, 2.0384788513183594e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 6.0, 5.0, 6.0, 6.0, 7.0, 7.0, 11.0, 20.0, 20.0, 23.0, 58.0, 84.0, 523.0, 93.0, 52.0, 27.0, 19.0, 14.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1696090698242188e-05, -2.1158717572689056e-05, -2.0621344447135925e-05, -2.0083971321582794e-05, -1.9546598196029663e-05, -1.9009225070476532e-05, -1.84718519449234e-05, -1.793447881937027e-05, -1.739710569381714e-05, -1.6859732568264008e-05, -1.6322359442710876e-05, -1.5784986317157745e-05, -1.5247613191604614e-05, -1.4710240066051483e-05, -1.4172866940498352e-05, -1.3635493814945221e-05, -1.309812068939209e-05, -1.2560747563838959e-05, -1.2023374438285828e-05, -1.1486001312732697e-05, -1.0948628187179565e-05, -1.0411255061626434e-05, -9.873881936073303e-06, -9.336508810520172e-06, -8.799135684967041e-06, -8.26176255941391e-06, -7.724389433860779e-06, -7.187016308307648e-06, -6.649643182754517e-06, -6.1122700572013855e-06, -5.574896931648254e-06, -5.037523806095123e-06, -4.500150680541992e-06, -3.962777554988861e-06, -3.42540442943573e-06, -2.888031303882599e-06, -2.3506581783294678e-06, -1.8132850527763367e-06, -1.2759119272232056e-06, -7.385388016700745e-07, -2.0116567611694336e-07, 3.3620744943618774e-07, 8.735805749893188e-07, 1.41095370054245e-06, 1.948326826095581e-06, 2.485699951648712e-06, 3.0230730772018433e-06, 3.5604462027549744e-06, 4.0978193283081055e-06, 4.6351924538612366e-06, 5.172565579414368e-06, 5.709938704967499e-06, 6.24731183052063e-06, 6.784684956073761e-06, 7.322058081626892e-06, 7.859431207180023e-06, 8.396804332733154e-06, 8.934177458286285e-06, 9.471550583839417e-06, 1.0008923709392548e-05, 1.0546296834945679e-05, 1.108366996049881e-05, 1.1621043086051941e-05, 1.2158416211605072e-05, 1.2695789337158203e-05]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 14.0, 83.0, 830.0, 83.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06314918398857117, -0.057644203305244446, -0.052139222621917725, -0.046634241938591, -0.04112926125526428, -0.03562428057193756, -0.03011929616332054, -0.02461431547999382, -0.0191093347966671, -0.013604354113340378, -0.008099372498691082, -0.002594390884041786, 0.002910589799284935, 0.008415570482611656, 0.013920553028583527, 0.019425533711910248, 0.02493051439523697, 0.03043549507856369, 0.03594047576189041, 0.04144545644521713, 0.046950437128543854, 0.052455417811870575, 0.057960402220487595, 0.06346538662910461, 0.06897036731243134, 0.07447534799575806, 0.07998032867908478, 0.0854853093624115, 0.09099029004573822, 0.09649527072906494, 0.10200025141239166, 0.10750523209571838, 0.1130102127790451, 0.11851519346237183, 0.12402017414569855, 0.12952515482902527, 0.135030135512352, 0.1405351161956787, 0.14604009687900543, 0.15154507756233215, 0.15705005824565887, 0.1625550389289856, 0.16806001961231232, 0.17356500029563904, 0.17906998097896576, 0.18457496166229248, 0.1900799423456192, 0.19558492302894592, 0.20108991861343384, 0.20659489929676056, 0.21209987998008728, 0.217604860663414, 0.22310984134674072, 0.22861482203006744, 0.23411980271339417, 0.2396247833967209, 0.2451297640800476, 0.2506347596645355, 0.25613972544670105, 0.26164472103118896, 0.2671496868133545, 0.2726546823978424, 0.27815964818000793, 0.28366464376449585, 0.2891696095466614]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 3.0, 8.0, 13.0, 12.0, 8.0, 26.0, 27.0, 15.0, 29.0, 29.0, 38.0, 47.0, 56.0, 59.0, 69.0, 65.0, 61.0, 62.0, 51.0, 49.0, 52.0, 33.0, 32.0, 26.0, 23.0, 24.0, 10.0, 15.0, 17.0, 7.0, 11.0, 4.0, 10.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10185462236404419, -0.09835190325975418, -0.09484918415546417, -0.09134646505117416, -0.08784374594688416, -0.08434103429317474, -0.08083831518888474, -0.07733559608459473, -0.07383287698030472, -0.07033015787601471, -0.0668274387717247, -0.06332471966743469, -0.05982200428843498, -0.056319285184144974, -0.052816569805145264, -0.049313850700855255, -0.04581113159656525, -0.04230841249227524, -0.03880569338798523, -0.03530297800898552, -0.03180025890469551, -0.028297539800405502, -0.024794822558760643, -0.021292105317115784, -0.017789386212825775, -0.014286668039858341, -0.010783949866890907, -0.007281231693923473, -0.0037785135209560394, -0.0002757944166660309, 0.0032269228249788284, 0.006729640066623688, 0.010232359170913696, 0.01373507734388113, 0.017237795516848564, 0.020740512758493423, 0.024243231862783432, 0.02774595096707344, 0.0312486682087183, 0.03475138545036316, 0.03825410455465317, 0.041756823658943176, 0.045259542763233185, 0.048762258142232895, 0.0522649772465229, 0.05576769635081291, 0.05927041172981262, 0.06277313083410263, 0.06627584993839264, 0.06977856904268265, 0.07328128814697266, 0.07678400725126266, 0.08028672635555267, 0.08378943800926208, 0.0872921571135521, 0.0907948762178421, 0.09429759532213211, 0.09780031442642212, 0.10130303353071213, 0.10480575263500214, 0.10830846428871155, 0.11181119084358215, 0.11531390249729156, 0.11881662160158157, 0.12231934070587158]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 7.0, 5.0, 1.0, 4.0, 2.0, 9.0, 9.0, 12.0, 10.0, 7.0, 15.0, 24.0, 18.0, 11.0, 15.0, 17.0, 19.0, 20.0, 37.0, 38.0, 51.0, 71.0, 100.0, 118.0, 228.0, 767.0, 4187432.0, 3638.0, 793.0, 286.0, 116.0, 67.0, 52.0, 71.0, 39.0, 20.0, 20.0, 18.0, 22.0, 12.0, 7.0, 5.0, 9.0, 6.0, 11.0, 8.0, 8.0, 11.0, 4.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 5.0], "bins": [-0.0014867782592773438, -0.001444116234779358, -0.001401454210281372, -0.0013587921857833862, -0.0013161301612854004, -0.0012734681367874146, -0.0012308061122894287, -0.0011881440877914429, -0.001145482063293457, -0.0011028200387954712, -0.0010601580142974854, -0.0010174959897994995, -0.0009748339653015137, -0.0009321719408035278, -0.000889509916305542, -0.0008468478918075562, -0.0008041858673095703, -0.0007615238428115845, -0.0007188618183135986, -0.0006761997938156128, -0.000633537769317627, -0.0005908757448196411, -0.0005482137203216553, -0.0005055516958236694, -0.0004628896713256836, -0.00042022764682769775, -0.0003775656223297119, -0.0003349035978317261, -0.00029224157333374023, -0.0002495795488357544, -0.00020691752433776855, -0.00016425549983978271, -0.00012159347534179688, -7.893145084381104e-05, -3.6269426345825195e-05, 6.3925981521606445e-06, 4.9054622650146484e-05, 9.171664714813232e-05, 0.00013437867164611816, 0.000177040696144104, 0.00021970272064208984, 0.0002623647451400757, 0.0003050267696380615, 0.00034768879413604736, 0.0003903508186340332, 0.00043301284313201904, 0.0004756748676300049, 0.0005183368921279907, 0.0005609989166259766, 0.0006036609411239624, 0.0006463229656219482, 0.0006889849901199341, 0.0007316470146179199, 0.0007743090391159058, 0.0008169710636138916, 0.0008596330881118774, 0.0009022951126098633, 0.0009449571371078491, 0.000987619161605835, 0.0010302811861038208, 0.0010729432106018066, 0.0011156052350997925, 0.0011582672595977783, 0.0012009292840957642, 0.00124359130859375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 4.0, 9.0, 16.0, 8.0, 9.0, 16.0, 45.0, 123.0, 269.0, 220.0, 118.0, 42.0, 12.0, 10.0, 11.0, 11.0, 8.0, 7.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 7.0, 5.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007162570953369141, -0.006909370422363281, -0.006656169891357422, -0.0064029693603515625, -0.006149768829345703, -0.005896568298339844, -0.005643367767333984, -0.005390167236328125, -0.005136966705322266, -0.004883766174316406, -0.004630565643310547, -0.0043773651123046875, -0.004124164581298828, -0.0038709640502929688, -0.0036177635192871094, -0.00336456298828125, -0.0031113624572753906, -0.0028581619262695312, -0.002604961395263672, -0.0023517608642578125, -0.002098560333251953, -0.0018453598022460938, -0.0015921592712402344, -0.001338958740234375, -0.0010857582092285156, -0.0008325576782226562, -0.0005793571472167969, -0.0003261566162109375, -7.295608520507812e-05, 0.00018024444580078125, 0.0004334449768066406, 0.0006866455078125, 0.0009398460388183594, 0.0011930465698242188, 0.0014462471008300781, 0.0016994476318359375, 0.0019526481628417969, 0.0022058486938476562, 0.0024590492248535156, 0.002712249755859375, 0.0029654502868652344, 0.0032186508178710938, 0.003471851348876953, 0.0037250518798828125, 0.003978252410888672, 0.004231452941894531, 0.004484653472900391, 0.00473785400390625, 0.004991054534912109, 0.005244255065917969, 0.005497455596923828, 0.0057506561279296875, 0.006003856658935547, 0.006257057189941406, 0.006510257720947266, 0.006763458251953125, 0.007016658782958984, 0.007269859313964844, 0.007523059844970703, 0.0077762603759765625, 0.008029460906982422, 0.008282661437988281, 0.00853586196899414, 0.0087890625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 8.0, 19.0, 37.0, 66.0, 91.0, 136.0, 367.0, 1787.0, 4189489.0, 1623.0, 336.0, 129.0, 82.0, 50.0, 35.0, 22.0, 9.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0015964508056640625, -0.0015613436698913574, -0.0015262365341186523, -0.0014911293983459473, -0.0014560222625732422, -0.0014209151268005371, -0.001385807991027832, -0.001350700855255127, -0.0013155937194824219, -0.0012804865837097168, -0.0012453794479370117, -0.0012102723121643066, -0.0011751651763916016, -0.0011400580406188965, -0.0011049509048461914, -0.0010698437690734863, -0.0010347366333007812, -0.0009996294975280762, -0.0009645223617553711, -0.000929415225982666, -0.0008943080902099609, -0.0008592009544372559, -0.0008240938186645508, -0.0007889866828918457, -0.0007538795471191406, -0.0007187724113464355, -0.0006836652755737305, -0.0006485581398010254, -0.0006134510040283203, -0.0005783438682556152, -0.0005432367324829102, -0.0005081295967102051, -0.0004730224609375, -0.0004379153251647949, -0.00040280818939208984, -0.00036770105361938477, -0.0003325939178466797, -0.0002974867820739746, -0.00026237964630126953, -0.00022727251052856445, -0.00019216537475585938, -0.0001570582389831543, -0.00012195110321044922, -8.684396743774414e-05, -5.173683166503906e-05, -1.6629695892333984e-05, 1.8477439880371094e-05, 5.358457565307617e-05, 8.869171142578125e-05, 0.00012379884719848633, 0.0001589059829711914, 0.00019401311874389648, 0.00022912025451660156, 0.00026422739028930664, 0.0002993345260620117, 0.0003344416618347168, 0.0003695487976074219, 0.00040465593338012695, 0.00043976306915283203, 0.0004748702049255371, 0.0005099773406982422, 0.0005450844764709473, 0.0005801916122436523, 0.0006152987480163574, 0.0006504058837890625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4048.0, 24.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020301342010498047, -0.00019025243818759918, -0.0001774914562702179, -0.0001647304743528366, -0.00015196949243545532, -0.00013920851051807404, -0.00012644752860069275, -0.00011368654668331146, -0.00010092556476593018, -8.816458284854889e-05, -7.54036009311676e-05, -6.264261901378632e-05, -4.988163709640503e-05, -3.712065517902374e-05, -2.4359673261642456e-05, -1.159869134426117e-05, 1.1622905731201172e-06, 1.3923272490501404e-05, 2.668425440788269e-05, 3.944523632526398e-05, 5.2206218242645264e-05, 6.496720016002655e-05, 7.772818207740784e-05, 9.048916399478912e-05, 0.00010325014591217041, 0.0001160111278295517, 0.00012877210974693298, 0.00014153309166431427, 0.00015429407358169556, 0.00016705505549907684, 0.00017981603741645813, 0.00019257701933383942, 0.0002053380012512207, 0.000218098983168602, 0.00023085996508598328, 0.00024362094700336456, 0.00025638192892074585, 0.00026914291083812714, 0.0002819038927555084, 0.0002946648746728897, 0.000307425856590271, 0.0003201868385076523, 0.00033294782042503357, 0.00034570880234241486, 0.00035846978425979614, 0.00037123076617717743, 0.0003839917480945587, 0.00039675273001194, 0.0004095137119293213, 0.0004222746938467026, 0.00043503567576408386, 0.00044779665768146515, 0.00046055763959884644, 0.0004733186215162277, 0.000486079603433609, 0.0004988405853509903, 0.0005116015672683716, 0.0005243625491857529, 0.0005371235311031342, 0.0005498845130205154, 0.0005626454949378967, 0.000575406476855278, 0.0005881674587726593, 0.0006009284406900406, 0.0006136894226074219]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 9.0, 244.0, 733.0, 22.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001141307526268065, -0.0011142055736854672, -0.0010871035046875477, -0.00106000155210495, -0.0010328995995223522, -0.0010057975305244327, -0.000978695577941835, -0.0009515935671515763, -0.0009244915563613176, -0.000897389545571059, -0.0008702875347808003, -0.0008431855821982026, -0.000816083571407944, -0.0007889815606176853, -0.0007618796080350876, -0.0007347775972448289, -0.0007076755864545703, -0.0006805735756643116, -0.000653471564874053, -0.0006263696122914553, -0.0005992676015011966, -0.000572165590710938, -0.0005450636381283402, -0.0005179616273380816, -0.000490859616547823, -0.0004637576057575643, -0.0004366556240711361, -0.00040955364238470793, -0.0003824516315944493, -0.00035534962080419064, -0.00032824763911776245, -0.00030114565743133426, -0.0002740435884334147, -0.00024694157764315605, -0.00021983959595672786, -0.00019273759971838444, -0.00016563560348004103, -0.0001385336072416976, -0.00011143161100335419, -8.432961476501077e-05, -5.7227618526667356e-05, -3.012562228832394e-05, -3.023626049980521e-06, 2.4078370188362896e-05, 5.1180366426706314e-05, 7.828236266504973e-05, 0.00010538435890339315, 0.00013248635514173657, 0.00015958835138007998, 0.0001866903476184234, 0.00021379234385676682, 0.00024089434009511024, 0.00026799633633345366, 0.0002950983471237123, 0.0003222003288101405, 0.0003493023104965687, 0.0003764043212868273, 0.00040350633207708597, 0.00043060831376351416, 0.00045771029544994235, 0.000484812306240201, 0.0005119143170304596, 0.0005390163278207183, 0.000566118280403316, 0.0005932202911935747]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 5.0, 10.0, 27.0, 46.0, 66.0, 114.0, 153.0, 161.0, 126.0, 117.0, 77.0, 47.0, 26.0, 13.0, 7.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0013595819473266602, -0.0013292189687490463, -0.0012988559901714325, -0.0012684930115938187, -0.0012381300330162048, -0.001207767054438591, -0.0011774040758609772, -0.0011470410972833633, -0.0011166781187057495, -0.0010863151401281357, -0.0010559521615505219, -0.001025589182972908, -0.0009952262043952942, -0.0009648632258176804, -0.0009345002472400665, -0.0009041372686624527, -0.0008737742900848389, -0.000843411311507225, -0.0008130483329296112, -0.0007826853543519974, -0.0007523223757743835, -0.0007219593971967697, -0.0006915964186191559, -0.000661233440041542, -0.0006308704614639282, -0.0006005074828863144, -0.0005701445043087006, -0.0005397815257310867, -0.0005094185471534729, -0.00047905556857585907, -0.00044869258999824524, -0.0004183296114206314, -0.0003879666328430176, -0.00035760365426540375, -0.0003272406756877899, -0.0002968776971101761, -0.00026651471853256226, -0.00023615173995494843, -0.0002057887613773346, -0.00017542578279972076, -0.00014506280422210693, -0.0001146998256444931, -8.433684706687927e-05, -5.397386848926544e-05, -2.361088991165161e-05, 6.752088665962219e-06, 3.711506724357605e-05, 6.747804582118988e-05, 9.784102439880371e-05, 0.00012820400297641754, 0.00015856698155403137, 0.0001889299601316452, 0.00021929293870925903, 0.00024965591728687286, 0.0002800188958644867, 0.0003103818744421005, 0.00034074485301971436, 0.0003711078315973282, 0.000401470810174942, 0.00043183378875255585, 0.0004621967673301697, 0.0004925597459077835, 0.0005229227244853973, 0.0005532857030630112, 0.000583648681640625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 10.0, 10.0, 13.0, 7.0, 10.0, 21.0, 23.0, 23.0, 47.0, 57.0, 57.0, 109.0, 164.0, 309.0, 458.0, 874.0, 1733.0, 3964.0, 11264.0, 80638.0, 914859.0, 22315.0, 6302.0, 2517.0, 1164.0, 628.0, 319.0, 184.0, 135.0, 80.0, 51.0, 38.0, 34.0, 19.0, 24.0, 27.0, 11.0, 9.0, 9.0, 8.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.01837158203125, -0.01774311065673828, -0.017114639282226562, -0.016486167907714844, -0.015857696533203125, -0.015229225158691406, -0.014600753784179688, -0.013972282409667969, -0.01334381103515625, -0.012715339660644531, -0.012086868286132812, -0.011458396911621094, -0.010829925537109375, -0.010201454162597656, -0.009572982788085938, -0.008944511413574219, -0.0083160400390625, -0.007687568664550781, -0.0070590972900390625, -0.006430625915527344, -0.005802154541015625, -0.005173683166503906, -0.0045452117919921875, -0.003916740417480469, -0.00328826904296875, -0.0026597976684570312, -0.0020313262939453125, -0.0014028549194335938, -0.000774383544921875, -0.00014591217041015625, 0.0004825592041015625, 0.0011110305786132812, 0.001739501953125, 0.0023679733276367188, 0.0029964447021484375, 0.0036249160766601562, 0.004253387451171875, 0.004881858825683594, 0.0055103302001953125, 0.006138801574707031, 0.00676727294921875, 0.007395744323730469, 0.008024215698242188, 0.008652687072753906, 0.009281158447265625, 0.009909629821777344, 0.010538101196289062, 0.011166572570800781, 0.0117950439453125, 0.012423515319824219, 0.013051986694335938, 0.013680458068847656, 0.014308929443359375, 0.014937400817871094, 0.015565872192382812, 0.01619434356689453, 0.01682281494140625, 0.01745128631591797, 0.018079757690429688, 0.018708229064941406, 0.019336700439453125, 0.019965171813964844, 0.020593643188476562, 0.02122211456298828, 0.0218505859375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 4.0, 9.0, 16.0, 8.0, 9.0, 16.0, 45.0, 123.0, 269.0, 220.0, 118.0, 42.0, 11.0, 11.0, 11.0, 11.0, 8.0, 7.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 7.0, 5.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007162570953369141, -0.006909370422363281, -0.006656169891357422, -0.0064029693603515625, -0.006149768829345703, -0.005896568298339844, -0.005643367767333984, -0.005390167236328125, -0.005136966705322266, -0.004883766174316406, -0.004630565643310547, -0.0043773651123046875, -0.004124164581298828, -0.0038709640502929688, -0.0036177635192871094, -0.00336456298828125, -0.0031113624572753906, -0.0028581619262695312, -0.002604961395263672, -0.0023517608642578125, -0.002098560333251953, -0.0018453598022460938, -0.0015921592712402344, -0.001338958740234375, -0.0010857582092285156, -0.0008325576782226562, -0.0005793571472167969, -0.0003261566162109375, -7.295608520507812e-05, 0.00018024444580078125, 0.0004334449768066406, 0.0006866455078125, 0.0009398460388183594, 0.0011930465698242188, 0.0014462471008300781, 0.0016994476318359375, 0.0019526481628417969, 0.0022058486938476562, 0.0024590492248535156, 0.002712249755859375, 0.0029654502868652344, 0.0032186508178710938, 0.003471851348876953, 0.0037250518798828125, 0.003978252410888672, 0.004231452941894531, 0.004484653472900391, 0.00473785400390625, 0.004991054534912109, 0.005244255065917969, 0.005497455596923828, 0.0057506561279296875, 0.006003856658935547, 0.006257057189941406, 0.006510257720947266, 0.006763458251953125, 0.007016658782958984, 0.007269859313964844, 0.007523059844970703, 0.0077762603759765625, 0.008029460906982422, 0.008282661437988281, 0.00853586196899414, 0.0087890625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 4.0, 1.0, 4.0, 6.0, 5.0, 10.0, 17.0, 18.0, 9.0, 19.0, 24.0, 27.0, 21.0, 44.0, 38.0, 69.0, 140.0, 282.0, 709.0, 2291.0, 597852.0, 443244.0, 2288.0, 678.0, 281.0, 129.0, 86.0, 53.0, 33.0, 31.0, 27.0, 22.0, 14.0, 14.0, 15.0, 9.0, 5.0, 8.0, 4.0, 5.0, 9.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030914306640625, -0.029848098754882812, -0.028781890869140625, -0.027715682983398438, -0.02664947509765625, -0.025583267211914062, -0.024517059326171875, -0.023450851440429688, -0.0223846435546875, -0.021318435668945312, -0.020252227783203125, -0.019186019897460938, -0.01811981201171875, -0.017053604125976562, -0.015987396240234375, -0.014921188354492188, -0.01385498046875, -0.012788772583007812, -0.011722564697265625, -0.010656356811523438, -0.00959014892578125, -0.008523941040039062, -0.007457733154296875, -0.0063915252685546875, -0.0053253173828125, -0.0042591094970703125, -0.003192901611328125, -0.0021266937255859375, -0.00106048583984375, 5.7220458984375e-06, 0.001071929931640625, 0.0021381378173828125, 0.003204345703125, 0.0042705535888671875, 0.005336761474609375, 0.0064029693603515625, 0.00746917724609375, 0.008535385131835938, 0.009601593017578125, 0.010667800903320312, 0.0117340087890625, 0.012800216674804688, 0.013866424560546875, 0.014932632446289062, 0.01599884033203125, 0.017065048217773438, 0.018131256103515625, 0.019197463989257812, 0.020263671875, 0.021329879760742188, 0.022396087646484375, 0.023462295532226562, 0.02452850341796875, 0.025594711303710938, 0.026660919189453125, 0.027727127075195312, 0.0287933349609375, 0.029859542846679688, 0.030925750732421875, 0.03199195861816406, 0.03305816650390625, 0.03412437438964844, 0.035190582275390625, 0.03625679016113281, 0.037322998046875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 4.0, 2.0, 3.0, 6.0, 5.0, 10.0, 17.0, 18.0, 10.0, 18.0, 24.0, 28.0, 19.0, 39.0, 28.0, 31.0, 35.0, 42.0, 52.0, 51.0, 55.0, 59.0, 43.0, 39.0, 39.0, 40.0, 44.0, 40.0, 31.0, 30.0, 25.0, 23.0, 15.0, 13.0, 14.0, 10.0, 5.0, 8.0, 4.0, 5.0, 9.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0173187255859375, -0.016721248626708984, -0.01612377166748047, -0.015526294708251953, -0.014928817749023438, -0.014331340789794922, -0.013733863830566406, -0.01313638687133789, -0.012538909912109375, -0.01194143295288086, -0.011343955993652344, -0.010746479034423828, -0.010149002075195312, -0.009551525115966797, -0.008954048156738281, -0.008356571197509766, -0.00775909423828125, -0.007161617279052734, -0.006564140319824219, -0.005966663360595703, -0.0053691864013671875, -0.004771709442138672, -0.004174232482910156, -0.0035767555236816406, -0.002979278564453125, -0.0023818016052246094, -0.0017843246459960938, -0.0011868476867675781, -0.0005893707275390625, 8.106231689453125e-06, 0.0006055831909179688, 0.0012030601501464844, 0.001800537109375, 0.0023980140686035156, 0.0029954910278320312, 0.003592967987060547, 0.0041904449462890625, 0.004787921905517578, 0.005385398864746094, 0.005982875823974609, 0.006580352783203125, 0.007177829742431641, 0.007775306701660156, 0.008372783660888672, 0.008970260620117188, 0.009567737579345703, 0.010165214538574219, 0.010762691497802734, 0.01136016845703125, 0.011957645416259766, 0.012555122375488281, 0.013152599334716797, 0.013750076293945312, 0.014347553253173828, 0.014945030212402344, 0.01554250717163086, 0.016139984130859375, 0.01673746109008789, 0.017334938049316406, 0.017932415008544922, 0.018529891967773438, 0.019127368927001953, 0.01972484588623047, 0.020322322845458984, 0.0209197998046875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 7.0, 5.0, 11.0, 17.0, 14.0, 20.0, 46.0, 61.0, 111.0, 227.0, 531.0, 2243.0, 34725.0, 998807.0, 9618.0, 1303.0, 401.0, 156.0, 87.0, 54.0, 28.0, 22.0, 12.0, 14.0, 8.0, 5.0, 5.0, 2.0, 7.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1801719665527344e-05, -1.1458061635494232e-05, -1.111440360546112e-05, -1.0770745575428009e-05, -1.0427087545394897e-05, -1.0083429515361786e-05, -9.739771485328674e-06, -9.396113455295563e-06, -9.052455425262451e-06, -8.70879739522934e-06, -8.365139365196228e-06, -8.021481335163116e-06, -7.677823305130005e-06, -7.334165275096893e-06, -6.990507245063782e-06, -6.64684921503067e-06, -6.303191184997559e-06, -5.959533154964447e-06, -5.6158751249313354e-06, -5.272217094898224e-06, -4.928559064865112e-06, -4.584901034832001e-06, -4.241243004798889e-06, -3.897584974765778e-06, -3.553926944732666e-06, -3.2102689146995544e-06, -2.866610884666443e-06, -2.5229528546333313e-06, -2.1792948246002197e-06, -1.8356367945671082e-06, -1.4919787645339966e-06, -1.148320734500885e-06, -8.046627044677734e-07, -4.6100467443466187e-07, -1.1734664440155029e-07, 2.2631138563156128e-07, 5.699694156646729e-07, 9.136274456977844e-07, 1.257285475730896e-06, 1.6009435057640076e-06, 1.944601535797119e-06, 2.2882595658302307e-06, 2.6319175958633423e-06, 2.975575625896454e-06, 3.3192336559295654e-06, 3.662891685962677e-06, 4.0065497159957886e-06, 4.3502077460289e-06, 4.693865776062012e-06, 5.037523806095123e-06, 5.381181836128235e-06, 5.7248398661613464e-06, 6.068497896194458e-06, 6.41215592622757e-06, 6.755813956260681e-06, 7.099471986293793e-06, 7.443130016326904e-06, 7.786788046360016e-06, 8.130446076393127e-06, 8.474104106426239e-06, 8.81776213645935e-06, 9.161420166492462e-06, 9.505078196525574e-06, 9.848736226558685e-06, 1.0192394256591797e-05]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 5.0, 10.0, 10.0, 19.0, 19.0, 29.0, 38.0, 61.0, 53.0, 107.0, 91.0, 141.0, 112.0, 69.0, 56.0, 39.0, 28.0, 31.0, 16.0, 18.0, 7.0, 11.0, 4.0, 4.0, 4.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.318092346191406e-06, -6.1336904764175415e-06, -5.949288606643677e-06, -5.764886736869812e-06, -5.580484867095947e-06, -5.3960829973220825e-06, -5.211681127548218e-06, -5.027279257774353e-06, -4.842877388000488e-06, -4.6584755182266235e-06, -4.474073648452759e-06, -4.289671778678894e-06, -4.105269908905029e-06, -3.9208680391311646e-06, -3.7364661693573e-06, -3.552064299583435e-06, -3.3676624298095703e-06, -3.1832605600357056e-06, -2.998858690261841e-06, -2.814456820487976e-06, -2.6300549507141113e-06, -2.4456530809402466e-06, -2.261251211166382e-06, -2.076849341392517e-06, -1.8924474716186523e-06, -1.7080456018447876e-06, -1.5236437320709229e-06, -1.339241862297058e-06, -1.1548399925231934e-06, -9.704381227493286e-07, -7.860362529754639e-07, -6.016343832015991e-07, -4.172325134277344e-07, -2.3283064365386963e-07, -4.842877388000488e-08, 1.3597309589385986e-07, 3.203749656677246e-07, 5.047768354415894e-07, 6.891787052154541e-07, 8.735805749893188e-07, 1.0579824447631836e-06, 1.2423843145370483e-06, 1.426786184310913e-06, 1.6111880540847778e-06, 1.7955899238586426e-06, 1.9799917936325073e-06, 2.164393663406372e-06, 2.348795533180237e-06, 2.5331974029541016e-06, 2.7175992727279663e-06, 2.902001142501831e-06, 3.086403012275696e-06, 3.2708048820495605e-06, 3.4552067518234253e-06, 3.63960862159729e-06, 3.824010491371155e-06, 4.0084123611450195e-06, 4.192814230918884e-06, 4.377216100692749e-06, 4.561617970466614e-06, 4.7460198402404785e-06, 4.930421710014343e-06, 5.114823579788208e-06, 5.299225449562073e-06, 5.4836273193359375e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 5.0, 19.0, 26.0, 35.0, 80.0, 186.0, 880.0, 1032242.0, 14260.0, 490.0, 125.0, 72.0, 31.0, 33.0, 18.0, 12.0, 5.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-3.2961368560791016e-05, -3.206636756658554e-05, -3.1171366572380066e-05, -3.027636557817459e-05, -2.9381364583969116e-05, -2.848636358976364e-05, -2.7591362595558167e-05, -2.669636160135269e-05, -2.5801360607147217e-05, -2.4906359612941742e-05, -2.4011358618736267e-05, -2.3116357624530792e-05, -2.2221356630325317e-05, -2.1326355636119843e-05, -2.0431354641914368e-05, -1.9536353647708893e-05, -1.8641352653503418e-05, -1.7746351659297943e-05, -1.6851350665092468e-05, -1.5956349670886993e-05, -1.5061348676681519e-05, -1.4166347682476044e-05, -1.3271346688270569e-05, -1.2376345694065094e-05, -1.1481344699859619e-05, -1.0586343705654144e-05, -9.69134271144867e-06, -8.796341717243195e-06, -7.90134072303772e-06, -7.006339728832245e-06, -6.11133873462677e-06, -5.216337740421295e-06, -4.32133674621582e-06, -3.4263357520103455e-06, -2.5313347578048706e-06, -1.6363337635993958e-06, -7.413327693939209e-07, 1.5366822481155396e-07, 1.0486692190170288e-06, 1.9436702132225037e-06, 2.8386712074279785e-06, 3.7336722016334534e-06, 4.628673195838928e-06, 5.523674190044403e-06, 6.418675184249878e-06, 7.313676178455353e-06, 8.208677172660828e-06, 9.103678166866302e-06, 9.998679161071777e-06, 1.0893680155277252e-05, 1.1788681149482727e-05, 1.2683682143688202e-05, 1.3578683137893677e-05, 1.4473684132099152e-05, 1.5368685126304626e-05, 1.62636861205101e-05, 1.7158687114715576e-05, 1.805368810892105e-05, 1.8948689103126526e-05, 1.9843690097332e-05, 2.0738691091537476e-05, 2.163369208574295e-05, 2.2528693079948425e-05, 2.34236940741539e-05, 2.4318695068359375e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 3.0, 12.0, 14.0, 17.0, 31.0, 52.0, 67.0, 507.0, 72.0, 66.0, 32.0, 31.0, 19.0, 22.0, 11.0, 10.0, 5.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.8537044525146484e-05, -1.8034130334854126e-05, -1.7531216144561768e-05, -1.702830195426941e-05, -1.652538776397705e-05, -1.6022473573684692e-05, -1.5519559383392334e-05, -1.5016645193099976e-05, -1.4513731002807617e-05, -1.4010816812515259e-05, -1.35079026222229e-05, -1.3004988431930542e-05, -1.2502074241638184e-05, -1.1999160051345825e-05, -1.1496245861053467e-05, -1.0993331670761108e-05, -1.049041748046875e-05, -9.987503290176392e-06, -9.484589099884033e-06, -8.981674909591675e-06, -8.478760719299316e-06, -7.975846529006958e-06, -7.4729323387146e-06, -6.970018148422241e-06, -6.467103958129883e-06, -5.964189767837524e-06, -5.461275577545166e-06, -4.958361387252808e-06, -4.455447196960449e-06, -3.952533006668091e-06, -3.4496188163757324e-06, -2.946704626083374e-06, -2.4437904357910156e-06, -1.9408762454986572e-06, -1.4379620552062988e-06, -9.350478649139404e-07, -4.3213367462158203e-07, 7.078051567077637e-08, 5.736947059631348e-07, 1.0766088962554932e-06, 1.5795230865478516e-06, 2.08243727684021e-06, 2.5853514671325684e-06, 3.0882656574249268e-06, 3.591179847717285e-06, 4.0940940380096436e-06, 4.597008228302002e-06, 5.09992241859436e-06, 5.602836608886719e-06, 6.105750799179077e-06, 6.6086649894714355e-06, 7.111579179763794e-06, 7.614493370056152e-06, 8.11740756034851e-06, 8.620321750640869e-06, 9.123235940933228e-06, 9.626150131225586e-06, 1.0129064321517944e-05, 1.0631978511810303e-05, 1.1134892702102661e-05, 1.163780689239502e-05, 1.2140721082687378e-05, 1.2643635272979736e-05, 1.3146549463272095e-05, 1.3649463653564453e-05]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 9.0, 28.0, 133.0, 690.0, 120.0, 24.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10095751285552979, -0.09785737842321396, -0.09475723654031754, -0.09165710210800171, -0.08855696022510529, -0.08545682579278946, -0.08235669136047363, -0.07925654947757721, -0.07615640759468079, -0.07305627316236496, -0.06995613127946854, -0.06685599684715271, -0.06375585496425629, -0.06065572053194046, -0.057555582374334335, -0.05445544421672821, -0.051355309784412384, -0.04825517162680626, -0.045155033469200134, -0.04205489903688431, -0.038954757153987885, -0.03585462272167206, -0.03275448456406593, -0.02965434640645981, -0.026554208248853683, -0.02345407009124756, -0.020353931933641434, -0.017253795638680458, -0.014153657481074333, -0.011053519323468208, -0.007953383028507233, -0.004853244870901108, -0.001753106713294983, 0.0013470309786498547, 0.004447168670594692, 0.0075473058968782425, 0.010647444054484367, 0.013747582212090492, 0.016847718507051468, 0.019947856664657593, 0.023047994822263718, 0.026148132979869843, 0.029248271137475967, 0.03234840929508209, 0.03544854372739792, 0.03854868561029434, 0.04164882004261017, 0.04474895820021629, 0.04784909635782242, 0.05094923451542854, 0.05404937267303467, 0.057149507105350494, 0.06024964898824692, 0.06334978342056274, 0.06644992530345917, 0.069550059735775, 0.07265019416809082, 0.07575032860040665, 0.07885047048330307, 0.0819506049156189, 0.08505074679851532, 0.08815088123083115, 0.09125101566314697, 0.0943511575460434, 0.09745129942893982]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 3.0, 5.0, 11.0, 10.0, 10.0, 7.0, 21.0, 21.0, 21.0, 23.0, 24.0, 36.0, 34.0, 44.0, 47.0, 50.0, 47.0, 46.0, 41.0, 58.0, 48.0, 45.0, 33.0, 54.0, 37.0, 42.0, 30.0, 21.0, 17.0, 14.0, 17.0, 18.0, 12.0, 13.0, 7.0, 2.0, 7.0, 1.0, 2.0, 6.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.08758425712585449, -0.084969162940979, -0.08235406875610352, -0.07973897457122803, -0.07712388038635254, -0.07450878620147705, -0.07189369201660156, -0.06927859783172607, -0.06666350364685059, -0.0640484094619751, -0.06143331527709961, -0.05881822109222412, -0.05620312690734863, -0.053588032722473145, -0.050972938537597656, -0.04835784435272217, -0.04574275016784668, -0.04312765598297119, -0.0405125617980957, -0.037897467613220215, -0.03528237342834473, -0.03266727924346924, -0.03005218505859375, -0.02743709087371826, -0.024821996688842773, -0.022206902503967285, -0.019591808319091797, -0.01697671413421631, -0.01436161994934082, -0.011746525764465332, -0.009131431579589844, -0.0065163373947143555, -0.003901243209838867, -0.001286149024963379, 0.0013289451599121094, 0.003944039344787598, 0.006559133529663086, 0.009174227714538574, 0.011789321899414062, 0.01440441608428955, 0.01701951026916504, 0.019634604454040527, 0.022249698638916016, 0.024864792823791504, 0.027479887008666992, 0.03009498119354248, 0.03271007537841797, 0.03532516956329346, 0.037940263748168945, 0.040555357933044434, 0.04317045211791992, 0.04578554630279541, 0.0484006404876709, 0.05101573467254639, 0.053630828857421875, 0.05624592304229736, 0.05886101722717285, 0.06147611141204834, 0.06409120559692383, 0.06670629978179932, 0.0693213939666748, 0.07193648815155029, 0.07455158233642578, 0.07716667652130127, 0.07978177070617676]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 5.0, 3.0, 7.0, 6.0, 11.0, 11.0, 8.0, 14.0, 15.0, 18.0, 19.0, 27.0, 44.0, 63.0, 79.0, 137.0, 169.0, 383.0, 1254.0, 15528.0, 4172339.0, 2448.0, 680.0, 306.0, 180.0, 124.0, 77.0, 67.0, 37.0, 33.0, 37.0, 18.0, 29.0, 18.0, 14.0, 15.0, 12.0, 11.0, 3.0, 10.0, 6.0, 7.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0797119140625, -0.07698822021484375, -0.0742645263671875, -0.07154083251953125, -0.068817138671875, -0.06609344482421875, -0.0633697509765625, -0.06064605712890625, -0.05792236328125, -0.05519866943359375, -0.0524749755859375, -0.04975128173828125, -0.047027587890625, -0.04430389404296875, -0.0415802001953125, -0.03885650634765625, -0.0361328125, -0.03340911865234375, -0.0306854248046875, -0.02796173095703125, -0.025238037109375, -0.02251434326171875, -0.0197906494140625, -0.01706695556640625, -0.01434326171875, -0.01161956787109375, -0.0088958740234375, -0.00617218017578125, -0.003448486328125, -0.00072479248046875, 0.0019989013671875, 0.00472259521484375, 0.0074462890625, 0.01016998291015625, 0.0128936767578125, 0.01561737060546875, 0.018341064453125, 0.02106475830078125, 0.0237884521484375, 0.02651214599609375, 0.02923583984375, 0.03195953369140625, 0.0346832275390625, 0.03740692138671875, 0.040130615234375, 0.04285430908203125, 0.0455780029296875, 0.04830169677734375, 0.051025390625, 0.05374908447265625, 0.0564727783203125, 0.05919647216796875, 0.061920166015625, 0.06464385986328125, 0.0673675537109375, 0.07009124755859375, 0.07281494140625, 0.07553863525390625, 0.0782623291015625, 0.08098602294921875, 0.083709716796875, 0.08643341064453125, 0.0891571044921875, 0.09188079833984375, 0.0946044921875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 9.0, 15.0, 9.0, 9.0, 13.0, 45.0, 120.0, 257.0, 233.0, 122.0, 43.0, 11.0, 11.0, 11.0, 10.0, 9.0, 6.0, 4.0, 5.0, 1.0, 5.0, 3.0, 3.0, 5.0, 5.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007162809371948242, -0.006909847259521484, -0.0066568851470947266, -0.006403923034667969, -0.006150960922241211, -0.005897998809814453, -0.005645036697387695, -0.0053920745849609375, -0.00513911247253418, -0.004886150360107422, -0.004633188247680664, -0.004380226135253906, -0.0041272640228271484, -0.0038743019104003906, -0.003621339797973633, -0.003368377685546875, -0.003115415573120117, -0.0028624534606933594, -0.0026094913482666016, -0.0023565292358398438, -0.002103567123413086, -0.0018506050109863281, -0.0015976428985595703, -0.0013446807861328125, -0.0010917186737060547, -0.0008387565612792969, -0.0005857944488525391, -0.00033283233642578125, -7.987022399902344e-05, 0.00017309188842773438, 0.0004260540008544922, 0.00067901611328125, 0.0009319782257080078, 0.0011849403381347656, 0.0014379024505615234, 0.0016908645629882812, 0.001943826675415039, 0.002196788787841797, 0.0024497509002685547, 0.0027027130126953125, 0.0029556751251220703, 0.003208637237548828, 0.003461599349975586, 0.0037145614624023438, 0.0039675235748291016, 0.004220485687255859, 0.004473447799682617, 0.004726409912109375, 0.004979372024536133, 0.005232334136962891, 0.0054852962493896484, 0.005738258361816406, 0.005991220474243164, 0.006244182586669922, 0.00649714469909668, 0.0067501068115234375, 0.007003068923950195, 0.007256031036376953, 0.007508993148803711, 0.007761955261230469, 0.008014917373657227, 0.008267879486083984, 0.008520841598510742, 0.0087738037109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 2.0, 8.0, 4.0, 4.0, 11.0, 13.0, 17.0, 25.0, 22.0, 29.0, 51.0, 51.0, 58.0, 116.0, 362.0, 2306.0, 30882.0, 4146628.0, 11877.0, 1163.0, 215.0, 121.0, 62.0, 62.0, 38.0, 24.0, 13.0, 23.0, 17.0, 12.0, 6.0, 5.0, 11.0, 5.0, 7.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.0251617431640625, -0.024384021759033203, -0.023606300354003906, -0.02282857894897461, -0.022050857543945312, -0.021273136138916016, -0.02049541473388672, -0.019717693328857422, -0.018939971923828125, -0.018162250518798828, -0.01738452911376953, -0.016606807708740234, -0.015829086303710938, -0.01505136489868164, -0.014273643493652344, -0.013495922088623047, -0.01271820068359375, -0.011940479278564453, -0.011162757873535156, -0.01038503646850586, -0.009607315063476562, -0.008829593658447266, -0.008051872253417969, -0.007274150848388672, -0.006496429443359375, -0.005718708038330078, -0.004940986633300781, -0.004163265228271484, -0.0033855438232421875, -0.0026078224182128906, -0.0018301010131835938, -0.0010523796081542969, -0.000274658203125, 0.0005030632019042969, 0.0012807846069335938, 0.0020585060119628906, 0.0028362274169921875, 0.0036139488220214844, 0.004391670227050781, 0.005169391632080078, 0.005947113037109375, 0.006724834442138672, 0.007502555847167969, 0.008280277252197266, 0.009057998657226562, 0.00983572006225586, 0.010613441467285156, 0.011391162872314453, 0.01216888427734375, 0.012946605682373047, 0.013724327087402344, 0.01450204849243164, 0.015279769897460938, 0.016057491302490234, 0.01683521270751953, 0.017612934112548828, 0.018390655517578125, 0.019168376922607422, 0.01994609832763672, 0.020723819732666016, 0.021501541137695312, 0.02227926254272461, 0.023056983947753906, 0.023834705352783203, 0.0246124267578125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 4.0, 12.0, 12.0, 13.0, 14.0, 26.0, 55.0, 145.0, 600.0, 2208.0, 639.0, 189.0, 56.0, 12.0, 15.0, 7.0, 9.0, 7.0, 2.0, 2.0, 8.0, 4.0, 5.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01253509521484375, -0.012137889862060547, -0.011740684509277344, -0.01134347915649414, -0.010946273803710938, -0.010549068450927734, -0.010151863098144531, -0.009754657745361328, -0.009357452392578125, -0.008960247039794922, -0.008563041687011719, -0.008165836334228516, -0.0077686309814453125, -0.007371425628662109, -0.006974220275878906, -0.006577014923095703, -0.0061798095703125, -0.005782604217529297, -0.005385398864746094, -0.004988193511962891, -0.0045909881591796875, -0.004193782806396484, -0.0037965774536132812, -0.003399372100830078, -0.003002166748046875, -0.002604961395263672, -0.0022077560424804688, -0.0018105506896972656, -0.0014133453369140625, -0.0010161399841308594, -0.0006189346313476562, -0.00022172927856445312, 0.00017547607421875, 0.0005726814270019531, 0.0009698867797851562, 0.0013670921325683594, 0.0017642974853515625, 0.0021615028381347656, 0.0025587081909179688, 0.002955913543701172, 0.003353118896484375, 0.003750324249267578, 0.004147529602050781, 0.004544734954833984, 0.0049419403076171875, 0.005339145660400391, 0.005736351013183594, 0.006133556365966797, 0.00653076171875, 0.006927967071533203, 0.007325172424316406, 0.007722377777099609, 0.008119583129882812, 0.008516788482666016, 0.008913993835449219, 0.009311199188232422, 0.009708404541015625, 0.010105609893798828, 0.010502815246582031, 0.010900020599365234, 0.011297225952148438, 0.01169443130493164, 0.012091636657714844, 0.012488842010498047, 0.01288604736328125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 10.0, 22.0, 104.0, 586.0, 211.0, 41.0, 17.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014731462113559246, -0.013573849573731422, -0.012416237965226173, -0.01125862542539835, -0.010101012885570526, -0.008943401277065277, -0.0077857887372374535, -0.0066281771287322044, -0.005470564588904381, -0.0043129525147378445, -0.0031553402077406645, -0.0019977279007434845, -0.0008401158265769482, 0.00031749624758958817, 0.0014751087874174118, 0.002632720395922661, 0.0037903329357504845, 0.004947945009917021, 0.006105557084083557, 0.007263169623911381, 0.008420782163739204, 0.009578393772244453, 0.010736006312072277, 0.011893617920577526, 0.01305123046040535, 0.014208843000233173, 0.015366454608738422, 0.016524067148566246, 0.017681678757071495, 0.018839292228221893, 0.019996903836727142, 0.02115451544523239, 0.02231213077902794, 0.023469742387533188, 0.024627355858683586, 0.025784967467188835, 0.026942579075694084, 0.028100192546844482, 0.02925780415534973, 0.03041541576385498, 0.03157302737236023, 0.03273063898086548, 0.03388825058937073, 0.03504586219787598, 0.036203477531671524, 0.03736108914017677, 0.03851870074868202, 0.03967631235718727, 0.04083392769098282, 0.04199153929948807, 0.04314915090799332, 0.044306762516498566, 0.04546437785029411, 0.04662198945879936, 0.04777960106730461, 0.04893721267580986, 0.05009482428431511, 0.05125243589282036, 0.05241004750132561, 0.053567662835121155, 0.054725274443626404, 0.05588288605213165, 0.0570404976606369, 0.05819810926914215, 0.0593557208776474]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 3.0, 3.0, 5.0, 7.0, 9.0, 12.0, 20.0, 17.0, 28.0, 24.0, 16.0, 28.0, 28.0, 58.0, 43.0, 50.0, 42.0, 28.0, 45.0, 47.0, 55.0, 53.0, 45.0, 40.0, 53.0, 34.0, 26.0, 26.0, 24.0, 30.0, 18.0, 19.0, 15.0, 14.0, 9.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.03885149955749512, -0.0377403162419796, -0.03662913292646408, -0.03551795333623886, -0.03440677002072334, -0.033295586705207825, -0.032184407114982605, -0.031073223799467087, -0.02996204048395157, -0.02885085716843605, -0.02773967571556568, -0.026628494262695312, -0.025517310947179794, -0.024406127631664276, -0.023294946178793907, -0.022183764725923538, -0.02107258141040802, -0.019961398094892502, -0.018850216642022133, -0.017739035189151764, -0.016627851873636246, -0.015516669489443302, -0.014405487105250359, -0.013294304721057415, -0.012183122336864471, -0.011071939952671528, -0.009960757568478584, -0.00884957518428564, -0.007738392800092697, -0.006627210415899754, -0.00551602803170681, -0.004404845647513866, -0.003293663263320923, -0.0021824808791279793, -0.0010712984949350357, 3.988388925790787e-05, 0.0011510662734508514, 0.002262248657643795, 0.0033734310418367386, 0.004484613426029682, 0.005595795810222626, 0.006706978194415569, 0.007818160578608513, 0.008929342962801456, 0.0100405253469944, 0.011151707731187344, 0.012262890115380287, 0.01337407249957323, 0.014485254883766174, 0.015596437267959118, 0.01670761965215206, 0.01781880110502243, 0.01892998442053795, 0.020041167736053467, 0.021152349188923836, 0.022263530641794205, 0.023374713957309723, 0.02448589727282524, 0.02559707872569561, 0.02670826017856598, 0.027819443494081497, 0.028930626809597015, 0.030041808262467384, 0.031152989715337753, 0.03226417303085327]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 1.0, 8.0, 9.0, 10.0, 3.0, 20.0, 24.0, 26.0, 43.0, 51.0, 64.0, 99.0, 121.0, 203.0, 241.0, 333.0, 447.0, 691.0, 985.0, 1526.0, 2742.0, 5228.0, 14781.0, 174752.0, 813876.0, 18174.0, 5891.0, 2858.0, 1596.0, 1046.0, 756.0, 517.0, 401.0, 238.0, 214.0, 160.0, 103.0, 81.0, 66.0, 46.0, 28.0, 22.0, 27.0, 15.0, 13.0, 6.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.041656494140625, -0.04043436050415039, -0.03921222686767578, -0.03799009323120117, -0.03676795959472656, -0.03554582595825195, -0.034323692321777344, -0.033101558685302734, -0.031879425048828125, -0.030657291412353516, -0.029435157775878906, -0.028213024139404297, -0.026990890502929688, -0.025768756866455078, -0.02454662322998047, -0.02332448959350586, -0.02210235595703125, -0.02088022232055664, -0.01965808868408203, -0.018435955047607422, -0.017213821411132812, -0.015991687774658203, -0.014769554138183594, -0.013547420501708984, -0.012325286865234375, -0.011103153228759766, -0.009881019592285156, -0.008658885955810547, -0.0074367523193359375, -0.006214618682861328, -0.004992485046386719, -0.0037703514099121094, -0.0025482177734375, -0.0013260841369628906, -0.00010395050048828125, 0.0011181831359863281, 0.0023403167724609375, 0.003562450408935547, 0.004784584045410156, 0.006006717681884766, 0.007228851318359375, 0.008450984954833984, 0.009673118591308594, 0.010895252227783203, 0.012117385864257812, 0.013339519500732422, 0.014561653137207031, 0.01578378677368164, 0.01700592041015625, 0.01822805404663086, 0.01945018768310547, 0.020672321319580078, 0.021894454956054688, 0.023116588592529297, 0.024338722229003906, 0.025560855865478516, 0.026782989501953125, 0.028005123138427734, 0.029227256774902344, 0.030449390411376953, 0.03167152404785156, 0.03289365768432617, 0.03411579132080078, 0.03533792495727539, 0.03656005859375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 7.0, 16.0, 10.0, 8.0, 15.0, 43.0, 121.0, 252.0, 239.0, 122.0, 42.0, 11.0, 11.0, 12.0, 9.0, 9.0, 7.0, 3.0, 5.0, 1.0, 5.0, 3.0, 3.0, 5.0, 5.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007162928581237793, -0.006910085678100586, -0.006657242774963379, -0.006404399871826172, -0.006151556968688965, -0.005898714065551758, -0.005645871162414551, -0.005393028259277344, -0.005140185356140137, -0.00488734245300293, -0.004634499549865723, -0.004381656646728516, -0.004128813743591309, -0.0038759708404541016, -0.0036231279373168945, -0.0033702850341796875, -0.0031174421310424805, -0.0028645992279052734, -0.0026117563247680664, -0.0023589134216308594, -0.0021060705184936523, -0.0018532276153564453, -0.0016003847122192383, -0.0013475418090820312, -0.0010946989059448242, -0.0008418560028076172, -0.0005890130996704102, -0.0003361701965332031, -8.33272933959961e-05, 0.00016951560974121094, 0.00042235851287841797, 0.000675201416015625, 0.000928044319152832, 0.001180887222290039, 0.001433730125427246, 0.0016865730285644531, 0.0019394159317016602, 0.002192258834838867, 0.0024451017379760742, 0.0026979446411132812, 0.0029507875442504883, 0.0032036304473876953, 0.0034564733505249023, 0.0037093162536621094, 0.003962159156799316, 0.0042150020599365234, 0.0044678449630737305, 0.0047206878662109375, 0.0049735307693481445, 0.0052263736724853516, 0.005479216575622559, 0.005732059478759766, 0.005984902381896973, 0.00623774528503418, 0.006490588188171387, 0.006743431091308594, 0.006996273994445801, 0.007249116897583008, 0.007501959800720215, 0.007754802703857422, 0.008007645606994629, 0.008260488510131836, 0.008513331413269043, 0.00876617431640625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 6.0, 5.0, 13.0, 13.0, 16.0, 16.0, 24.0, 31.0, 46.0, 66.0, 85.0, 109.0, 143.0, 221.0, 352.0, 649.0, 1672.0, 41944.0, 997069.0, 3825.0, 886.0, 467.0, 255.0, 163.0, 130.0, 76.0, 60.0, 43.0, 52.0, 34.0, 29.0, 14.0, 11.0, 6.0, 9.0, 6.0, 1.0, 3.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039031982421875, -0.03769636154174805, -0.036360740661621094, -0.03502511978149414, -0.03368949890136719, -0.032353878021240234, -0.03101825714111328, -0.029682636260986328, -0.028347015380859375, -0.027011394500732422, -0.02567577362060547, -0.024340152740478516, -0.023004531860351562, -0.02166891098022461, -0.020333290100097656, -0.018997669219970703, -0.01766204833984375, -0.016326427459716797, -0.014990806579589844, -0.01365518569946289, -0.012319564819335938, -0.010983943939208984, -0.009648323059082031, -0.008312702178955078, -0.006977081298828125, -0.005641460418701172, -0.004305839538574219, -0.0029702186584472656, -0.0016345977783203125, -0.0002989768981933594, 0.0010366439819335938, 0.002372264862060547, 0.0037078857421875, 0.005043506622314453, 0.006379127502441406, 0.007714748382568359, 0.009050369262695312, 0.010385990142822266, 0.011721611022949219, 0.013057231903076172, 0.014392852783203125, 0.015728473663330078, 0.01706409454345703, 0.018399715423583984, 0.019735336303710938, 0.02107095718383789, 0.022406578063964844, 0.023742198944091797, 0.02507781982421875, 0.026413440704345703, 0.027749061584472656, 0.02908468246459961, 0.030420303344726562, 0.031755924224853516, 0.03309154510498047, 0.03442716598510742, 0.035762786865234375, 0.03709840774536133, 0.03843402862548828, 0.039769649505615234, 0.04110527038574219, 0.04244089126586914, 0.043776512145996094, 0.04511213302612305, 0.04644775390625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 5.0, 5.0, 11.0, 10.0, 9.0, 14.0, 16.0, 20.0, 25.0, 32.0, 35.0, 43.0, 45.0, 52.0, 45.0, 39.0, 35.0, 53.0, 64.0, 46.0, 46.0, 47.0, 42.0, 37.0, 38.0, 30.0, 23.0, 25.0, 31.0, 21.0, 20.0, 8.0, 6.0, 5.0, 9.0, 4.0, 1.0, 3.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0171051025390625, -0.016519784927368164, -0.015934467315673828, -0.015349149703979492, -0.014763832092285156, -0.01417851448059082, -0.013593196868896484, -0.013007879257202148, -0.012422561645507812, -0.011837244033813477, -0.01125192642211914, -0.010666608810424805, -0.010081291198730469, -0.009495973587036133, -0.008910655975341797, -0.008325338363647461, -0.007740020751953125, -0.007154703140258789, -0.006569385528564453, -0.005984067916870117, -0.005398750305175781, -0.004813432693481445, -0.004228115081787109, -0.0036427974700927734, -0.0030574798583984375, -0.0024721622467041016, -0.0018868446350097656, -0.0013015270233154297, -0.0007162094116210938, -0.0001308917999267578, 0.0004544258117675781, 0.001039743423461914, 0.00162506103515625, 0.002210378646850586, 0.002795696258544922, 0.003381013870239258, 0.003966331481933594, 0.00455164909362793, 0.005136966705322266, 0.0057222843170166016, 0.0063076019287109375, 0.0068929195404052734, 0.007478237152099609, 0.008063554763793945, 0.008648872375488281, 0.009234189987182617, 0.009819507598876953, 0.010404825210571289, 0.010990142822265625, 0.011575460433959961, 0.012160778045654297, 0.012746095657348633, 0.013331413269042969, 0.013916730880737305, 0.01450204849243164, 0.015087366104125977, 0.015672683715820312, 0.01625800132751465, 0.016843318939208984, 0.01742863655090332, 0.018013954162597656, 0.018599271774291992, 0.019184589385986328, 0.019769906997680664, 0.020355224609375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 4.0, 2.0, 5.0, 4.0, 6.0, 9.0, 9.0, 9.0, 11.0, 7.0, 16.0, 22.0, 29.0, 31.0, 37.0, 55.0, 58.0, 103.0, 141.0, 314.0, 455.0, 1007.0, 3273.0, 16442.0, 970193.0, 48851.0, 4466.0, 1402.0, 596.0, 362.0, 162.0, 120.0, 78.0, 66.0, 44.0, 36.0, 25.0, 21.0, 24.0, 12.0, 3.0, 12.0, 10.0, 7.0, 1.0, 7.0, 1.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8656253814697266e-05, -1.798197627067566e-05, -1.7307698726654053e-05, -1.6633421182632446e-05, -1.595914363861084e-05, -1.5284866094589233e-05, -1.4610588550567627e-05, -1.393631100654602e-05, -1.3262033462524414e-05, -1.2587755918502808e-05, -1.1913478374481201e-05, -1.1239200830459595e-05, -1.0564923286437988e-05, -9.890645742416382e-06, -9.216368198394775e-06, -8.542090654373169e-06, -7.867813110351562e-06, -7.193535566329956e-06, -6.51925802230835e-06, -5.844980478286743e-06, -5.170702934265137e-06, -4.49642539024353e-06, -3.822147846221924e-06, -3.1478703022003174e-06, -2.473592758178711e-06, -1.7993152141571045e-06, -1.125037670135498e-06, -4.507601261138916e-07, 2.2351741790771484e-07, 8.977949619293213e-07, 1.5720725059509277e-06, 2.246350049972534e-06, 2.9206275939941406e-06, 3.594905138015747e-06, 4.2691826820373535e-06, 4.94346022605896e-06, 5.617737770080566e-06, 6.292015314102173e-06, 6.966292858123779e-06, 7.640570402145386e-06, 8.314847946166992e-06, 8.989125490188599e-06, 9.663403034210205e-06, 1.0337680578231812e-05, 1.1011958122253418e-05, 1.1686235666275024e-05, 1.2360513210296631e-05, 1.3034790754318237e-05, 1.3709068298339844e-05, 1.438334584236145e-05, 1.5057623386383057e-05, 1.5731900930404663e-05, 1.640617847442627e-05, 1.7080456018447876e-05, 1.7754733562469482e-05, 1.842901110649109e-05, 1.9103288650512695e-05, 1.9777566194534302e-05, 2.0451843738555908e-05, 2.1126121282577515e-05, 2.180039882659912e-05, 2.2474676370620728e-05, 2.3148953914642334e-05, 2.382323145866394e-05, 2.4497509002685547e-05]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 3.0, 4.0, 5.0, 7.0, 6.0, 10.0, 5.0, 16.0, 14.0, 18.0, 21.0, 20.0, 38.0, 25.0, 53.0, 96.0, 96.0, 140.0, 91.0, 79.0, 45.0, 33.0, 32.0, 18.0, 25.0, 20.0, 18.0, 11.0, 5.0, 7.0, 6.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.927417755126953e-06, -7.636845111846924e-06, -7.3462724685668945e-06, -7.055699825286865e-06, -6.765127182006836e-06, -6.474554538726807e-06, -6.183981895446777e-06, -5.893409252166748e-06, -5.602836608886719e-06, -5.3122639656066895e-06, -5.02169132232666e-06, -4.731118679046631e-06, -4.4405460357666016e-06, -4.149973392486572e-06, -3.859400749206543e-06, -3.5688281059265137e-06, -3.2782554626464844e-06, -2.987682819366455e-06, -2.6971101760864258e-06, -2.4065375328063965e-06, -2.115964889526367e-06, -1.8253922462463379e-06, -1.5348196029663086e-06, -1.2442469596862793e-06, -9.5367431640625e-07, -6.631016731262207e-07, -3.725290298461914e-07, -8.195638656616211e-08, 2.086162567138672e-07, 4.991888999938965e-07, 7.897615432739258e-07, 1.080334186553955e-06, 1.3709068298339844e-06, 1.6614794731140137e-06, 1.952052116394043e-06, 2.2426247596740723e-06, 2.5331974029541016e-06, 2.823770046234131e-06, 3.11434268951416e-06, 3.4049153327941895e-06, 3.6954879760742188e-06, 3.986060619354248e-06, 4.276633262634277e-06, 4.567205905914307e-06, 4.857778549194336e-06, 5.148351192474365e-06, 5.4389238357543945e-06, 5.729496479034424e-06, 6.020069122314453e-06, 6.310641765594482e-06, 6.601214408874512e-06, 6.891787052154541e-06, 7.18235969543457e-06, 7.4729323387146e-06, 7.763504981994629e-06, 8.054077625274658e-06, 8.344650268554688e-06, 8.635222911834717e-06, 8.925795555114746e-06, 9.216368198394775e-06, 9.506940841674805e-06, 9.797513484954834e-06, 1.0088086128234863e-05, 1.0378658771514893e-05, 1.0669231414794922e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 2.0, 3.0, 7.0, 8.0, 13.0, 17.0, 21.0, 22.0, 43.0, 58.0, 97.0, 160.0, 406.0, 2040.0, 1034552.0, 9792.0, 715.0, 223.0, 128.0, 65.0, 56.0, 30.0, 23.0, 16.0, 6.0, 10.0, 9.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-8.761882781982422e-05, -8.52951779961586e-05, -8.297152817249298e-05, -8.064787834882736e-05, -7.832422852516174e-05, -7.600057870149612e-05, -7.36769288778305e-05, -7.135327905416489e-05, -6.902962923049927e-05, -6.670597940683365e-05, -6.438232958316803e-05, -6.205867975950241e-05, -5.973502993583679e-05, -5.741138011217117e-05, -5.5087730288505554e-05, -5.2764080464839935e-05, -5.0440430641174316e-05, -4.81167808175087e-05, -4.579313099384308e-05, -4.346948117017746e-05, -4.114583134651184e-05, -3.882218152284622e-05, -3.64985316991806e-05, -3.4174881875514984e-05, -3.1851232051849365e-05, -2.9527582228183746e-05, -2.7203932404518127e-05, -2.488028258085251e-05, -2.255663275718689e-05, -2.023298293352127e-05, -1.7909333109855652e-05, -1.5585683286190033e-05, -1.3262033462524414e-05, -1.0938383638858795e-05, -8.614733815193176e-06, -6.291083991527557e-06, -3.9674341678619385e-06, -1.6437843441963196e-06, 6.798654794692993e-07, 3.0035153031349182e-06, 5.327165126800537e-06, 7.650814950466156e-06, 9.974464774131775e-06, 1.2298114597797394e-05, 1.4621764421463013e-05, 1.694541424512863e-05, 1.926906406879425e-05, 2.159271389245987e-05, 2.3916363716125488e-05, 2.6240013539791107e-05, 2.8563663363456726e-05, 3.0887313187122345e-05, 3.3210963010787964e-05, 3.553461283445358e-05, 3.78582626581192e-05, 4.018191248178482e-05, 4.250556230545044e-05, 4.482921212911606e-05, 4.715286195278168e-05, 4.9476511776447296e-05, 5.1800161600112915e-05, 5.4123811423778534e-05, 5.644746124744415e-05, 5.877111107110977e-05, 6.109476089477539e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 7.0, 2.0, 5.0, 8.0, 8.0, 8.0, 21.0, 16.0, 23.0, 22.0, 44.0, 120.0, 346.0, 120.0, 81.0, 40.0, 35.0, 22.0, 14.0, 17.0, 8.0, 7.0, 4.0, 4.0, 4.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.844499588012695e-05, -3.745127469301224e-05, -3.645755350589752e-05, -3.5463832318782806e-05, -3.447011113166809e-05, -3.3476389944553375e-05, -3.248266875743866e-05, -3.1488947570323944e-05, -3.049522638320923e-05, -2.9501505196094513e-05, -2.8507784008979797e-05, -2.7514062821865082e-05, -2.6520341634750366e-05, -2.552662044763565e-05, -2.4532899260520935e-05, -2.353917807340622e-05, -2.2545456886291504e-05, -2.155173569917679e-05, -2.0558014512062073e-05, -1.9564293324947357e-05, -1.857057213783264e-05, -1.7576850950717926e-05, -1.658312976360321e-05, -1.5589408576488495e-05, -1.459568738937378e-05, -1.3601966202259064e-05, -1.2608245015144348e-05, -1.1614523828029633e-05, -1.0620802640914917e-05, -9.627081453800201e-06, -8.633360266685486e-06, -7.63963907957077e-06, -6.645917892456055e-06, -5.652196705341339e-06, -4.6584755182266235e-06, -3.664754331111908e-06, -2.6710331439971924e-06, -1.6773119568824768e-06, -6.835907697677612e-07, 3.1013041734695435e-07, 1.30385160446167e-06, 2.2975727915763855e-06, 3.291293978691101e-06, 4.285015165805817e-06, 5.278736352920532e-06, 6.272457540035248e-06, 7.266178727149963e-06, 8.259899914264679e-06, 9.253621101379395e-06, 1.024734228849411e-05, 1.1241063475608826e-05, 1.2234784662723541e-05, 1.3228505849838257e-05, 1.4222227036952972e-05, 1.5215948224067688e-05, 1.6209669411182404e-05, 1.720339059829712e-05, 1.8197111785411835e-05, 1.919083297252655e-05, 2.0184554159641266e-05, 2.117827534675598e-05, 2.2171996533870697e-05, 2.3165717720985413e-05, 2.4159438908100128e-05, 2.5153160095214844e-05]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 30.0, 921.0, 62.0], "bins": [-0.558448314666748, -0.5495374798774719, -0.5406267046928406, -0.5317158699035645, -0.5228050947189331, -0.513894259929657, -0.5049834847450256, -0.4960726499557495, -0.4871618449687958, -0.47825103998184204, -0.4693402349948883, -0.46042943000793457, -0.45151859521865845, -0.4426077902317047, -0.433696985244751, -0.42478618025779724, -0.4158753752708435, -0.40696457028388977, -0.39805376529693604, -0.3891429603099823, -0.38023215532302856, -0.37132132053375244, -0.3624105155467987, -0.35349971055984497, -0.34458890557289124, -0.3356781005859375, -0.32676729559898376, -0.31785649061203003, -0.3089456558227539, -0.30003485083580017, -0.29112404584884644, -0.2822132408618927, -0.2733024060726166, -0.26439160108566284, -0.2554807960987091, -0.24656997621059418, -0.23765917122364044, -0.2287483662366867, -0.21983754634857178, -0.21092674136161804, -0.2020159512758255, -0.19310514628887177, -0.18419432640075684, -0.1752835214138031, -0.16637271642684937, -0.15746191143989563, -0.1485511064529419, -0.13964028656482697, -0.13072948157787323, -0.1218186765909195, -0.11290786415338516, -0.10399705171585083, -0.0950862467288971, -0.08617544174194336, -0.07726462930440903, -0.0683538168668747, -0.05944300442934036, -0.05053219571709633, -0.041621387004852295, -0.03271057829260826, -0.023799769580364227, -0.014888960868120193, -0.00597815215587616, 0.002932656556367874, 0.011843464337289333]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 7.0, 5.0, 12.0, 10.0, 11.0, 17.0, 17.0, 22.0, 23.0, 22.0, 44.0, 32.0, 36.0, 38.0, 39.0, 66.0, 53.0, 65.0, 54.0, 59.0, 51.0, 41.0, 51.0, 32.0, 33.0, 31.0, 21.0, 17.0, 16.0, 13.0, 17.0, 11.0, 3.0, 10.0, 3.0, 2.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.08399641513824463, -0.08156851679086685, -0.07914061099290848, -0.0767127126455307, -0.07428480684757233, -0.07185690850019455, -0.06942901015281677, -0.0670011043548584, -0.06457320600748062, -0.062145303934812546, -0.05971740186214447, -0.05728950351476669, -0.05486160144209862, -0.05243369936943054, -0.050005801022052765, -0.04757789894938469, -0.045149996876716614, -0.04272209480404854, -0.04029419273138046, -0.037866294384002686, -0.03543839231133461, -0.033010490238666534, -0.030582590028643608, -0.028154689818620682, -0.025726787745952606, -0.02329888567328453, -0.020870985463261604, -0.018443085253238678, -0.016015183180570602, -0.013587282039225101, -0.0111593808978796, -0.008731480687856674, -0.006303578615188599, -0.0038756774738430977, -0.0014477763324975967, 0.0009801248088479042, 0.003408025950193405, 0.005835927091538906, 0.008263828232884407, 0.010691728442907333, 0.013119630515575409, 0.01554753165692091, 0.01797543279826641, 0.020403333008289337, 0.022831235080957413, 0.02525913715362549, 0.027687037363648415, 0.03011493757367134, 0.032542839646339417, 0.03497074171900749, 0.03739864379167557, 0.039826542139053345, 0.04225444421172142, 0.044682346284389496, 0.04711024463176727, 0.04953814670443535, 0.051966048777103424, 0.0543939508497715, 0.056821852922439575, 0.05924975126981735, 0.06167765334248543, 0.0641055554151535, 0.06653345376253128, 0.06896135210990906, 0.07138925790786743]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 5.0, 8.0, 7.0, 8.0, 5.0, 9.0, 15.0, 27.0, 24.0, 28.0, 44.0, 78.0, 274.0, 1536.0, 4191353.0, 497.0, 104.0, 44.0, 35.0, 34.0, 20.0, 19.0, 17.0, 14.0, 11.0, 5.0, 8.0, 8.0, 6.0, 5.0, 7.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.095703125, -2.024200439453125, -1.95269775390625, -1.881195068359375, -1.8096923828125, -1.738189697265625, -1.66668701171875, -1.595184326171875, -1.523681640625, -1.452178955078125, -1.38067626953125, -1.309173583984375, -1.2376708984375, -1.166168212890625, -1.09466552734375, -1.023162841796875, -0.95166015625, -0.880157470703125, -0.80865478515625, -0.737152099609375, -0.6656494140625, -0.594146728515625, -0.52264404296875, -0.451141357421875, -0.379638671875, -0.308135986328125, -0.23663330078125, -0.165130615234375, -0.0936279296875, -0.022125244140625, 0.04937744140625, 0.120880126953125, 0.1923828125, 0.263885498046875, 0.33538818359375, 0.406890869140625, 0.4783935546875, 0.549896240234375, 0.62139892578125, 0.692901611328125, 0.764404296875, 0.835906982421875, 0.90740966796875, 0.978912353515625, 1.0504150390625, 1.121917724609375, 1.19342041015625, 1.264923095703125, 1.33642578125, 1.407928466796875, 1.47943115234375, 1.550933837890625, 1.6224365234375, 1.693939208984375, 1.76544189453125, 1.836944580078125, 1.908447265625, 1.979949951171875, 2.05145263671875, 2.122955322265625, 2.1944580078125, 2.265960693359375, 2.33746337890625, 2.408966064453125, 2.48046875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 4.0, 7.0, 12.0, 15.0, 5.0, 16.0, 39.0, 112.0, 216.0, 259.0, 145.0, 47.0, 14.0, 11.0, 13.0, 7.0, 10.0, 6.0, 4.0, 5.0, 1.0, 5.0, 3.0, 2.0, 6.0, 4.0, 3.0, 0.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007163882255554199, -0.0069119930267333984, -0.006660103797912598, -0.006408214569091797, -0.006156325340270996, -0.005904436111450195, -0.0056525468826293945, -0.005400657653808594, -0.005148768424987793, -0.004896879196166992, -0.004644989967346191, -0.004393100738525391, -0.00414121150970459, -0.003889322280883789, -0.0036374330520629883, -0.0033855438232421875, -0.0031336545944213867, -0.002881765365600586, -0.002629876136779785, -0.0023779869079589844, -0.0021260976791381836, -0.0018742084503173828, -0.001622319221496582, -0.0013704299926757812, -0.0011185407638549805, -0.0008666515350341797, -0.0006147623062133789, -0.0003628730773925781, -0.00011098384857177734, 0.00014090538024902344, 0.0003927946090698242, 0.000644683837890625, 0.0008965730667114258, 0.0011484622955322266, 0.0014003515243530273, 0.0016522407531738281, 0.001904129981994629, 0.0021560192108154297, 0.0024079084396362305, 0.0026597976684570312, 0.002911686897277832, 0.003163576126098633, 0.0034154653549194336, 0.0036673545837402344, 0.003919243812561035, 0.004171133041381836, 0.004423022270202637, 0.0046749114990234375, 0.004926800727844238, 0.005178689956665039, 0.00543057918548584, 0.005682468414306641, 0.005934357643127441, 0.006186246871948242, 0.006438136100769043, 0.006690025329589844, 0.0069419145584106445, 0.007193803787231445, 0.007445693016052246, 0.007697582244873047, 0.007949471473693848, 0.008201360702514648, 0.00845324993133545, 0.00870513916015625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 8.0, 10.0, 11.0, 19.0, 18.0, 35.0, 49.0, 101.0, 145.0, 267.0, 603.0, 1485.0, 4477.0, 26272.0, 4135100.0, 19698.0, 3598.0, 1217.0, 497.0, 269.0, 132.0, 84.0, 51.0, 33.0, 29.0, 19.0, 13.0, 8.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.04852294921875, -0.046929359436035156, -0.04533576965332031, -0.04374217987060547, -0.042148590087890625, -0.04055500030517578, -0.03896141052246094, -0.037367820739746094, -0.03577423095703125, -0.034180641174316406, -0.03258705139160156, -0.03099346160888672, -0.029399871826171875, -0.02780628204345703, -0.026212692260742188, -0.024619102478027344, -0.0230255126953125, -0.021431922912597656, -0.019838333129882812, -0.01824474334716797, -0.016651153564453125, -0.015057563781738281, -0.013463973999023438, -0.011870384216308594, -0.01027679443359375, -0.008683204650878906, -0.0070896148681640625, -0.005496025085449219, -0.003902435302734375, -0.0023088455200195312, -0.0007152557373046875, 0.0008783340454101562, 0.002471923828125, 0.004065513610839844, 0.0056591033935546875, 0.007252693176269531, 0.008846282958984375, 0.010439872741699219, 0.012033462524414062, 0.013627052307128906, 0.01522064208984375, 0.016814231872558594, 0.018407821655273438, 0.02000141143798828, 0.021595001220703125, 0.02318859100341797, 0.024782180786132812, 0.026375770568847656, 0.0279693603515625, 0.029562950134277344, 0.031156539916992188, 0.03275012969970703, 0.034343719482421875, 0.03593730926513672, 0.03753089904785156, 0.039124488830566406, 0.04071807861328125, 0.042311668395996094, 0.04390525817871094, 0.04549884796142578, 0.047092437744140625, 0.04868602752685547, 0.05027961730957031, 0.051873207092285156, 0.053466796875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 4.0, 1.0, 6.0, 6.0, 10.0, 5.0, 9.0, 10.0, 26.0, 60.0, 252.0, 3067.0, 407.0, 96.0, 35.0, 14.0, 9.0, 7.0, 7.0, 3.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.01409149169921875, -0.013717055320739746, -0.013342618942260742, -0.012968182563781738, -0.012593746185302734, -0.01221930980682373, -0.011844873428344727, -0.011470437049865723, -0.011096000671386719, -0.010721564292907715, -0.010347127914428711, -0.009972691535949707, -0.009598255157470703, -0.0092238187789917, -0.008849382400512695, -0.008474946022033691, -0.008100509643554688, -0.007726073265075684, -0.00735163688659668, -0.006977200508117676, -0.006602764129638672, -0.006228327751159668, -0.005853891372680664, -0.00547945499420166, -0.005105018615722656, -0.004730582237243652, -0.0043561458587646484, -0.0039817094802856445, -0.0036072731018066406, -0.0032328367233276367, -0.002858400344848633, -0.002483963966369629, -0.002109527587890625, -0.001735091209411621, -0.0013606548309326172, -0.0009862184524536133, -0.0006117820739746094, -0.00023734569549560547, 0.00013709068298339844, 0.0005115270614624023, 0.0008859634399414062, 0.0012603998184204102, 0.001634836196899414, 0.002009272575378418, 0.002383708953857422, 0.0027581453323364258, 0.0031325817108154297, 0.0035070180892944336, 0.0038814544677734375, 0.004255890846252441, 0.004630327224731445, 0.005004763603210449, 0.005379199981689453, 0.005753636360168457, 0.006128072738647461, 0.006502509117126465, 0.006876945495605469, 0.007251381874084473, 0.0076258182525634766, 0.00800025463104248, 0.008374691009521484, 0.008749127388000488, 0.009123563766479492, 0.009498000144958496, 0.0098724365234375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 18.0, 111.0, 628.0, 153.0, 47.0, 22.0, 14.0, 8.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055271510034799576, -0.048703815788030624, -0.04213612154126167, -0.03556842729449272, -0.02900073304772377, -0.02243303880095482, -0.015865344554185867, -0.009297650307416916, -0.0027299560606479645, 0.003837738186120987, 0.010405432432889938, 0.01697312667965889, 0.02354082092642784, 0.030108515173196793, 0.036676209419965744, 0.043243903666734695, 0.04981159791350365, 0.0563792921602726, 0.06294699013233185, 0.0695146769285202, 0.07608237862586975, 0.0826500654220581, 0.08921776711940765, 0.09578545391559601, 0.10235315561294556, 0.10892084985971451, 0.11548854410648346, 0.12205623835325241, 0.12862393260002136, 0.13519161939620972, 0.14175932109355927, 0.1483270227909088, 0.15489470958709717, 0.16146239638328552, 0.16803009808063507, 0.17459779977798462, 0.18116548657417297, 0.18773317337036133, 0.19430087506771088, 0.20086857676506042, 0.20743626356124878, 0.21400395035743713, 0.22057165205478668, 0.22713935375213623, 0.23370704054832458, 0.24027472734451294, 0.2468424290418625, 0.25341013073921204, 0.2599778175354004, 0.26654550433158875, 0.2731131911277771, 0.27968090772628784, 0.2862485945224762, 0.29281628131866455, 0.2993839979171753, 0.30595168471336365, 0.312519371509552, 0.31908705830574036, 0.3256547451019287, 0.33222246170043945, 0.3387901484966278, 0.34535783529281616, 0.3519255518913269, 0.35849323868751526, 0.3650609254837036]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 6.0, 3.0, 7.0, 8.0, 12.0, 11.0, 20.0, 16.0, 35.0, 35.0, 36.0, 40.0, 56.0, 52.0, 44.0, 49.0, 53.0, 51.0, 71.0, 60.0, 48.0, 46.0, 40.0, 47.0, 37.0, 22.0, 22.0, 15.0, 15.0, 11.0, 11.0, 6.0, 9.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.035768866539001465, -0.0345376580953598, -0.03330644965171814, -0.03207524120807648, -0.030844032764434814, -0.029612824320793152, -0.02838161587715149, -0.027150407433509827, -0.025919198989868164, -0.0246879905462265, -0.02345678210258484, -0.022225573658943176, -0.020994365215301514, -0.01976315677165985, -0.01853194832801819, -0.017300739884376526, -0.016069531440734863, -0.0148383229970932, -0.013607114553451538, -0.012375906109809875, -0.011144697666168213, -0.00991348922252655, -0.008682280778884888, -0.007451072335243225, -0.0062198638916015625, -0.0049886554479599, -0.0037574470043182373, -0.0025262385606765747, -0.0012950301170349121, -6.382167339324951e-05, 0.001167386770248413, 0.0023985952138900757, 0.0036298036575317383, 0.004861012101173401, 0.0060922205448150635, 0.007323428988456726, 0.008554637432098389, 0.009785845875740051, 0.011017054319381714, 0.012248262763023376, 0.013479471206665039, 0.014710679650306702, 0.015941888093948364, 0.017173096537590027, 0.01840430498123169, 0.019635513424873352, 0.020866721868515015, 0.022097930312156677, 0.02332913875579834, 0.024560347199440002, 0.025791555643081665, 0.027022764086723328, 0.02825397253036499, 0.029485180974006653, 0.030716389417648315, 0.03194759786128998, 0.03317880630493164, 0.0344100147485733, 0.035641223192214966, 0.03687243163585663, 0.03810364007949829, 0.039334848523139954, 0.040566056966781616, 0.04179726541042328, 0.04302847385406494]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 7.0, 6.0, 11.0, 11.0, 20.0, 33.0, 38.0, 74.0, 128.0, 196.0, 376.0, 896.0, 2119.0, 6072.0, 26431.0, 954107.0, 44849.0, 8121.0, 2785.0, 1128.0, 536.0, 241.0, 138.0, 87.0, 43.0, 31.0, 12.0, 16.0, 11.0, 4.0, 3.0, 6.0, 1.0, 2.0, 5.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0655517578125, -0.0633382797241211, -0.06112480163574219, -0.05891132354736328, -0.056697845458984375, -0.05448436737060547, -0.05227088928222656, -0.050057411193847656, -0.04784393310546875, -0.045630455017089844, -0.04341697692871094, -0.04120349884033203, -0.038990020751953125, -0.03677654266357422, -0.03456306457519531, -0.032349586486816406, -0.0301361083984375, -0.027922630310058594, -0.025709152221679688, -0.02349567413330078, -0.021282196044921875, -0.01906871795654297, -0.016855239868164062, -0.014641761779785156, -0.01242828369140625, -0.010214805603027344, -0.008001327514648438, -0.005787849426269531, -0.003574371337890625, -0.0013608932495117188, 0.0008525848388671875, 0.0030660629272460938, 0.005279541015625, 0.007493019104003906, 0.009706497192382812, 0.011919975280761719, 0.014133453369140625, 0.01634693145751953, 0.018560409545898438, 0.020773887634277344, 0.02298736572265625, 0.025200843811035156, 0.027414321899414062, 0.02962779998779297, 0.031841278076171875, 0.03405475616455078, 0.03626823425292969, 0.038481712341308594, 0.0406951904296875, 0.042908668518066406, 0.04512214660644531, 0.04733562469482422, 0.049549102783203125, 0.05176258087158203, 0.05397605895996094, 0.056189537048339844, 0.05840301513671875, 0.060616493225097656, 0.06282997131347656, 0.06504344940185547, 0.06725692749023438, 0.06947040557861328, 0.07168388366699219, 0.0738973617553711, 0.07611083984375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 2.0, 3.0, 10.0, 12.0, 12.0, 15.0, 14.0, 67.0, 136.0, 233.0, 216.0, 116.0, 46.0, 16.0, 11.0, 10.0, 11.0, 8.0, 5.0, 4.0, 3.0, 1.0, 6.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007381439208984375, -0.007128655910491943, -0.006875872611999512, -0.00662308931350708, -0.0063703060150146484, -0.006117522716522217, -0.005864739418029785, -0.0056119561195373535, -0.005359172821044922, -0.00510638952255249, -0.004853606224060059, -0.004600822925567627, -0.004348039627075195, -0.004095256328582764, -0.003842473030090332, -0.0035896897315979004, -0.0033369064331054688, -0.003084123134613037, -0.0028313398361206055, -0.002578556537628174, -0.002325773239135742, -0.0020729899406433105, -0.001820206642150879, -0.0015674233436584473, -0.0013146400451660156, -0.001061856746673584, -0.0008090734481811523, -0.0005562901496887207, -0.00030350685119628906, -5.072355270385742e-05, 0.00020205974578857422, 0.00045484304428100586, 0.0007076263427734375, 0.0009604096412658691, 0.0012131929397583008, 0.0014659762382507324, 0.001718759536743164, 0.0019715428352355957, 0.0022243261337280273, 0.002477109432220459, 0.0027298927307128906, 0.0029826760292053223, 0.003235459327697754, 0.0034882426261901855, 0.003741025924682617, 0.003993809223175049, 0.0042465925216674805, 0.004499375820159912, 0.004752159118652344, 0.005004942417144775, 0.005257725715637207, 0.005510509014129639, 0.00576329231262207, 0.006016075611114502, 0.006268858909606934, 0.006521642208099365, 0.006774425506591797, 0.0070272088050842285, 0.00727999210357666, 0.007532775402069092, 0.0077855587005615234, 0.008038341999053955, 0.008291125297546387, 0.008543908596038818, 0.00879669189453125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 0.0, 5.0, 5.0, 8.0, 6.0, 13.0, 20.0, 23.0, 30.0, 34.0, 47.0, 51.0, 81.0, 130.0, 189.0, 275.0, 440.0, 776.0, 1612.0, 3682.0, 10355.0, 38986.0, 416877.0, 515853.0, 40892.0, 10645.0, 3739.0, 1571.0, 817.0, 473.0, 274.0, 199.0, 116.0, 86.0, 68.0, 43.0, 30.0, 21.0, 24.0, 17.0, 12.0, 9.0, 7.0, 9.0, 4.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0298309326171875, -0.028927326202392578, -0.028023719787597656, -0.027120113372802734, -0.026216506958007812, -0.02531290054321289, -0.02440929412841797, -0.023505687713623047, -0.022602081298828125, -0.021698474884033203, -0.02079486846923828, -0.01989126205444336, -0.018987655639648438, -0.018084049224853516, -0.017180442810058594, -0.016276836395263672, -0.01537322998046875, -0.014469623565673828, -0.013566017150878906, -0.012662410736083984, -0.011758804321289062, -0.01085519790649414, -0.009951591491699219, -0.009047985076904297, -0.008144378662109375, -0.007240772247314453, -0.006337165832519531, -0.005433559417724609, -0.0045299530029296875, -0.0036263465881347656, -0.0027227401733398438, -0.0018191337585449219, -0.00091552734375, -1.1920928955078125e-05, 0.0008916854858398438, 0.0017952919006347656, 0.0026988983154296875, 0.0036025047302246094, 0.004506111145019531, 0.005409717559814453, 0.006313323974609375, 0.007216930389404297, 0.008120536804199219, 0.00902414321899414, 0.009927749633789062, 0.010831356048583984, 0.011734962463378906, 0.012638568878173828, 0.01354217529296875, 0.014445781707763672, 0.015349388122558594, 0.016252994537353516, 0.017156600952148438, 0.01806020736694336, 0.01896381378173828, 0.019867420196533203, 0.020771026611328125, 0.021674633026123047, 0.02257823944091797, 0.02348184585571289, 0.024385452270507812, 0.025289058685302734, 0.026192665100097656, 0.027096271514892578, 0.0279998779296875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 9.0, 9.0, 8.0, 9.0, 8.0, 7.0, 16.0, 20.0, 18.0, 29.0, 40.0, 34.0, 34.0, 35.0, 46.0, 53.0, 52.0, 45.0, 55.0, 46.0, 44.0, 53.0, 26.0, 44.0, 35.0, 46.0, 23.0, 21.0, 25.0, 14.0, 26.0, 15.0, 8.0, 8.0, 8.0, 7.0, 1.0, 3.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01538848876953125, -0.01487743854522705, -0.014366388320922852, -0.013855338096618652, -0.013344287872314453, -0.012833237648010254, -0.012322187423706055, -0.011811137199401855, -0.011300086975097656, -0.010789036750793457, -0.010277986526489258, -0.009766936302185059, -0.00925588607788086, -0.00874483585357666, -0.008233785629272461, -0.007722735404968262, -0.0072116851806640625, -0.006700634956359863, -0.006189584732055664, -0.005678534507751465, -0.005167484283447266, -0.004656434059143066, -0.004145383834838867, -0.003634333610534668, -0.0031232833862304688, -0.0026122331619262695, -0.0021011829376220703, -0.001590132713317871, -0.0010790824890136719, -0.0005680322647094727, -5.698204040527344e-05, 0.0004540681838989258, 0.000965118408203125, 0.0014761686325073242, 0.0019872188568115234, 0.0024982690811157227, 0.003009319305419922, 0.003520369529724121, 0.00403141975402832, 0.0045424699783325195, 0.005053520202636719, 0.005564570426940918, 0.006075620651245117, 0.006586670875549316, 0.007097721099853516, 0.007608771324157715, 0.008119821548461914, 0.008630871772766113, 0.009141921997070312, 0.009652972221374512, 0.010164022445678711, 0.01067507266998291, 0.01118612289428711, 0.011697173118591309, 0.012208223342895508, 0.012719273567199707, 0.013230323791503906, 0.013741374015808105, 0.014252424240112305, 0.014763474464416504, 0.015274524688720703, 0.015785574913024902, 0.0162966251373291, 0.0168076753616333, 0.0173187255859375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 10.0, 8.0, 15.0, 23.0, 35.0, 57.0, 72.0, 106.0, 153.0, 278.0, 465.0, 831.0, 1750.0, 3743.0, 9810.0, 36135.0, 616434.0, 331763.0, 31021.0, 8824.0, 3425.0, 1628.0, 826.0, 391.0, 269.0, 151.0, 111.0, 61.0, 45.0, 28.0, 21.0, 16.0, 8.0, 7.0, 6.0, 7.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012264251708984375, -0.001188039779663086, -0.0011496543884277344, -0.0011112689971923828, -0.0010728836059570312, -0.0010344982147216797, -0.0009961128234863281, -0.0009577274322509766, -0.000919342041015625, -0.0008809566497802734, -0.0008425712585449219, -0.0008041858673095703, -0.0007658004760742188, -0.0007274150848388672, -0.0006890296936035156, -0.0006506443023681641, -0.0006122589111328125, -0.0005738735198974609, -0.0005354881286621094, -0.0004971027374267578, -0.00045871734619140625, -0.0004203319549560547, -0.0003819465637207031, -0.00034356117248535156, -0.00030517578125, -0.00026679039001464844, -0.00022840499877929688, -0.0001900196075439453, -0.00015163421630859375, -0.00011324882507324219, -7.486343383789062e-05, -3.647804260253906e-05, 1.9073486328125e-06, 4.029273986816406e-05, 7.867813110351562e-05, 0.00011706352233886719, 0.00015544891357421875, 0.0001938343048095703, 0.00023221969604492188, 0.00027060508728027344, 0.000308990478515625, 0.00034737586975097656, 0.0003857612609863281, 0.0004241466522216797, 0.00046253204345703125, 0.0005009174346923828, 0.0005393028259277344, 0.0005776882171630859, 0.0006160736083984375, 0.0006544589996337891, 0.0006928443908691406, 0.0007312297821044922, 0.0007696151733398438, 0.0008080005645751953, 0.0008463859558105469, 0.0008847713470458984, 0.00092315673828125, 0.0009615421295166016, 0.0009999275207519531, 0.0010383129119873047, 0.0010766983032226562, 0.0011150836944580078, 0.0011534690856933594, 0.001191854476928711, 0.0012302398681640625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 1.0, 8.0, 5.0, 8.0, 6.0, 22.0, 123.0, 502.0, 232.0, 33.0, 12.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.073713302612305e-05, -5.881674587726593e-05, -5.6896358728408813e-05, -5.49759715795517e-05, -5.305558443069458e-05, -5.113519728183746e-05, -4.921481013298035e-05, -4.729442298412323e-05, -4.537403583526611e-05, -4.3453648686408997e-05, -4.153326153755188e-05, -3.961287438869476e-05, -3.7692487239837646e-05, -3.577210009098053e-05, -3.385171294212341e-05, -3.1931325793266296e-05, -3.001093864440918e-05, -2.8090551495552063e-05, -2.6170164346694946e-05, -2.424977719783783e-05, -2.2329390048980713e-05, -2.0409002900123596e-05, -1.848861575126648e-05, -1.6568228602409363e-05, -1.4647841453552246e-05, -1.272745430469513e-05, -1.0807067155838013e-05, -8.886680006980896e-06, -6.966292858123779e-06, -5.045905709266663e-06, -3.125518560409546e-06, -1.2051314115524292e-06, 7.152557373046875e-07, 2.635642886161804e-06, 4.556030035018921e-06, 6.476417183876038e-06, 8.396804332733154e-06, 1.0317191481590271e-05, 1.2237578630447388e-05, 1.4157965779304504e-05, 1.607835292816162e-05, 1.7998740077018738e-05, 1.9919127225875854e-05, 2.183951437473297e-05, 2.3759901523590088e-05, 2.5680288672447205e-05, 2.760067582130432e-05, 2.9521062970161438e-05, 3.1441450119018555e-05, 3.336183726787567e-05, 3.528222441673279e-05, 3.7202611565589905e-05, 3.912299871444702e-05, 4.104338586330414e-05, 4.2963773012161255e-05, 4.488416016101837e-05, 4.680454730987549e-05, 4.8724934458732605e-05, 5.064532160758972e-05, 5.256570875644684e-05, 5.4486095905303955e-05, 5.640648305416107e-05, 5.832687020301819e-05, 6.0247257351875305e-05, 6.216764450073242e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 9.0, 11.0, 17.0, 11.0, 19.0, 17.0, 29.0, 39.0, 58.0, 94.0, 135.0, 180.0, 322.0, 584.0, 1201.0, 2511.0, 7219.0, 28643.0, 629008.0, 341937.0, 24906.0, 6571.0, 2396.0, 1133.0, 560.0, 307.0, 187.0, 135.0, 92.0, 52.0, 40.0, 30.0, 24.0, 14.0, 12.0, 14.0, 6.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0012083053588867188, -0.0011692792177200317, -0.0011302530765533447, -0.0010912269353866577, -0.0010522007942199707, -0.0010131746530532837, -0.0009741485118865967, -0.0009351223707199097, -0.0008960962295532227, -0.0008570700883865356, -0.0008180439472198486, -0.0007790178060531616, -0.0007399916648864746, -0.0007009655237197876, -0.0006619393825531006, -0.0006229132413864136, -0.0005838871002197266, -0.0005448609590530396, -0.0005058348178863525, -0.00046680867671966553, -0.0004277825355529785, -0.0003887563943862915, -0.0003497302532196045, -0.0003107041120529175, -0.00027167797088623047, -0.00023265182971954346, -0.00019362568855285645, -0.00015459954738616943, -0.00011557340621948242, -7.654726505279541e-05, -3.75211238861084e-05, 1.5050172805786133e-06, 4.0531158447265625e-05, 7.955729961395264e-05, 0.00011858344078063965, 0.00015760958194732666, 0.00019663572311401367, 0.00023566186428070068, 0.0002746880054473877, 0.0003137141466140747, 0.0003527402877807617, 0.00039176642894744873, 0.00043079257011413574, 0.00046981871128082275, 0.0005088448524475098, 0.0005478709936141968, 0.0005868971347808838, 0.0006259232759475708, 0.0006649494171142578, 0.0007039755582809448, 0.0007430016994476318, 0.0007820278406143188, 0.0008210539817810059, 0.0008600801229476929, 0.0008991062641143799, 0.0009381324052810669, 0.000977158546447754, 0.001016184687614441, 0.001055210828781128, 0.001094236969947815, 0.001133263111114502, 0.001172289252281189, 0.001211315393447876, 0.001250341534614563, 0.00128936767578125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 6.0, 10.0, 10.0, 7.0, 15.0, 23.0, 18.0, 18.0, 27.0, 41.0, 42.0, 64.0, 86.0, 75.0, 95.0, 92.0, 69.0, 49.0, 44.0, 52.0, 27.0, 22.0, 18.0, 20.0, 8.0, 11.0, 10.0, 4.0, 6.0, 4.0, 2.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007576942443847656, -0.000734962522983551, -0.0007122308015823364, -0.0006894990801811218, -0.0006667673587799072, -0.0006440356373786926, -0.000621303915977478, -0.0005985721945762634, -0.0005758404731750488, -0.0005531087517738342, -0.0005303770303726196, -0.000507645308971405, -0.00048491358757019043, -0.00046218186616897583, -0.00043945014476776123, -0.00041671842336654663, -0.00039398670196533203, -0.00037125498056411743, -0.00034852325916290283, -0.00032579153776168823, -0.00030305981636047363, -0.00028032809495925903, -0.00025759637355804443, -0.00023486465215682983, -0.00021213293075561523, -0.00018940120935440063, -0.00016666948795318604, -0.00014393776655197144, -0.00012120604515075684, -9.847432374954224e-05, -7.574260234832764e-05, -5.301088094711304e-05, -3.0279159545898438e-05, -7.547438144683838e-06, 1.5184283256530762e-05, 3.791600465774536e-05, 6.064772605895996e-05, 8.337944746017456e-05, 0.00010611116886138916, 0.00012884289026260376, 0.00015157461166381836, 0.00017430633306503296, 0.00019703805446624756, 0.00021976977586746216, 0.00024250149726867676, 0.00026523321866989136, 0.00028796494007110596, 0.00031069666147232056, 0.00033342838287353516, 0.00035616010427474976, 0.00037889182567596436, 0.00040162354707717896, 0.00042435526847839355, 0.00044708698987960815, 0.00046981871128082275, 0.0004925504326820374, 0.000515282154083252, 0.0005380138754844666, 0.0005607455968856812, 0.0005834773182868958, 0.0006062090396881104, 0.000628940761089325, 0.0006516724824905396, 0.0006744042038917542, 0.0006971359252929688]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 7.0, 10.0, 16.0, 22.0, 30.0, 76.0, 159.0, 247.0, 197.0, 99.0, 43.0, 36.0, 24.0, 10.0, 8.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1494062840938568, -0.14543524384498596, -0.1414642184972763, -0.13749317824840546, -0.1335221529006958, -0.12955111265182495, -0.1255800873041153, -0.12160904705524445, -0.11763802170753479, -0.11366698890924454, -0.10969595611095428, -0.10572492331266403, -0.10175389051437378, -0.09778285771608353, -0.09381182491779327, -0.08984078466892242, -0.08586975187063217, -0.08189871907234192, -0.07792768627405167, -0.07395665347576141, -0.06998562067747116, -0.06601458787918091, -0.06204355135560036, -0.058072518557310104, -0.05410148575901985, -0.0501304529607296, -0.046159420162439346, -0.042188383638858795, -0.03821735084056854, -0.03424631804227829, -0.030275285243988037, -0.026304252445697784, -0.02233322709798813, -0.018362194299697876, -0.014391160570085049, -0.010420126840472221, -0.006449094042181969, -0.002478061243891716, 0.001492973417043686, 0.005464006215333939, 0.009435039013624191, 0.013406071811914444, 0.017377104610204697, 0.0213481392711401, 0.02531917206943035, 0.029290204867720604, 0.033261239528656006, 0.03723227232694626, 0.04120330512523651, 0.045174337923526764, 0.04914537072181702, 0.05311640352010727, 0.05708743631839752, 0.061058469116687775, 0.06502950191497803, 0.06900054216384888, 0.07297156751155853, 0.07694260030984879, 0.08091363310813904, 0.08488466590642929, 0.08885569870471954, 0.0928267315030098, 0.09679776430130005, 0.1007688045501709, 0.10473983734846115]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 6.0, 10.0, 4.0, 9.0, 17.0, 18.0, 15.0, 21.0, 19.0, 24.0, 33.0, 46.0, 39.0, 52.0, 64.0, 57.0, 65.0, 67.0, 59.0, 46.0, 45.0, 39.0, 27.0, 29.0, 29.0, 33.0, 19.0, 26.0, 22.0, 15.0, 5.0, 9.0, 6.0, 5.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.07515132427215576, -0.07287157326936722, -0.07059182226657867, -0.06831207126379013, -0.06603232026100159, -0.06375257670879364, -0.061472825706005096, -0.05919307470321655, -0.05691332370042801, -0.054633572697639465, -0.05235382169485092, -0.050074074417352676, -0.04779432341456413, -0.04551457241177559, -0.043234825134277344, -0.0409550741314888, -0.038675323128700256, -0.03639557212591171, -0.03411582112312317, -0.031836073845624924, -0.02955632284283638, -0.027276571840047836, -0.024996822699904442, -0.022717073559761047, -0.020437322556972504, -0.01815757155418396, -0.015877822414040565, -0.013598072342574596, -0.011318322271108627, -0.009038572199642658, -0.006758822128176689, -0.004479072988033295, -0.002199321985244751, 8.042808622121811e-05, 0.002360178157687187, 0.004639928229153156, 0.006919678300619125, 0.009199428372085094, 0.011479178443551064, 0.013758927583694458, 0.016038678586483, 0.018318429589271545, 0.02059817872941494, 0.022877927869558334, 0.025157678872346878, 0.027437429875135422, 0.029717179015278816, 0.03199692815542221, 0.034276679158210754, 0.0365564301609993, 0.03883618116378784, 0.04111592844128609, 0.04339567944407463, 0.045675430446863174, 0.04795517772436142, 0.05023492872714996, 0.05251467972993851, 0.05479443073272705, 0.057074181735515594, 0.05935392901301384, 0.06163368001580238, 0.06391342729330063, 0.06619317829608917, 0.06847292929887772, 0.07075268030166626]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 3.0, 17.0, 16.0, 27.0, 47.0, 64.0, 178.0, 365.0, 24806.0, 4167989.0, 334.0, 158.0, 78.0, 51.0, 31.0, 26.0, 10.0, 9.0, 10.0, 5.0, 7.0, 8.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.197021484375, -0.19024276733398438, -0.18346405029296875, -0.17668533325195312, -0.1699066162109375, -0.16312789916992188, -0.15634918212890625, -0.14957046508789062, -0.142791748046875, -0.13601303100585938, -0.12923431396484375, -0.12245559692382812, -0.1156768798828125, -0.10889816284179688, -0.10211944580078125, -0.09534072875976562, -0.08856201171875, -0.08178329467773438, -0.07500457763671875, -0.06822586059570312, -0.0614471435546875, -0.054668426513671875, -0.04788970947265625, -0.041110992431640625, -0.034332275390625, -0.027553558349609375, -0.02077484130859375, -0.013996124267578125, -0.0072174072265625, -0.000438690185546875, 0.00634002685546875, 0.013118743896484375, 0.0198974609375, 0.026676177978515625, 0.03345489501953125, 0.040233612060546875, 0.0470123291015625, 0.053791046142578125, 0.06056976318359375, 0.06734848022460938, 0.074127197265625, 0.08090591430664062, 0.08768463134765625, 0.09446334838867188, 0.1012420654296875, 0.10802078247070312, 0.11479949951171875, 0.12157821655273438, 0.12835693359375, 0.13513565063476562, 0.14191436767578125, 0.14869308471679688, 0.1554718017578125, 0.16225051879882812, 0.16902923583984375, 0.17580795288085938, 0.182586669921875, 0.18936538696289062, 0.19614410400390625, 0.20292282104492188, 0.2097015380859375, 0.21648025512695312, 0.22325897216796875, 0.23003768920898438, 0.23681640625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 10.0, 11.0, 10.0, 27.0, 34.0, 91.0, 127.0, 187.0, 190.0, 108.0, 65.0, 34.0, 17.0, 13.0, 6.0, 9.0, 7.0, 6.0, 4.0, 3.0, 7.0, 2.0, 2.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007343292236328125, -0.007091224193572998, -0.006839156150817871, -0.006587088108062744, -0.006335020065307617, -0.00608295202255249, -0.005830883979797363, -0.005578815937042236, -0.005326747894287109, -0.005074679851531982, -0.0048226118087768555, -0.0045705437660217285, -0.0043184757232666016, -0.004066407680511475, -0.0038143396377563477, -0.0035622715950012207, -0.0033102035522460938, -0.003058135509490967, -0.00280606746673584, -0.002553999423980713, -0.002301931381225586, -0.002049863338470459, -0.001797795295715332, -0.001545727252960205, -0.0012936592102050781, -0.0010415911674499512, -0.0007895231246948242, -0.0005374550819396973, -0.0002853870391845703, -3.331899642944336e-05, 0.0002187490463256836, 0.00047081708908081055, 0.0007228851318359375, 0.0009749531745910645, 0.0012270212173461914, 0.0014790892601013184, 0.0017311573028564453, 0.0019832253456115723, 0.0022352933883666992, 0.002487361431121826, 0.002739429473876953, 0.00299149751663208, 0.003243565559387207, 0.003495633602142334, 0.003747701644897461, 0.003999769687652588, 0.004251837730407715, 0.004503905773162842, 0.004755973815917969, 0.005008041858673096, 0.005260109901428223, 0.00551217794418335, 0.0057642459869384766, 0.0060163140296936035, 0.0062683820724487305, 0.006520450115203857, 0.006772518157958984, 0.007024586200714111, 0.007276654243469238, 0.007528722286224365, 0.007780790328979492, 0.00803285837173462, 0.008284926414489746, 0.008536994457244873, 0.0087890625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 10.0, 13.0, 23.0, 30.0, 44.0, 78.0, 121.0, 227.0, 361.0, 668.0, 1237.0, 2546.0, 5282.0, 13430.0, 44260.0, 813420.0, 3219677.0, 62861.0, 16543.0, 6500.0, 3004.0, 1545.0, 896.0, 551.0, 319.0, 210.0, 143.0, 91.0, 58.0, 40.0, 27.0, 20.0, 17.0, 9.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.008575439453125, -0.008331239223480225, -0.00808703899383545, -0.007842838764190674, -0.0075986385345458984, -0.007354438304901123, -0.007110238075256348, -0.006866037845611572, -0.006621837615966797, -0.0063776373863220215, -0.006133437156677246, -0.005889236927032471, -0.005645036697387695, -0.00540083646774292, -0.0051566362380981445, -0.004912436008453369, -0.004668235778808594, -0.004424035549163818, -0.004179835319519043, -0.003935635089874268, -0.003691434860229492, -0.003447234630584717, -0.0032030344009399414, -0.002958834171295166, -0.0027146339416503906, -0.0024704337120056152, -0.00222623348236084, -0.0019820332527160645, -0.001737833023071289, -0.0014936327934265137, -0.0012494325637817383, -0.0010052323341369629, -0.0007610321044921875, -0.0005168318748474121, -0.0002726316452026367, -2.8431415557861328e-05, 0.00021576881408691406, 0.00045996904373168945, 0.0007041692733764648, 0.0009483695030212402, 0.0011925697326660156, 0.001436769962310791, 0.0016809701919555664, 0.0019251704216003418, 0.002169370651245117, 0.0024135708808898926, 0.002657771110534668, 0.0029019713401794434, 0.0031461715698242188, 0.003390371799468994, 0.0036345720291137695, 0.003878772258758545, 0.00412297248840332, 0.004367172718048096, 0.004611372947692871, 0.0048555731773376465, 0.005099773406982422, 0.005343973636627197, 0.005588173866271973, 0.005832374095916748, 0.0060765743255615234, 0.006320774555206299, 0.006564974784851074, 0.00680917501449585, 0.007053375244140625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 1.0, 2.0, 7.0, 5.0, 6.0, 7.0, 7.0, 14.0, 16.0, 19.0, 22.0, 37.0, 52.0, 131.0, 368.0, 1107.0, 1390.0, 501.0, 172.0, 58.0, 27.0, 22.0, 18.0, 21.0, 5.0, 11.0, 8.0, 8.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007122039794921875, -0.0068686604499816895, -0.006615281105041504, -0.006361901760101318, -0.006108522415161133, -0.005855143070220947, -0.005601763725280762, -0.005348384380340576, -0.005095005035400391, -0.004841625690460205, -0.0045882463455200195, -0.004334867000579834, -0.0040814876556396484, -0.003828108310699463, -0.0035747289657592773, -0.003321349620819092, -0.0030679702758789062, -0.0028145909309387207, -0.002561211585998535, -0.0023078322410583496, -0.002054452896118164, -0.0018010735511779785, -0.001547694206237793, -0.0012943148612976074, -0.0010409355163574219, -0.0007875561714172363, -0.0005341768264770508, -0.00028079748153686523, -2.7418136596679688e-05, 0.00022596120834350586, 0.0004793405532836914, 0.000732719898223877, 0.0009860992431640625, 0.001239478588104248, 0.0014928579330444336, 0.0017462372779846191, 0.0019996166229248047, 0.0022529959678649902, 0.0025063753128051758, 0.0027597546577453613, 0.003013134002685547, 0.0032665133476257324, 0.003519892692565918, 0.0037732720375061035, 0.004026651382446289, 0.004280030727386475, 0.00453341007232666, 0.004786789417266846, 0.005040168762207031, 0.005293548107147217, 0.005546927452087402, 0.005800306797027588, 0.0060536861419677734, 0.006307065486907959, 0.0065604448318481445, 0.00681382417678833, 0.007067203521728516, 0.007320582866668701, 0.007573962211608887, 0.007827341556549072, 0.008080720901489258, 0.008334100246429443, 0.008587479591369629, 0.008840858936309814, 0.00909423828125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 9.0, 7.0, 15.0, 47.0, 85.0, 205.0, 257.0, 157.0, 78.0, 53.0, 32.0, 10.0, 19.0, 16.0, 4.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0763329565525055, -0.07402196526527405, -0.0717109739780426, -0.06939999014139175, -0.06708899885416031, -0.06477800756692886, -0.06246701627969742, -0.06015602499246597, -0.057845037430524826, -0.05553404614329338, -0.053223058581352234, -0.05091206729412079, -0.04860107600688934, -0.046290088444948196, -0.04397909715771675, -0.041668109595775604, -0.03935711830854416, -0.037046127021312714, -0.03473513945937157, -0.03242414817214012, -0.030113158747553825, -0.02780216932296753, -0.025491178035736084, -0.023180188611149788, -0.020869199186563492, -0.018558209761977196, -0.0162472203373909, -0.013936229050159454, -0.011625239625573158, -0.009314250200986862, -0.0070032598450779915, -0.004692269489169121, -0.002381272614002228, -7.02827237546444e-05, 0.002240707166492939, 0.004551697056740522, 0.006862686946988106, 0.009173676371574402, 0.011484666727483273, 0.013795657083392143, 0.01610664650797844, 0.018417635932564735, 0.02072862535715103, 0.023039616644382477, 0.025350606068968773, 0.02766159549355507, 0.029972586780786514, 0.03228357434272766, 0.034594565629959106, 0.03690555691719055, 0.0392165444791317, 0.041527535766363144, 0.04383852332830429, 0.046149514615535736, 0.04846050590276718, 0.05077149718999863, 0.053082484751939774, 0.05539347603917122, 0.057704463601112366, 0.06001545488834381, 0.062326446175575256, 0.0646374374628067, 0.06694842129945755, 0.069259412586689, 0.07157040387392044]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 10.0, 6.0, 11.0, 7.0, 17.0, 18.0, 20.0, 11.0, 23.0, 33.0, 30.0, 41.0, 35.0, 49.0, 60.0, 49.0, 55.0, 48.0, 64.0, 57.0, 48.0, 38.0, 35.0, 46.0, 33.0, 24.0, 26.0, 29.0, 16.0, 11.0, 13.0, 10.0, 8.0, 6.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031122207641601562, -0.0300825834274292, -0.029042961075901985, -0.02800333872437477, -0.026963714510202408, -0.025924090296030045, -0.02488446794450283, -0.023844845592975616, -0.022805221378803253, -0.02176559716463089, -0.020725974813103676, -0.019686352461576462, -0.0186467282474041, -0.017607104033231735, -0.01656748168170452, -0.015527858398854733, -0.014488235116004944, -0.013448611833155155, -0.012408988550305367, -0.011369365267455578, -0.01032974198460579, -0.009290118701756, -0.008250495418906212, -0.007210872136056423, -0.0061712488532066345, -0.005131625570356846, -0.004092002287507057, -0.0030523790046572685, -0.00201275572180748, -0.0009731324389576912, 6.649084389209747e-05, 0.0011061141267418861, 0.002145737409591675, 0.0031853606924414635, 0.004224983975291252, 0.005264607258141041, 0.0063042305409908295, 0.007343853823840618, 0.008383477106690407, 0.009423100389540195, 0.010462723672389984, 0.011502346955239773, 0.012541970238089561, 0.01358159352093935, 0.014621216803789139, 0.015660841017961502, 0.016700463369488716, 0.01774008572101593, 0.018779709935188293, 0.019819334149360657, 0.02085895650088787, 0.021898578852415085, 0.022938203066587448, 0.02397782728075981, 0.025017449632287025, 0.02605707198381424, 0.027096696197986603, 0.028136320412158966, 0.02917594276368618, 0.030215565115213394, 0.03125518932938576, 0.03229481354355812, 0.033334434032440186, 0.03437405824661255, 0.03541368246078491]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 7.0, 8.0, 11.0, 9.0, 20.0, 29.0, 34.0, 49.0, 80.0, 85.0, 134.0, 188.0, 260.0, 408.0, 616.0, 950.0, 1478.0, 2593.0, 4866.0, 10977.0, 32896.0, 297758.0, 619453.0, 48792.0, 13367.0, 5621.0, 2880.0, 1720.0, 1054.0, 643.0, 462.0, 307.0, 220.0, 149.0, 120.0, 75.0, 65.0, 45.0, 34.0, 22.0, 25.0, 9.0, 5.0, 13.0, 4.0, 8.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01190948486328125, -0.01150059700012207, -0.01109170913696289, -0.010682821273803711, -0.010273933410644531, -0.009865045547485352, -0.009456157684326172, -0.009047269821166992, -0.008638381958007812, -0.008229494094848633, -0.007820606231689453, -0.0074117183685302734, -0.007002830505371094, -0.006593942642211914, -0.006185054779052734, -0.005776166915893555, -0.005367279052734375, -0.004958391189575195, -0.004549503326416016, -0.004140615463256836, -0.0037317276000976562, -0.0033228397369384766, -0.002913951873779297, -0.002505064010620117, -0.0020961761474609375, -0.0016872882843017578, -0.0012784004211425781, -0.0008695125579833984, -0.00046062469482421875, -5.173683166503906e-05, 0.0003571510314941406, 0.0007660388946533203, 0.0011749267578125, 0.0015838146209716797, 0.0019927024841308594, 0.002401590347290039, 0.0028104782104492188, 0.0032193660736083984, 0.003628253936767578, 0.004037141799926758, 0.0044460296630859375, 0.004854917526245117, 0.005263805389404297, 0.0056726932525634766, 0.006081581115722656, 0.006490468978881836, 0.006899356842041016, 0.007308244705200195, 0.007717132568359375, 0.008126020431518555, 0.008534908294677734, 0.008943796157836914, 0.009352684020996094, 0.009761571884155273, 0.010170459747314453, 0.010579347610473633, 0.010988235473632812, 0.011397123336791992, 0.011806011199951172, 0.012214899063110352, 0.012623786926269531, 0.013032674789428711, 0.01344156265258789, 0.01385045051574707, 0.01425933837890625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 6.0, 8.0, 16.0, 22.0, 52.0, 85.0, 136.0, 173.0, 153.0, 139.0, 77.0, 37.0, 12.0, 12.0, 8.0, 6.0, 7.0, 6.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007404327392578125, -0.007149875164031982, -0.00689542293548584, -0.006640970706939697, -0.006386518478393555, -0.006132066249847412, -0.0058776140213012695, -0.005623161792755127, -0.005368709564208984, -0.005114257335662842, -0.004859805107116699, -0.004605352878570557, -0.004350900650024414, -0.0040964484214782715, -0.003841996192932129, -0.0035875439643859863, -0.0033330917358398438, -0.003078639507293701, -0.0028241872787475586, -0.002569735050201416, -0.0023152828216552734, -0.002060830593109131, -0.0018063783645629883, -0.0015519261360168457, -0.0012974739074707031, -0.0010430216789245605, -0.000788569450378418, -0.0005341172218322754, -0.0002796649932861328, -2.5212764739990234e-05, 0.00022923946380615234, 0.0004836916923522949, 0.0007381439208984375, 0.00099259614944458, 0.0012470483779907227, 0.0015015006065368652, 0.0017559528350830078, 0.0020104050636291504, 0.002264857292175293, 0.0025193095207214355, 0.002773761749267578, 0.0030282139778137207, 0.0032826662063598633, 0.003537118434906006, 0.0037915706634521484, 0.004046022891998291, 0.004300475120544434, 0.004554927349090576, 0.004809379577636719, 0.005063831806182861, 0.005318284034729004, 0.0055727362632751465, 0.005827188491821289, 0.006081640720367432, 0.006336092948913574, 0.006590545177459717, 0.006844997406005859, 0.007099449634552002, 0.0073539018630981445, 0.007608354091644287, 0.00786280632019043, 0.008117258548736572, 0.008371710777282715, 0.008626163005828857, 0.008880615234375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 10.0, 3.0, 9.0, 8.0, 6.0, 9.0, 13.0, 29.0, 34.0, 55.0, 73.0, 93.0, 123.0, 174.0, 261.0, 362.0, 532.0, 958.0, 1805.0, 3726.0, 9992.0, 38042.0, 259903.0, 629901.0, 75074.0, 16282.0, 5278.0, 2407.0, 1221.0, 700.0, 439.0, 306.0, 186.0, 140.0, 106.0, 72.0, 61.0, 46.0, 18.0, 17.0, 20.0, 14.0, 11.0, 9.0, 6.0, 12.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.01168060302734375, -0.011339068412780762, -0.010997533798217773, -0.010655999183654785, -0.010314464569091797, -0.009972929954528809, -0.00963139533996582, -0.009289860725402832, -0.008948326110839844, -0.008606791496276855, -0.008265256881713867, -0.007923722267150879, -0.007582187652587891, -0.007240653038024902, -0.006899118423461914, -0.006557583808898926, -0.0062160491943359375, -0.005874514579772949, -0.005532979965209961, -0.005191445350646973, -0.004849910736083984, -0.004508376121520996, -0.004166841506958008, -0.0038253068923950195, -0.0034837722778320312, -0.003142237663269043, -0.0028007030487060547, -0.0024591684341430664, -0.002117633819580078, -0.0017760992050170898, -0.0014345645904541016, -0.0010930299758911133, -0.000751495361328125, -0.0004099607467651367, -6.842613220214844e-05, 0.00027310848236083984, 0.0006146430969238281, 0.0009561777114868164, 0.0012977123260498047, 0.001639246940612793, 0.0019807815551757812, 0.0023223161697387695, 0.002663850784301758, 0.003005385398864746, 0.0033469200134277344, 0.0036884546279907227, 0.004029989242553711, 0.004371523857116699, 0.0047130584716796875, 0.005054593086242676, 0.005396127700805664, 0.005737662315368652, 0.006079196929931641, 0.006420731544494629, 0.006762266159057617, 0.0071038007736206055, 0.007445335388183594, 0.007786870002746582, 0.00812840461730957, 0.008469939231872559, 0.008811473846435547, 0.009153008460998535, 0.009494543075561523, 0.009836077690124512, 0.0101776123046875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 2.0, 12.0, 13.0, 15.0, 22.0, 28.0, 23.0, 27.0, 23.0, 25.0, 51.0, 37.0, 46.0, 45.0, 55.0, 42.0, 53.0, 40.0, 44.0, 41.0, 36.0, 33.0, 39.0, 47.0, 31.0, 29.0, 19.0, 21.0, 18.0, 14.0, 13.0, 14.0, 4.0, 4.0, 3.0, 5.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.016937255859375, -0.016460657119750977, -0.015984058380126953, -0.01550745964050293, -0.015030860900878906, -0.014554262161254883, -0.01407766342163086, -0.013601064682006836, -0.013124465942382812, -0.012647867202758789, -0.012171268463134766, -0.011694669723510742, -0.011218070983886719, -0.010741472244262695, -0.010264873504638672, -0.009788274765014648, -0.009311676025390625, -0.008835077285766602, -0.008358478546142578, -0.007881879806518555, -0.007405281066894531, -0.006928682327270508, -0.006452083587646484, -0.005975484848022461, -0.0054988861083984375, -0.005022287368774414, -0.004545688629150391, -0.004069089889526367, -0.0035924911499023438, -0.0031158924102783203, -0.002639293670654297, -0.0021626949310302734, -0.00168609619140625, -0.0012094974517822266, -0.0007328987121582031, -0.0002562999725341797, 0.00022029876708984375, 0.0006968975067138672, 0.0011734962463378906, 0.001650094985961914, 0.0021266937255859375, 0.002603292465209961, 0.0030798912048339844, 0.003556489944458008, 0.004033088684082031, 0.004509687423706055, 0.004986286163330078, 0.0054628849029541016, 0.005939483642578125, 0.0064160823822021484, 0.006892681121826172, 0.007369279861450195, 0.007845878601074219, 0.008322477340698242, 0.008799076080322266, 0.009275674819946289, 0.009752273559570312, 0.010228872299194336, 0.01070547103881836, 0.011182069778442383, 0.011658668518066406, 0.01213526725769043, 0.012611865997314453, 0.013088464736938477, 0.0135650634765625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 5.0, 11.0, 7.0, 13.0, 17.0, 18.0, 46.0, 63.0, 123.0, 216.0, 490.0, 1072.0, 2793.0, 8046.0, 40662.0, 840008.0, 133517.0, 14357.0, 4132.0, 1614.0, 650.0, 312.0, 132.0, 85.0, 49.0, 38.0, 14.0, 18.0, 11.0, 12.0, 5.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0029125213623046875, -0.002826124429702759, -0.00273972749710083, -0.0026533305644989014, -0.0025669336318969727, -0.002480536699295044, -0.0023941397666931152, -0.0023077428340911865, -0.002221345901489258, -0.002134948968887329, -0.0020485520362854004, -0.0019621551036834717, -0.001875758171081543, -0.0017893612384796143, -0.0017029643058776855, -0.0016165673732757568, -0.0015301704406738281, -0.0014437735080718994, -0.0013573765754699707, -0.001270979642868042, -0.0011845827102661133, -0.0010981857776641846, -0.0010117888450622559, -0.0009253919124603271, -0.0008389949798583984, -0.0007525980472564697, -0.000666201114654541, -0.0005798041820526123, -0.0004934072494506836, -0.0004070103168487549, -0.00032061338424682617, -0.00023421645164489746, -0.00014781951904296875, -6.142258644104004e-05, 2.4974346160888672e-05, 0.00011137127876281738, 0.0001977682113647461, 0.0002841651439666748, 0.0003705620765686035, 0.0004569590091705322, 0.0005433559417724609, 0.0006297528743743896, 0.0007161498069763184, 0.0008025467395782471, 0.0008889436721801758, 0.0009753406047821045, 0.0010617375373840332, 0.001148134469985962, 0.0012345314025878906, 0.0013209283351898193, 0.001407325267791748, 0.0014937222003936768, 0.0015801191329956055, 0.0016665160655975342, 0.0017529129981994629, 0.0018393099308013916, 0.0019257068634033203, 0.002012103796005249, 0.0020985007286071777, 0.0021848976612091064, 0.002271294593811035, 0.002357691526412964, 0.0024440884590148926, 0.0025304853916168213, 0.00261688232421875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 2.0, 6.0, 4.0, 9.0, 4.0, 7.0, 13.0, 17.0, 12.0, 8.0, 23.0, 22.0, 13.0, 45.0, 19.0, 24.0, 32.0, 42.0, 49.0, 26.0, 42.0, 50.0, 19.0, 46.0, 44.0, 51.0, 21.0, 54.0, 42.0, 13.0, 37.0, 37.0, 20.0, 28.0, 18.0, 25.0, 12.0, 11.0, 10.0, 6.0, 14.0, 3.0, 2.0, 4.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-3.4570693969726562e-06, -3.355555236339569e-06, -3.254041075706482e-06, -3.1525269150733948e-06, -3.0510127544403076e-06, -2.9494985938072205e-06, -2.8479844331741333e-06, -2.746470272541046e-06, -2.644956111907959e-06, -2.543441951274872e-06, -2.4419277906417847e-06, -2.3404136300086975e-06, -2.2388994693756104e-06, -2.137385308742523e-06, -2.035871148109436e-06, -1.934356987476349e-06, -1.8328428268432617e-06, -1.7313286662101746e-06, -1.6298145055770874e-06, -1.5283003449440002e-06, -1.426786184310913e-06, -1.325272023677826e-06, -1.2237578630447388e-06, -1.1222437024116516e-06, -1.0207295417785645e-06, -9.192153811454773e-07, -8.177012205123901e-07, -7.16187059879303e-07, -6.146728992462158e-07, -5.131587386131287e-07, -4.116445779800415e-07, -3.1013041734695435e-07, -2.086162567138672e-07, -1.0710209608078003e-07, -5.587935447692871e-09, 9.592622518539429e-08, 1.9744038581848145e-07, 2.989545464515686e-07, 4.0046870708465576e-07, 5.019828677177429e-07, 6.034970283508301e-07, 7.050111889839172e-07, 8.065253496170044e-07, 9.080395102500916e-07, 1.0095536708831787e-06, 1.1110678315162659e-06, 1.212581992149353e-06, 1.3140961527824402e-06, 1.4156103134155273e-06, 1.5171244740486145e-06, 1.6186386346817017e-06, 1.7201527953147888e-06, 1.821666955947876e-06, 1.923181116580963e-06, 2.0246952772140503e-06, 2.1262094378471375e-06, 2.2277235984802246e-06, 2.3292377591133118e-06, 2.430751919746399e-06, 2.532266080379486e-06, 2.6337802410125732e-06, 2.7352944016456604e-06, 2.8368085622787476e-06, 2.9383227229118347e-06, 3.039836883544922e-06]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 8.0, 5.0, 6.0, 16.0, 14.0, 30.0, 47.0, 52.0, 78.0, 128.0, 190.0, 294.0, 614.0, 1287.0, 3043.0, 9196.0, 47904.0, 810208.0, 150891.0, 16280.0, 4482.0, 1810.0, 822.0, 397.0, 301.0, 130.0, 92.0, 58.0, 45.0, 29.0, 34.0, 16.0, 13.0, 8.0, 9.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00278472900390625, -0.0027067363262176514, -0.0026287436485290527, -0.002550750970840454, -0.0024727582931518555, -0.002394765615463257, -0.002316772937774658, -0.0022387802600860596, -0.002160787582397461, -0.0020827949047088623, -0.0020048022270202637, -0.001926809549331665, -0.0018488168716430664, -0.0017708241939544678, -0.0016928315162658691, -0.0016148388385772705, -0.0015368461608886719, -0.0014588534832000732, -0.0013808608055114746, -0.001302868127822876, -0.0012248754501342773, -0.0011468827724456787, -0.00106889009475708, -0.0009908974170684814, -0.0009129047393798828, -0.0008349120616912842, -0.0007569193840026855, -0.0006789267063140869, -0.0006009340286254883, -0.0005229413509368896, -0.000444948673248291, -0.0003669559955596924, -0.00028896331787109375, -0.00021097064018249512, -0.00013297796249389648, -5.498528480529785e-05, 2.300739288330078e-05, 0.00010100007057189941, 0.00017899274826049805, 0.0002569854259490967, 0.0003349781036376953, 0.00041297078132629395, 0.0004909634590148926, 0.0005689561367034912, 0.0006469488143920898, 0.0007249414920806885, 0.0008029341697692871, 0.0008809268474578857, 0.0009589195251464844, 0.001036912202835083, 0.0011149048805236816, 0.0011928975582122803, 0.001270890235900879, 0.0013488829135894775, 0.0014268755912780762, 0.0015048682689666748, 0.0015828609466552734, 0.001660853624343872, 0.0017388463020324707, 0.0018168389797210693, 0.001894831657409668, 0.0019728243350982666, 0.0020508170127868652, 0.002128809690475464, 0.0022068023681640625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 7.0, 0.0, 4.0, 11.0, 8.0, 4.0, 13.0, 22.0, 30.0, 40.0, 49.0, 107.0, 105.0, 104.0, 116.0, 97.0, 79.0, 57.0, 41.0, 28.0, 16.0, 17.0, 14.0, 8.0, 6.0, 3.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032978057861328125, -0.0032031238079071045, -0.0031084418296813965, -0.0030137598514556885, -0.0029190778732299805, -0.0028243958950042725, -0.0027297139167785645, -0.0026350319385528564, -0.0025403499603271484, -0.0024456679821014404, -0.0023509860038757324, -0.0022563040256500244, -0.0021616220474243164, -0.0020669400691986084, -0.0019722580909729004, -0.0018775761127471924, -0.0017828941345214844, -0.0016882121562957764, -0.0015935301780700684, -0.0014988481998443604, -0.0014041662216186523, -0.0013094842433929443, -0.0012148022651672363, -0.0011201202869415283, -0.0010254383087158203, -0.0009307563304901123, -0.0008360743522644043, -0.0007413923740386963, -0.0006467103958129883, -0.0005520284175872803, -0.00045734643936157227, -0.00036266446113586426, -0.00026798248291015625, -0.00017330050468444824, -7.861852645874023e-05, 1.6063451766967773e-05, 0.00011074542999267578, 0.0002054274082183838, 0.0003001093864440918, 0.0003947913646697998, 0.0004894733428955078, 0.0005841553211212158, 0.0006788372993469238, 0.0007735192775726318, 0.0008682012557983398, 0.0009628832340240479, 0.0010575652122497559, 0.0011522471904754639, 0.0012469291687011719, 0.0013416111469268799, 0.0014362931251525879, 0.001530975103378296, 0.001625657081604004, 0.001720339059829712, 0.00181502103805542, 0.001909703016281128, 0.002004384994506836, 0.002099066972732544, 0.002193748950958252, 0.00228843092918396, 0.002383112907409668, 0.002477794885635376, 0.002572476863861084, 0.002667158842086792, 0.0027618408203125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 4.0, 4.0, 23.0, 38.0, 152.0, 391.0, 231.0, 77.0, 42.0, 16.0, 11.0, 7.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10761038213968277, -0.10356015712022781, -0.09950992465019226, -0.0954596996307373, -0.09140946716070175, -0.0873592421412468, -0.08330900967121124, -0.07925878465175629, -0.07520855963230133, -0.07115833461284637, -0.06710810214281082, -0.06305787712335587, -0.05900764465332031, -0.054957419633865356, -0.0509071908891201, -0.04685696214437485, -0.042806729674339294, -0.03875650092959404, -0.034706272184848785, -0.03065604530274868, -0.026605816558003426, -0.02255558781325817, -0.018505360931158066, -0.014455132186412811, -0.010404903441667557, -0.0063546751625835896, -0.0023044468834996223, 0.0017457809299230576, 0.005796009674668312, 0.009846238419413567, 0.013896465301513672, 0.017946694046258926, 0.021996930241584778, 0.026047158986330032, 0.030097387731075287, 0.03414761275053024, 0.038197845220565796, 0.04224807024002075, 0.046298298984766006, 0.05034852772951126, 0.054398756474256516, 0.05844898521900177, 0.062499213963747025, 0.06654944270849228, 0.07059966772794724, 0.07464990019798279, 0.07870012521743774, 0.0827503502368927, 0.08680058270692825, 0.09085080772638321, 0.09490104019641876, 0.09895126521587372, 0.10300149768590927, 0.10705172270536423, 0.11110195517539978, 0.11515218019485474, 0.11920240521430969, 0.12325263023376465, 0.1273028552532196, 0.13135309517383575, 0.1354033201932907, 0.13945354521274567, 0.14350377023220062, 0.14755401015281677, 0.15160423517227173]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 4.0, 7.0, 3.0, 4.0, 7.0, 13.0, 10.0, 13.0, 11.0, 15.0, 12.0, 20.0, 18.0, 22.0, 28.0, 31.0, 35.0, 37.0, 40.0, 39.0, 50.0, 60.0, 66.0, 61.0, 53.0, 38.0, 36.0, 41.0, 31.0, 20.0, 24.0, 24.0, 21.0, 16.0, 19.0, 10.0, 14.0, 14.0, 5.0, 7.0, 3.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056395113468170166, -0.05458729341626167, -0.05277947336435318, -0.050971657037734985, -0.04916383698582649, -0.047356016933918, -0.045548200607299805, -0.04374038055539131, -0.04193256050348282, -0.040124740451574326, -0.03831692039966583, -0.03650910407304764, -0.034701284021139145, -0.03289346396923065, -0.031085645779967308, -0.029277827590703964, -0.02747000753879547, -0.025662187486886978, -0.023854369297623634, -0.02204655110836029, -0.020238731056451797, -0.018430911004543304, -0.01662309281527996, -0.014815273694694042, -0.013007454574108124, -0.011199635453522205, -0.009391816332936287, -0.0075839972123503685, -0.00577617809176445, -0.003968358971178532, -0.0021605398505926132, -0.0003527207300066948, 0.0014550983905792236, 0.003262917511165142, 0.0050707366317510605, 0.006878555752336979, 0.008686374872922897, 0.010494193993508816, 0.012302013114094734, 0.014109832234680653, 0.01591765135526657, 0.017725471407175064, 0.019533289596438408, 0.02134110778570175, 0.023148927837610245, 0.024956747889518738, 0.02676456607878208, 0.028572384268045425, 0.03038020431995392, 0.03218802437186241, 0.033995844423770905, 0.0358036607503891, 0.03761148080229759, 0.039419300854206085, 0.04122711718082428, 0.04303493723273277, 0.044842757284641266, 0.04665057733654976, 0.04845839738845825, 0.05026621371507645, 0.05207403376698494, 0.05388185381889343, 0.05568967014551163, 0.05749749019742012, 0.05930531024932861]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 9.0, 16.0, 25.0, 36.0, 49.0, 94.0, 212.0, 568.0, 1558.0, 4551.0, 16145.0, 87498.0, 1683851.0, 2298952.0, 80493.0, 14010.0, 3870.0, 1354.0, 492.0, 196.0, 106.0, 64.0, 42.0, 28.0, 21.0, 10.0, 4.0, 8.0, 6.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004486083984375, -0.004331529140472412, -0.004176974296569824, -0.004022419452667236, -0.0038678646087646484, -0.0037133097648620605, -0.0035587549209594727, -0.0034042000770568848, -0.003249645233154297, -0.003095090389251709, -0.002940535545349121, -0.002785980701446533, -0.0026314258575439453, -0.0024768710136413574, -0.0023223161697387695, -0.0021677613258361816, -0.0020132064819335938, -0.0018586516380310059, -0.001704096794128418, -0.00154954195022583, -0.0013949871063232422, -0.0012404322624206543, -0.0010858774185180664, -0.0009313225746154785, -0.0007767677307128906, -0.0006222128868103027, -0.00046765804290771484, -0.00031310319900512695, -0.00015854835510253906, -3.993511199951172e-06, 0.00015056133270263672, 0.0003051161766052246, 0.0004596710205078125, 0.0006142258644104004, 0.0007687807083129883, 0.0009233355522155762, 0.001077890396118164, 0.001232445240020752, 0.0013870000839233398, 0.0015415549278259277, 0.0016961097717285156, 0.0018506646156311035, 0.0020052194595336914, 0.0021597743034362793, 0.002314329147338867, 0.002468883991241455, 0.002623438835144043, 0.002777993679046631, 0.0029325485229492188, 0.0030871033668518066, 0.0032416582107543945, 0.0033962130546569824, 0.0035507678985595703, 0.003705322742462158, 0.003859877586364746, 0.004014432430267334, 0.004168987274169922, 0.00432354211807251, 0.004478096961975098, 0.0046326518058776855, 0.0047872066497802734, 0.004941761493682861, 0.005096316337585449, 0.005250871181488037, 0.005405426025390625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 9.0, 11.0, 28.0, 46.0, 58.0, 79.0, 106.0, 140.0, 129.0, 108.0, 86.0, 46.0, 40.0, 34.0, 20.0, 8.0, 10.0, 10.0, 8.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007427215576171875, -0.007173478603363037, -0.006919741630554199, -0.006666004657745361, -0.0064122676849365234, -0.0061585307121276855, -0.005904793739318848, -0.00565105676651001, -0.005397319793701172, -0.005143582820892334, -0.004889845848083496, -0.004636108875274658, -0.00438237190246582, -0.004128634929656982, -0.0038748979568481445, -0.0036211609840393066, -0.0033674240112304688, -0.003113687038421631, -0.002859950065612793, -0.002606213092803955, -0.002352476119995117, -0.0020987391471862793, -0.0018450021743774414, -0.0015912652015686035, -0.0013375282287597656, -0.0010837912559509277, -0.0008300542831420898, -0.000576317310333252, -0.00032258033752441406, -6.884336471557617e-05, 0.00018489360809326172, 0.0004386305809020996, 0.0006923675537109375, 0.0009461045265197754, 0.0011998414993286133, 0.0014535784721374512, 0.001707315444946289, 0.001961052417755127, 0.002214789390563965, 0.0024685263633728027, 0.0027222633361816406, 0.0029760003089904785, 0.0032297372817993164, 0.0034834742546081543, 0.003737211227416992, 0.00399094820022583, 0.004244685173034668, 0.004498422145843506, 0.004752159118652344, 0.005005896091461182, 0.0052596330642700195, 0.005513370037078857, 0.005767107009887695, 0.006020843982696533, 0.006274580955505371, 0.006528317928314209, 0.006782054901123047, 0.007035791873931885, 0.007289528846740723, 0.0075432658195495605, 0.0077970027923583984, 0.008050739765167236, 0.008304476737976074, 0.008558213710784912, 0.00881195068359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 10.0, 14.0, 15.0, 23.0, 45.0, 70.0, 128.0, 224.0, 398.0, 840.0, 1920.0, 5238.0, 17486.0, 90010.0, 3655546.0, 374765.0, 31616.0, 9429.0, 3482.0, 1412.0, 686.0, 339.0, 183.0, 135.0, 92.0, 65.0, 37.0, 23.0, 14.0, 10.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0050811767578125, -0.004915714263916016, -0.004750251770019531, -0.004584789276123047, -0.0044193267822265625, -0.004253864288330078, -0.004088401794433594, -0.003922939300537109, -0.003757476806640625, -0.0035920143127441406, -0.0034265518188476562, -0.003261089324951172, -0.0030956268310546875, -0.002930164337158203, -0.0027647018432617188, -0.0025992393493652344, -0.00243377685546875, -0.0022683143615722656, -0.0021028518676757812, -0.0019373893737792969, -0.0017719268798828125, -0.0016064643859863281, -0.0014410018920898438, -0.0012755393981933594, -0.001110076904296875, -0.0009446144104003906, -0.0007791519165039062, -0.0006136894226074219, -0.0004482269287109375, -0.0002827644348144531, -0.00011730194091796875, 4.8160552978515625e-05, 0.000213623046875, 0.0003790855407714844, 0.0005445480346679688, 0.0007100105285644531, 0.0008754730224609375, 0.0010409355163574219, 0.0012063980102539062, 0.0013718605041503906, 0.001537322998046875, 0.0017027854919433594, 0.0018682479858398438, 0.002033710479736328, 0.0021991729736328125, 0.002364635467529297, 0.0025300979614257812, 0.0026955604553222656, 0.00286102294921875, 0.0030264854431152344, 0.0031919479370117188, 0.003357410430908203, 0.0035228729248046875, 0.003688335418701172, 0.0038537979125976562, 0.004019260406494141, 0.004184722900390625, 0.004350185394287109, 0.004515647888183594, 0.004681110382080078, 0.0048465728759765625, 0.005012035369873047, 0.005177497863769531, 0.005342960357666016, 0.0055084228515625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 5.0, 6.0, 8.0, 13.0, 19.0, 12.0, 26.0, 58.0, 136.0, 353.0, 960.0, 1305.0, 717.0, 235.0, 82.0, 35.0, 17.0, 11.0, 13.0, 10.0, 10.0, 7.0, 13.0, 3.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006290435791015625, -0.006067931652069092, -0.005845427513122559, -0.005622923374176025, -0.005400419235229492, -0.005177915096282959, -0.004955410957336426, -0.004732906818389893, -0.004510402679443359, -0.004287898540496826, -0.004065394401550293, -0.0038428902626037598, -0.0036203861236572266, -0.0033978819847106934, -0.00317537784576416, -0.002952873706817627, -0.0027303695678710938, -0.0025078654289245605, -0.0022853612899780273, -0.002062857151031494, -0.001840353012084961, -0.0016178488731384277, -0.0013953447341918945, -0.0011728405952453613, -0.0009503364562988281, -0.0007278323173522949, -0.0005053281784057617, -0.0002828240394592285, -6.031990051269531e-05, 0.0001621842384338379, 0.0003846883773803711, 0.0006071925163269043, 0.0008296966552734375, 0.0010522007942199707, 0.001274704933166504, 0.0014972090721130371, 0.0017197132110595703, 0.0019422173500061035, 0.0021647214889526367, 0.00238722562789917, 0.002609729766845703, 0.0028322339057922363, 0.0030547380447387695, 0.0032772421836853027, 0.003499746322631836, 0.003722250461578369, 0.003944754600524902, 0.0041672587394714355, 0.004389762878417969, 0.004612267017364502, 0.004834771156311035, 0.005057275295257568, 0.0052797794342041016, 0.005502283573150635, 0.005724787712097168, 0.005947291851043701, 0.006169795989990234, 0.006392300128936768, 0.006614804267883301, 0.006837308406829834, 0.007059812545776367, 0.0072823166847229, 0.007504820823669434, 0.007727324962615967, 0.0079498291015625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 10.0, 7.0, 34.0, 58.0, 140.0, 223.0, 236.0, 154.0, 57.0, 41.0, 9.0, 9.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046362124383449554, -0.04495404660701752, -0.04354596510529518, -0.042137887328863144, -0.04072980582714081, -0.03932172805070877, -0.03791365027427673, -0.036505572497844696, -0.03509749099612236, -0.03368941321969032, -0.03228133171796799, -0.03087325394153595, -0.029465174302458763, -0.028057094663381577, -0.02664901688694954, -0.025240937247872353, -0.023832857608795166, -0.02242477796971798, -0.021016698330640793, -0.019608620554208755, -0.01820054091513157, -0.016792461276054382, -0.01538438256829977, -0.013976303860545158, -0.012568224221467972, -0.011160144582390785, -0.009752065874636173, -0.008343987166881561, -0.006935907527804375, -0.005527828354388475, -0.004119749180972576, -0.002711670473217964, -0.0013035908341407776, 0.00010448833927512169, 0.001512567512691021, 0.0029206466861069202, 0.0043287258595228195, 0.005736805032938719, 0.007144884206354618, 0.00855296291410923, 0.009961042553186417, 0.011369122192263603, 0.012777200900018215, 0.014185279607772827, 0.015593359246850014, 0.0170014388859272, 0.018409516662359238, 0.019817596301436424, 0.02122567594051361, 0.022633755579590797, 0.024041835218667984, 0.02544991299510002, 0.026857992634177208, 0.028266072273254395, 0.029674150049686432, 0.03108222968876362, 0.032490309327840805, 0.03389838710427284, 0.03530646860599518, 0.036714546382427216, 0.03812262415885925, 0.03953070566058159, 0.040938783437013626, 0.04234686493873596, 0.043754942715168]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 8.0, 4.0, 7.0, 9.0, 11.0, 8.0, 8.0, 18.0, 17.0, 29.0, 31.0, 32.0, 31.0, 39.0, 39.0, 36.0, 46.0, 37.0, 51.0, 56.0, 47.0, 50.0, 47.0, 33.0, 40.0, 34.0, 44.0, 27.0, 24.0, 37.0, 17.0, 10.0, 9.0, 20.0, 7.0, 8.0, 6.0, 4.0, 5.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.023339927196502686, -0.022639479488134384, -0.021939033642411232, -0.02123858779668808, -0.02053814008831978, -0.019837692379951477, -0.019137246534228325, -0.018436800688505173, -0.01773635298013687, -0.01703590527176857, -0.016335459426045418, -0.015635013580322266, -0.014934565871953964, -0.014234119094908237, -0.01353367231786251, -0.012833225540816784, -0.012132778763771057, -0.01143233198672533, -0.010731885209679604, -0.010031438432633877, -0.00933099165558815, -0.008630544878542423, -0.007930098101496696, -0.00722965132445097, -0.006529204547405243, -0.005828757770359516, -0.005128310993313789, -0.004427864216268063, -0.003727417439222336, -0.003026970662176609, -0.0023265238851308823, -0.0016260771080851555, -0.0009256303310394287, -0.00022518355399370193, 0.00047526322305202484, 0.0011757100000977516, 0.0018761567771434784, 0.002576603554189205, 0.003277050331234932, 0.003977497108280659, 0.0046779438853263855, 0.005378390662372112, 0.006078837439417839, 0.006779284216463566, 0.007479730993509293, 0.00818017777055502, 0.008880624547600746, 0.009581071324646473, 0.0102815181016922, 0.010981964878737926, 0.011682411655783653, 0.01238285843282938, 0.013083305209875107, 0.013783751986920834, 0.01448419876396656, 0.015184645541012287, 0.015885092318058014, 0.016585540026426315, 0.017285985872149467, 0.01798643171787262, 0.01868687942624092, 0.019387327134609222, 0.020087772980332375, 0.020788218826055527, 0.021488666534423828]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 8.0, 9.0, 20.0, 26.0, 24.0, 40.0, 57.0, 84.0, 126.0, 201.0, 356.0, 593.0, 1006.0, 1925.0, 3839.0, 8772.0, 24460.0, 92561.0, 441373.0, 363249.0, 74155.0, 20746.0, 7617.0, 3453.0, 1582.0, 877.0, 525.0, 294.0, 196.0, 139.0, 79.0, 53.0, 20.0, 26.0, 20.0, 14.0, 7.0, 7.0, 2.0, 2.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0053863525390625, -0.00520634651184082, -0.005026340484619141, -0.004846334457397461, -0.004666328430175781, -0.0044863224029541016, -0.004306316375732422, -0.004126310348510742, -0.0039463043212890625, -0.003766298294067383, -0.003586292266845703, -0.0034062862396240234, -0.0032262802124023438, -0.003046274185180664, -0.0028662681579589844, -0.0026862621307373047, -0.002506256103515625, -0.0023262500762939453, -0.0021462440490722656, -0.001966238021850586, -0.0017862319946289062, -0.0016062259674072266, -0.0014262199401855469, -0.0012462139129638672, -0.0010662078857421875, -0.0008862018585205078, -0.0007061958312988281, -0.0005261898040771484, -0.00034618377685546875, -0.00016617774963378906, 1.3828277587890625e-05, 0.0001938343048095703, 0.00037384033203125, 0.0005538463592529297, 0.0007338523864746094, 0.0009138584136962891, 0.0010938644409179688, 0.0012738704681396484, 0.0014538764953613281, 0.0016338825225830078, 0.0018138885498046875, 0.001993894577026367, 0.002173900604248047, 0.0023539066314697266, 0.0025339126586914062, 0.002713918685913086, 0.0028939247131347656, 0.0030739307403564453, 0.003253936767578125, 0.0034339427947998047, 0.0036139488220214844, 0.003793954849243164, 0.003973960876464844, 0.0041539669036865234, 0.004333972930908203, 0.004513978958129883, 0.0046939849853515625, 0.004873991012573242, 0.005053997039794922, 0.0052340030670166016, 0.005414009094238281, 0.005594015121459961, 0.005774021148681641, 0.00595402717590332, 0.006134033203125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 8.0, 23.0, 34.0, 45.0, 76.0, 77.0, 122.0, 146.0, 121.0, 102.0, 70.0, 45.0, 33.0, 28.0, 15.0, 9.0, 7.0, 12.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00734710693359375, -0.007092714309692383, -0.006838321685791016, -0.0065839290618896484, -0.006329536437988281, -0.006075143814086914, -0.005820751190185547, -0.00556635856628418, -0.0053119659423828125, -0.005057573318481445, -0.004803180694580078, -0.004548788070678711, -0.004294395446777344, -0.0040400028228759766, -0.0037856101989746094, -0.003531217575073242, -0.003276824951171875, -0.003022432327270508, -0.0027680397033691406, -0.0025136470794677734, -0.0022592544555664062, -0.002004861831665039, -0.0017504692077636719, -0.0014960765838623047, -0.0012416839599609375, -0.0009872913360595703, -0.0007328987121582031, -0.00047850608825683594, -0.00022411346435546875, 3.0279159545898438e-05, 0.0002846717834472656, 0.0005390644073486328, 0.00079345703125, 0.0010478496551513672, 0.0013022422790527344, 0.0015566349029541016, 0.0018110275268554688, 0.002065420150756836, 0.002319812774658203, 0.0025742053985595703, 0.0028285980224609375, 0.0030829906463623047, 0.003337383270263672, 0.003591775894165039, 0.0038461685180664062, 0.0041005611419677734, 0.004354953765869141, 0.004609346389770508, 0.004863739013671875, 0.005118131637573242, 0.005372524261474609, 0.0056269168853759766, 0.005881309509277344, 0.006135702133178711, 0.006390094757080078, 0.006644487380981445, 0.0068988800048828125, 0.00715327262878418, 0.007407665252685547, 0.007662057876586914, 0.007916450500488281, 0.008170843124389648, 0.008425235748291016, 0.008679628372192383, 0.00893402099609375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 11.0, 5.0, 8.0, 9.0, 13.0, 20.0, 17.0, 24.0, 33.0, 55.0, 61.0, 89.0, 103.0, 154.0, 231.0, 298.0, 514.0, 821.0, 1668.0, 4014.0, 14785.0, 92369.0, 679633.0, 213660.0, 28349.0, 6279.0, 2154.0, 1079.0, 687.0, 395.0, 272.0, 202.0, 144.0, 86.0, 80.0, 67.0, 48.0, 31.0, 28.0, 18.0, 9.0, 8.0, 8.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.01020050048828125, -0.009914755821228027, -0.009629011154174805, -0.009343266487121582, -0.00905752182006836, -0.008771777153015137, -0.008486032485961914, -0.008200287818908691, -0.007914543151855469, -0.007628798484802246, -0.0073430538177490234, -0.007057309150695801, -0.006771564483642578, -0.0064858198165893555, -0.006200075149536133, -0.00591433048248291, -0.0056285858154296875, -0.005342841148376465, -0.005057096481323242, -0.0047713518142700195, -0.004485607147216797, -0.004199862480163574, -0.0039141178131103516, -0.003628373146057129, -0.0033426284790039062, -0.0030568838119506836, -0.002771139144897461, -0.0024853944778442383, -0.0021996498107910156, -0.001913905143737793, -0.0016281604766845703, -0.0013424158096313477, -0.001056671142578125, -0.0007709264755249023, -0.0004851818084716797, -0.00019943714141845703, 8.630752563476562e-05, 0.0003720521926879883, 0.0006577968597412109, 0.0009435415267944336, 0.0012292861938476562, 0.001515030860900879, 0.0018007755279541016, 0.0020865201950073242, 0.002372264862060547, 0.0026580095291137695, 0.002943754196166992, 0.003229498863220215, 0.0035152435302734375, 0.00380098819732666, 0.004086732864379883, 0.0043724775314331055, 0.004658222198486328, 0.004943966865539551, 0.0052297115325927734, 0.005515456199645996, 0.005801200866699219, 0.006086945533752441, 0.006372690200805664, 0.006658434867858887, 0.006944179534912109, 0.007229924201965332, 0.007515668869018555, 0.007801413536071777, 0.008087158203125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 7.0, 2.0, 4.0, 8.0, 7.0, 11.0, 9.0, 7.0, 9.0, 12.0, 17.0, 16.0, 24.0, 34.0, 33.0, 28.0, 34.0, 36.0, 36.0, 50.0, 48.0, 32.0, 45.0, 35.0, 47.0, 42.0, 41.0, 38.0, 40.0, 42.0, 28.0, 26.0, 26.0, 17.0, 21.0, 16.0, 11.0, 16.0, 13.0, 7.0, 5.0, 7.0, 4.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.013458251953125, -0.013055801391601562, -0.012653350830078125, -0.012250900268554688, -0.01184844970703125, -0.011445999145507812, -0.011043548583984375, -0.010641098022460938, -0.0102386474609375, -0.009836196899414062, -0.009433746337890625, -0.009031295776367188, -0.00862884521484375, -0.008226394653320312, -0.007823944091796875, -0.0074214935302734375, -0.00701904296875, -0.0066165924072265625, -0.006214141845703125, -0.0058116912841796875, -0.00540924072265625, -0.0050067901611328125, -0.004604339599609375, -0.0042018890380859375, -0.0037994384765625, -0.0033969879150390625, -0.002994537353515625, -0.0025920867919921875, -0.00218963623046875, -0.0017871856689453125, -0.001384735107421875, -0.0009822845458984375, -0.000579833984375, -0.0001773834228515625, 0.000225067138671875, 0.0006275177001953125, 0.00102996826171875, 0.0014324188232421875, 0.001834869384765625, 0.0022373199462890625, 0.0026397705078125, 0.0030422210693359375, 0.003444671630859375, 0.0038471221923828125, 0.00424957275390625, 0.0046520233154296875, 0.005054473876953125, 0.0054569244384765625, 0.005859375, 0.0062618255615234375, 0.006664276123046875, 0.0070667266845703125, 0.00746917724609375, 0.007871627807617188, 0.008274078369140625, 0.008676528930664062, 0.0090789794921875, 0.009481430053710938, 0.009883880615234375, 0.010286331176757812, 0.01068878173828125, 0.011091232299804688, 0.011493682861328125, 0.011896133422851562, 0.012298583984375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 9.0, 5.0, 11.0, 15.0, 18.0, 31.0, 32.0, 57.0, 77.0, 158.0, 304.0, 491.0, 1044.0, 2156.0, 5361.0, 16416.0, 68258.0, 506544.0, 358539.0, 63820.0, 15737.0, 5242.0, 2087.0, 967.0, 483.0, 254.0, 157.0, 104.0, 59.0, 40.0, 30.0, 15.0, 13.0, 11.0, 11.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001148223876953125, -0.0011071860790252686, -0.0010661482810974121, -0.0010251104831695557, -0.0009840726852416992, -0.0009430348873138428, -0.0009019970893859863, -0.0008609592914581299, -0.0008199214935302734, -0.000778883695602417, -0.0007378458976745605, -0.0006968080997467041, -0.0006557703018188477, -0.0006147325038909912, -0.0005736947059631348, -0.0005326569080352783, -0.0004916191101074219, -0.00045058131217956543, -0.000409543514251709, -0.00036850571632385254, -0.0003274679183959961, -0.00028643012046813965, -0.0002453923225402832, -0.00020435452461242676, -0.0001633167266845703, -0.00012227892875671387, -8.124113082885742e-05, -4.0203332901000977e-05, 8.344650268554688e-07, 4.1872262954711914e-05, 8.291006088256836e-05, 0.0001239478588104248, 0.00016498565673828125, 0.0002060234546661377, 0.00024706125259399414, 0.0002880990505218506, 0.00032913684844970703, 0.0003701746463775635, 0.0004112124443054199, 0.00045225024223327637, 0.0004932880401611328, 0.0005343258380889893, 0.0005753636360168457, 0.0006164014339447021, 0.0006574392318725586, 0.000698477029800415, 0.0007395148277282715, 0.0007805526256561279, 0.0008215904235839844, 0.0008626282215118408, 0.0009036660194396973, 0.0009447038173675537, 0.0009857416152954102, 0.0010267794132232666, 0.001067817211151123, 0.0011088550090789795, 0.001149892807006836, 0.0011909306049346924, 0.0012319684028625488, 0.0012730062007904053, 0.0013140439987182617, 0.0013550817966461182, 0.0013961195945739746, 0.001437157392501831, 0.0014781951904296875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 12.0, 9.0, 9.0, 16.0, 11.0, 12.0, 29.0, 20.0, 30.0, 27.0, 30.0, 47.0, 35.0, 60.0, 56.0, 41.0, 74.0, 45.0, 67.0, 75.0, 35.0, 56.0, 26.0, 39.0, 35.0, 20.0, 8.0, 14.0, 19.0, 7.0, 8.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5299530029296875e-06, -4.374422132968903e-06, -4.218891263008118e-06, -4.063360393047333e-06, -3.907829523086548e-06, -3.752298653125763e-06, -3.596767783164978e-06, -3.441236913204193e-06, -3.285706043243408e-06, -3.1301751732826233e-06, -2.9746443033218384e-06, -2.8191134333610535e-06, -2.6635825634002686e-06, -2.5080516934394836e-06, -2.3525208234786987e-06, -2.196989953517914e-06, -2.041459083557129e-06, -1.885928213596344e-06, -1.730397343635559e-06, -1.5748664736747742e-06, -1.4193356037139893e-06, -1.2638047337532043e-06, -1.1082738637924194e-06, -9.527429938316345e-07, -7.972121238708496e-07, -6.416812539100647e-07, -4.861503839492798e-07, -3.3061951398849487e-07, -1.7508864402770996e-07, -1.955777406692505e-08, 1.3597309589385986e-07, 2.915039658546448e-07, 4.470348358154297e-07, 6.025657057762146e-07, 7.580965757369995e-07, 9.136274456977844e-07, 1.0691583156585693e-06, 1.2246891856193542e-06, 1.3802200555801392e-06, 1.535750925540924e-06, 1.691281795501709e-06, 1.846812665462494e-06, 2.002343535423279e-06, 2.1578744053840637e-06, 2.3134052753448486e-06, 2.4689361453056335e-06, 2.6244670152664185e-06, 2.7799978852272034e-06, 2.9355287551879883e-06, 3.091059625148773e-06, 3.246590495109558e-06, 3.402121365070343e-06, 3.557652235031128e-06, 3.713183104991913e-06, 3.868713974952698e-06, 4.024244844913483e-06, 4.179775714874268e-06, 4.3353065848350525e-06, 4.490837454795837e-06, 4.646368324756622e-06, 4.801899194717407e-06, 4.957430064678192e-06, 5.112960934638977e-06, 5.268491804599762e-06, 5.424022674560547e-06]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 5.0, 9.0, 9.0, 19.0, 35.0, 36.0, 49.0, 73.0, 111.0, 200.0, 303.0, 526.0, 1106.0, 2675.0, 8850.0, 43072.0, 317762.0, 591945.0, 63822.0, 11787.0, 3329.0, 1261.0, 619.0, 350.0, 194.0, 126.0, 68.0, 55.0, 45.0, 39.0, 14.0, 12.0, 7.0, 12.0, 4.0, 7.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001293182373046875, -0.0012454688549041748, -0.0011977553367614746, -0.0011500418186187744, -0.0011023283004760742, -0.001054614782333374, -0.0010069012641906738, -0.0009591877460479736, -0.0009114742279052734, -0.0008637607097625732, -0.000816047191619873, -0.0007683336734771729, -0.0007206201553344727, -0.0006729066371917725, -0.0006251931190490723, -0.0005774796009063721, -0.0005297660827636719, -0.0004820525646209717, -0.0004343390464782715, -0.0003866255283355713, -0.0003389120101928711, -0.0002911984920501709, -0.0002434849739074707, -0.0001957714557647705, -0.0001480579376220703, -0.00010034441947937012, -5.263090133666992e-05, -4.9173831939697266e-06, 4.279613494873047e-05, 9.050965309143066e-05, 0.00013822317123413086, 0.00018593668937683105, 0.00023365020751953125, 0.00028136372566223145, 0.00032907724380493164, 0.00037679076194763184, 0.00042450428009033203, 0.0004722177982330322, 0.0005199313163757324, 0.0005676448345184326, 0.0006153583526611328, 0.000663071870803833, 0.0007107853889465332, 0.0007584989070892334, 0.0008062124252319336, 0.0008539259433746338, 0.000901639461517334, 0.0009493529796600342, 0.0009970664978027344, 0.0010447800159454346, 0.0010924935340881348, 0.001140207052230835, 0.0011879205703735352, 0.0012356340885162354, 0.0012833476066589355, 0.0013310611248016357, 0.001378774642944336, 0.0014264881610870361, 0.0014742016792297363, 0.0015219151973724365, 0.0015696287155151367, 0.001617342233657837, 0.0016650557518005371, 0.0017127692699432373, 0.0017604827880859375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 10.0, 11.0, 19.0, 19.0, 21.0, 34.0, 42.0, 64.0, 67.0, 72.0, 82.0, 93.0, 78.0, 84.0, 57.0, 57.0, 39.0, 34.0, 20.0, 21.0, 14.0, 13.0, 18.0, 3.0, 5.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002040863037109375, -0.00197407603263855, -0.0019072890281677246, -0.0018405020236968994, -0.0017737150192260742, -0.001706928014755249, -0.0016401410102844238, -0.0015733540058135986, -0.0015065670013427734, -0.0014397799968719482, -0.001372992992401123, -0.0013062059879302979, -0.0012394189834594727, -0.0011726319789886475, -0.0011058449745178223, -0.001039057970046997, -0.0009722709655761719, -0.0009054839611053467, -0.0008386969566345215, -0.0007719099521636963, -0.0007051229476928711, -0.0006383359432220459, -0.0005715489387512207, -0.0005047619342803955, -0.0004379749298095703, -0.0003711879253387451, -0.0003044009208679199, -0.00023761391639709473, -0.00017082691192626953, -0.00010403990745544434, -3.725290298461914e-05, 2.9534101486206055e-05, 9.632110595703125e-05, 0.00016310811042785645, 0.00022989511489868164, 0.00029668211936950684, 0.00036346912384033203, 0.0004302561283111572, 0.0004970431327819824, 0.0005638301372528076, 0.0006306171417236328, 0.000697404146194458, 0.0007641911506652832, 0.0008309781551361084, 0.0008977651596069336, 0.0009645521640777588, 0.001031339168548584, 0.0010981261730194092, 0.0011649131774902344, 0.0012317001819610596, 0.0012984871864318848, 0.00136527419090271, 0.0014320611953735352, 0.0014988481998443604, 0.0015656352043151855, 0.0016324222087860107, 0.001699209213256836, 0.0017659962177276611, 0.0018327832221984863, 0.0018995702266693115, 0.0019663572311401367, 0.002033144235610962, 0.002099931240081787, 0.0021667182445526123, 0.0022335052490234375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 14.0, 24.0, 59.0, 131.0, 237.0, 297.0, 130.0, 46.0, 29.0, 12.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062259502708911896, -0.059788286685943604, -0.05731707066297531, -0.05484585091471672, -0.05237463489174843, -0.049903418868780136, -0.047432199120521545, -0.04496098309755325, -0.04248976707458496, -0.04001855105161667, -0.037547335028648376, -0.035076115280389786, -0.032604899257421494, -0.0301336832344532, -0.02766246534883976, -0.02519124746322632, -0.022720031440258026, -0.020248815417289734, -0.017777597531676292, -0.015306380577385426, -0.012835163623094559, -0.010363946668803692, -0.007892729714512825, -0.0054215118288993835, -0.0029502958059310913, -0.00047907885164022446, 0.0019921381026506424, 0.004463355056941509, 0.006934572011232376, 0.009405788965523243, 0.01187700591981411, 0.014348223805427551, 0.016819432377815247, 0.01929064840078354, 0.02176186628639698, 0.024233084172010422, 0.026704300194978714, 0.029175516217947006, 0.0316467359662056, 0.03411795198917389, 0.03658916801214218, 0.039060384035110474, 0.041531600058078766, 0.04400281980633736, 0.04647403582930565, 0.04894525185227394, 0.05141647160053253, 0.053887687623500824, 0.056358903646469116, 0.05883011966943741, 0.0613013356924057, 0.06377255171537399, 0.06624376773834229, 0.06871499121189117, 0.07118620723485947, 0.07365742325782776, 0.07612863928079605, 0.07859985530376434, 0.08107107132673264, 0.08354228734970093, 0.08601351082324982, 0.08848472684621811, 0.0909559428691864, 0.0934271588921547, 0.09589837491512299]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 8.0, 3.0, 5.0, 10.0, 16.0, 8.0, 15.0, 18.0, 19.0, 17.0, 30.0, 26.0, 21.0, 29.0, 37.0, 47.0, 58.0, 64.0, 72.0, 93.0, 61.0, 51.0, 38.0, 36.0, 34.0, 34.0, 20.0, 20.0, 16.0, 12.0, 16.0, 11.0, 8.0, 7.0, 8.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.06331872940063477, -0.0614977590739727, -0.05967678874731064, -0.057855818420648575, -0.05603484809398651, -0.05421387776732445, -0.052392907440662384, -0.05057193711400032, -0.04875096678733826, -0.04692999646067619, -0.04510902613401413, -0.043288055807352066, -0.04146708548069, -0.03964611515402794, -0.037825144827365875, -0.03600417450070381, -0.03418320417404175, -0.032362233847379684, -0.03054126352071762, -0.028720293194055557, -0.026899322867393494, -0.02507835254073143, -0.023257382214069366, -0.021436411887407303, -0.01961544156074524, -0.017794471234083176, -0.015973500907421112, -0.014152530580759048, -0.012331560254096985, -0.010510589927434921, -0.008689619600772858, -0.006868649274110794, -0.0050476789474487305, -0.003226708620786667, -0.0014057382941246033, 0.00041523203253746033, 0.002236202359199524, 0.0040571726858615875, 0.005878143012523651, 0.007699113339185715, 0.009520083665847778, 0.011341053992509842, 0.013162024319171906, 0.014982994645833969, 0.016803964972496033, 0.018624935299158096, 0.02044590562582016, 0.022266875952482224, 0.024087846279144287, 0.02590881660580635, 0.027729786932468414, 0.029550757259130478, 0.03137172758579254, 0.033192697912454605, 0.03501366823911667, 0.03683463856577873, 0.038655608892440796, 0.04047657921910286, 0.04229754954576492, 0.04411851987242699, 0.04593949019908905, 0.047760460525751114, 0.04958143085241318, 0.05140240117907524, 0.053223371505737305]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 2.0, 13.0, 5.0, 19.0, 45.0, 41.0, 85.0, 160.0, 299.0, 698.0, 1813.0, 4740.0, 15642.0, 97897.0, 2179245.0, 1789983.0, 84968.0, 12716.0, 3573.0, 1348.0, 436.0, 228.0, 113.0, 57.0, 48.0, 33.0, 18.0, 15.0, 12.0, 7.0, 7.0, 1.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004108428955078125, -0.0039560794830322266, -0.003803730010986328, -0.0036513805389404297, -0.0034990310668945312, -0.003346681594848633, -0.0031943321228027344, -0.003041982650756836, -0.0028896331787109375, -0.002737283706665039, -0.0025849342346191406, -0.002432584762573242, -0.0022802352905273438, -0.0021278858184814453, -0.001975536346435547, -0.0018231868743896484, -0.00167083740234375, -0.0015184879302978516, -0.0013661384582519531, -0.0012137889862060547, -0.0010614395141601562, -0.0009090900421142578, -0.0007567405700683594, -0.0006043910980224609, -0.0004520416259765625, -0.00029969215393066406, -0.00014734268188476562, 5.0067901611328125e-06, 0.00015735626220703125, 0.0003097057342529297, 0.0004620552062988281, 0.0006144046783447266, 0.000766754150390625, 0.0009191036224365234, 0.0010714530944824219, 0.0012238025665283203, 0.0013761520385742188, 0.0015285015106201172, 0.0016808509826660156, 0.001833200454711914, 0.0019855499267578125, 0.002137899398803711, 0.0022902488708496094, 0.002442598342895508, 0.0025949478149414062, 0.0027472972869873047, 0.002899646759033203, 0.0030519962310791016, 0.003204345703125, 0.0033566951751708984, 0.003509044647216797, 0.0036613941192626953, 0.0038137435913085938, 0.003966093063354492, 0.004118442535400391, 0.004270792007446289, 0.0044231414794921875, 0.004575490951538086, 0.004727840423583984, 0.004880189895629883, 0.005032539367675781, 0.00518488883972168, 0.005337238311767578, 0.0054895877838134766, 0.005641937255859375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 7.0, 13.0, 20.0, 30.0, 52.0, 67.0, 92.0, 104.0, 138.0, 132.0, 103.0, 84.0, 49.0, 35.0, 26.0, 11.0, 7.0, 10.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007305145263671875, -0.007050931453704834, -0.006796717643737793, -0.006542503833770752, -0.006288290023803711, -0.00603407621383667, -0.005779862403869629, -0.005525648593902588, -0.005271434783935547, -0.005017220973968506, -0.004763007164001465, -0.004508793354034424, -0.004254579544067383, -0.004000365734100342, -0.0037461519241333008, -0.0034919381141662598, -0.0032377243041992188, -0.0029835104942321777, -0.0027292966842651367, -0.0024750828742980957, -0.0022208690643310547, -0.0019666552543640137, -0.0017124414443969727, -0.0014582276344299316, -0.0012040138244628906, -0.0009498000144958496, -0.0006955862045288086, -0.0004413723945617676, -0.00018715858459472656, 6.705522537231445e-05, 0.00032126903533935547, 0.0005754828453063965, 0.0008296966552734375, 0.0010839104652404785, 0.0013381242752075195, 0.0015923380851745605, 0.0018465518951416016, 0.0021007657051086426, 0.0023549795150756836, 0.0026091933250427246, 0.0028634071350097656, 0.0031176209449768066, 0.0033718347549438477, 0.0036260485649108887, 0.0038802623748779297, 0.004134476184844971, 0.004388689994812012, 0.004642903804779053, 0.004897117614746094, 0.005151331424713135, 0.005405545234680176, 0.005659759044647217, 0.005913972854614258, 0.006168186664581299, 0.00642240047454834, 0.006676614284515381, 0.006930828094482422, 0.007185041904449463, 0.007439255714416504, 0.007693469524383545, 0.007947683334350586, 0.008201897144317627, 0.008456110954284668, 0.008710324764251709, 0.00896453857421875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 6.0, 9.0, 10.0, 15.0, 22.0, 42.0, 67.0, 162.0, 309.0, 571.0, 1288.0, 4493.0, 39978.0, 3992024.0, 143401.0, 8374.0, 1905.0, 743.0, 378.0, 196.0, 122.0, 56.0, 51.0, 22.0, 12.0, 10.0, 6.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00928497314453125, -0.009009122848510742, -0.008733272552490234, -0.008457422256469727, -0.008181571960449219, -0.007905721664428711, -0.007629871368408203, -0.007354021072387695, -0.0070781707763671875, -0.00680232048034668, -0.006526470184326172, -0.006250619888305664, -0.005974769592285156, -0.0056989192962646484, -0.005423069000244141, -0.005147218704223633, -0.004871368408203125, -0.004595518112182617, -0.004319667816162109, -0.0040438175201416016, -0.0037679672241210938, -0.003492116928100586, -0.003216266632080078, -0.0029404163360595703, -0.0026645660400390625, -0.0023887157440185547, -0.002112865447998047, -0.001837015151977539, -0.0015611648559570312, -0.0012853145599365234, -0.0010094642639160156, -0.0007336139678955078, -0.000457763671875, -0.0001819133758544922, 9.393692016601562e-05, 0.00036978721618652344, 0.0006456375122070312, 0.0009214878082275391, 0.0011973381042480469, 0.0014731884002685547, 0.0017490386962890625, 0.0020248889923095703, 0.002300739288330078, 0.002576589584350586, 0.0028524398803710938, 0.0031282901763916016, 0.0034041404724121094, 0.003679990768432617, 0.003955841064453125, 0.004231691360473633, 0.004507541656494141, 0.0047833919525146484, 0.005059242248535156, 0.005335092544555664, 0.005610942840576172, 0.00588679313659668, 0.0061626434326171875, 0.006438493728637695, 0.006714344024658203, 0.006990194320678711, 0.007266044616699219, 0.0075418949127197266, 0.007817745208740234, 0.008093595504760742, 0.00836944580078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 11.0, 9.0, 15.0, 31.0, 141.0, 665.0, 1562.0, 1166.0, 308.0, 75.0, 34.0, 18.0, 21.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00934600830078125, -0.009009361267089844, -0.008672714233398438, -0.008336067199707031, -0.007999420166015625, -0.007662773132324219, -0.0073261260986328125, -0.006989479064941406, -0.00665283203125, -0.006316184997558594, -0.0059795379638671875, -0.005642890930175781, -0.005306243896484375, -0.004969596862792969, -0.0046329498291015625, -0.004296302795410156, -0.00395965576171875, -0.0036230087280273438, -0.0032863616943359375, -0.0029497146606445312, -0.002613067626953125, -0.0022764205932617188, -0.0019397735595703125, -0.0016031265258789062, -0.0012664794921875, -0.0009298324584960938, -0.0005931854248046875, -0.00025653839111328125, 8.0108642578125e-05, 0.00041675567626953125, 0.0007534027099609375, 0.0010900497436523438, 0.00142669677734375, 0.0017633438110351562, 0.0020999908447265625, 0.0024366378784179688, 0.002773284912109375, 0.0031099319458007812, 0.0034465789794921875, 0.0037832260131835938, 0.004119873046875, 0.004456520080566406, 0.0047931671142578125, 0.005129814147949219, 0.005466461181640625, 0.005803108215332031, 0.0061397552490234375, 0.006476402282714844, 0.00681304931640625, 0.007149696350097656, 0.0074863433837890625, 0.007822990417480469, 0.008159637451171875, 0.008496284484863281, 0.008832931518554688, 0.009169578552246094, 0.0095062255859375, 0.009842872619628906, 0.010179519653320312, 0.010516166687011719, 0.010852813720703125, 0.011189460754394531, 0.011526107788085938, 0.011862754821777344, 0.01219940185546875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 12.0, 72.0, 310.0, 428.0, 124.0, 25.0, 16.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05934443697333336, -0.056237686425447464, -0.05313093960285187, -0.05002418905496597, -0.04691743850708008, -0.04381069168448448, -0.04070394113659859, -0.03759719431400299, -0.034490443766117096, -0.0313836932182312, -0.028276946395635605, -0.02517019584774971, -0.022063447162508965, -0.01895669847726822, -0.015849947929382324, -0.012743199244141579, -0.009636450558900833, -0.0065297014079988, -0.0034229522570967674, -0.00031620264053344727, 0.0027905460447072983, 0.005897294729948044, 0.009004045277833939, 0.012110793963074684, 0.01521754264831543, 0.018324291333556175, 0.02143104001879692, 0.024537790566682816, 0.02764453925192356, 0.030751287937164307, 0.0338580384850502, 0.036964789032936096, 0.040071532130241394, 0.04317828267812729, 0.046285029500722885, 0.04939178004860878, 0.052498526871204376, 0.05560527741909027, 0.058712027966976166, 0.06181877851486206, 0.06492552161216736, 0.06803227216005325, 0.07113902270793915, 0.07424576580524445, 0.07735251635313034, 0.08045926690101624, 0.08356601744890213, 0.08667276799678802, 0.08977951854467392, 0.09288626909255981, 0.09599301964044571, 0.0990997701883316, 0.1022065132856369, 0.1053132638335228, 0.10842001438140869, 0.11152676492929459, 0.11463351547718048, 0.11774026602506638, 0.12084701657295227, 0.12395375967025757, 0.12706051766872406, 0.13016726076602936, 0.13327401876449585, 0.13638076186180115, 0.13948750495910645]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 4.0, 4.0, 9.0, 7.0, 8.0, 9.0, 9.0, 12.0, 13.0, 31.0, 28.0, 23.0, 25.0, 26.0, 25.0, 30.0, 35.0, 43.0, 40.0, 48.0, 53.0, 44.0, 47.0, 50.0, 42.0, 47.0, 36.0, 38.0, 33.0, 28.0, 15.0, 21.0, 25.0, 15.0, 10.0, 17.0, 12.0, 7.0, 8.0, 8.0, 3.0, 4.0, 2.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.020757019519805908, -0.020089566707611084, -0.01942211575806141, -0.018754664808511734, -0.01808721199631691, -0.017419759184122086, -0.01675230823457241, -0.016084857285022736, -0.015417404472827911, -0.014749952591955662, -0.014082500711083412, -0.013415048830211163, -0.012747596949338913, -0.012080145068466663, -0.011412693187594414, -0.010745241306722164, -0.010077789425849915, -0.009410337544977665, -0.008742885664105415, -0.008075433783233166, -0.007407981902360916, -0.0067405300214886665, -0.006073078140616417, -0.005405626259744167, -0.004738174378871918, -0.004070722497999668, -0.0034032706171274185, -0.002735818736255169, -0.0020683668553829193, -0.0014009149745106697, -0.0007334630936384201, -6.60112127661705e-05, 0.0006014406681060791, 0.0012688925489783287, 0.0019363444298505783, 0.002603796310722828, 0.0032712481915950775, 0.003938700072467327, 0.004606151953339577, 0.005273603834211826, 0.005941055715084076, 0.0066085075959563255, 0.007275959476828575, 0.007943411357700825, 0.008610863238573074, 0.009278315119445324, 0.009945767000317574, 0.010613218881189823, 0.011280670762062073, 0.011948122642934322, 0.012615574523806572, 0.013283026404678822, 0.013950478285551071, 0.01461793016642332, 0.01528538204729557, 0.015952832996845245, 0.01662028580904007, 0.017287738621234894, 0.01795518957078457, 0.018622640520334244, 0.019290093332529068, 0.019957546144723892, 0.020624997094273567, 0.021292448043823242, 0.021959900856018066]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 2.0, 7.0, 5.0, 13.0, 9.0, 17.0, 19.0, 37.0, 36.0, 66.0, 77.0, 113.0, 165.0, 258.0, 339.0, 556.0, 915.0, 1493.0, 2569.0, 4973.0, 10781.0, 26944.0, 78453.0, 238079.0, 392982.0, 187874.0, 60600.0, 21765.0, 9061.0, 4294.0, 2247.0, 1330.0, 808.0, 529.0, 334.0, 228.0, 150.0, 105.0, 91.0, 63.0, 48.0, 28.0, 23.0, 16.0, 15.0, 10.0, 13.0, 6.0, 1.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0037708282470703125, -0.0036506950855255127, -0.003530561923980713, -0.003410428762435913, -0.0032902956008911133, -0.0031701624393463135, -0.0030500292778015137, -0.002929896116256714, -0.002809762954711914, -0.0026896297931671143, -0.0025694966316223145, -0.0024493634700775146, -0.002329230308532715, -0.002209097146987915, -0.0020889639854431152, -0.0019688308238983154, -0.0018486976623535156, -0.0017285645008087158, -0.001608431339263916, -0.0014882981777191162, -0.0013681650161743164, -0.0012480318546295166, -0.0011278986930847168, -0.001007765531539917, -0.0008876323699951172, -0.0007674992084503174, -0.0006473660469055176, -0.0005272328853607178, -0.00040709972381591797, -0.00028696656227111816, -0.00016683340072631836, -4.6700239181518555e-05, 7.343292236328125e-05, 0.00019356608390808105, 0.00031369924545288086, 0.00043383240699768066, 0.0005539655685424805, 0.0006740987300872803, 0.0007942318916320801, 0.0009143650531768799, 0.0010344982147216797, 0.0011546313762664795, 0.0012747645378112793, 0.001394897699356079, 0.001515030860900879, 0.0016351640224456787, 0.0017552971839904785, 0.0018754303455352783, 0.001995563507080078, 0.002115696668624878, 0.0022358298301696777, 0.0023559629917144775, 0.0024760961532592773, 0.002596229314804077, 0.002716362476348877, 0.0028364956378936768, 0.0029566287994384766, 0.0030767619609832764, 0.003196895122528076, 0.003317028284072876, 0.0034371614456176758, 0.0035572946071624756, 0.0036774277687072754, 0.003797560930252075, 0.003917694091796875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 18.0, 21.0, 34.0, 52.0, 65.0, 106.0, 131.0, 129.0, 141.0, 104.0, 68.0, 33.0, 32.0, 21.0, 11.0, 6.0, 11.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00725555419921875, -0.007000565528869629, -0.006745576858520508, -0.006490588188171387, -0.006235599517822266, -0.0059806108474731445, -0.0057256221771240234, -0.005470633506774902, -0.005215644836425781, -0.00496065616607666, -0.004705667495727539, -0.004450678825378418, -0.004195690155029297, -0.003940701484680176, -0.0036857128143310547, -0.0034307241439819336, -0.0031757354736328125, -0.0029207468032836914, -0.0026657581329345703, -0.0024107694625854492, -0.002155780792236328, -0.001900792121887207, -0.001645803451538086, -0.0013908147811889648, -0.0011358261108398438, -0.0008808374404907227, -0.0006258487701416016, -0.00037086009979248047, -0.00011587142944335938, 0.00013911724090576172, 0.0003941059112548828, 0.0006490945816040039, 0.000904083251953125, 0.001159071922302246, 0.0014140605926513672, 0.0016690492630004883, 0.0019240379333496094, 0.0021790266036987305, 0.0024340152740478516, 0.0026890039443969727, 0.0029439926147460938, 0.003198981285095215, 0.003453969955444336, 0.003708958625793457, 0.003963947296142578, 0.004218935966491699, 0.00447392463684082, 0.004728913307189941, 0.0049839019775390625, 0.005238890647888184, 0.005493879318237305, 0.005748867988586426, 0.006003856658935547, 0.006258845329284668, 0.006513833999633789, 0.00676882266998291, 0.007023811340332031, 0.007278800010681152, 0.0075337886810302734, 0.0077887773513793945, 0.008043766021728516, 0.008298754692077637, 0.008553743362426758, 0.008808732032775879, 0.009063720703125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 9.0, 3.0, 7.0, 6.0, 13.0, 14.0, 19.0, 25.0, 30.0, 48.0, 71.0, 69.0, 122.0, 165.0, 236.0, 390.0, 690.0, 1205.0, 2461.0, 5405.0, 13299.0, 34592.0, 96284.0, 232401.0, 442292.0, 136232.0, 49525.0, 18374.0, 7333.0, 3313.0, 1633.0, 825.0, 464.0, 325.0, 198.0, 136.0, 95.0, 72.0, 40.0, 35.0, 27.0, 15.0, 17.0, 11.0, 10.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0043487548828125, -0.004221528768539429, -0.004094302654266357, -0.003967076539993286, -0.003839850425720215, -0.0037126243114471436, -0.0035853981971740723, -0.003458172082901001, -0.0033309459686279297, -0.0032037198543548584, -0.003076493740081787, -0.002949267625808716, -0.0028220415115356445, -0.0026948153972625732, -0.002567589282989502, -0.0024403631687164307, -0.0023131370544433594, -0.002185910940170288, -0.002058684825897217, -0.0019314587116241455, -0.0018042325973510742, -0.001677006483078003, -0.0015497803688049316, -0.0014225542545318604, -0.001295328140258789, -0.0011681020259857178, -0.0010408759117126465, -0.0009136497974395752, -0.0007864236831665039, -0.0006591975688934326, -0.0005319714546203613, -0.00040474534034729004, -0.00027751922607421875, -0.00015029311180114746, -2.3066997528076172e-05, 0.00010415911674499512, 0.0002313852310180664, 0.0003586113452911377, 0.000485837459564209, 0.0006130635738372803, 0.0007402896881103516, 0.0008675158023834229, 0.0009947419166564941, 0.0011219680309295654, 0.0012491941452026367, 0.001376420259475708, 0.0015036463737487793, 0.0016308724880218506, 0.0017580986022949219, 0.0018853247165679932, 0.0020125508308410645, 0.0021397769451141357, 0.002267003059387207, 0.0023942291736602783, 0.0025214552879333496, 0.002648681402206421, 0.002775907516479492, 0.0029031336307525635, 0.0030303597450256348, 0.003157585859298706, 0.0032848119735717773, 0.0034120380878448486, 0.00353926420211792, 0.003666490316390991, 0.0037937164306640625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 11.0, 3.0, 11.0, 9.0, 8.0, 12.0, 11.0, 11.0, 19.0, 20.0, 24.0, 24.0, 21.0, 35.0, 40.0, 36.0, 42.0, 44.0, 47.0, 49.0, 51.0, 42.0, 43.0, 38.0, 29.0, 31.0, 35.0, 40.0, 33.0, 27.0, 20.0, 16.0, 20.0, 17.0, 20.0, 10.0, 6.0, 8.0, 16.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.01067352294921875, -0.010328173637390137, -0.009982824325561523, -0.00963747501373291, -0.009292125701904297, -0.008946776390075684, -0.00860142707824707, -0.008256077766418457, -0.007910728454589844, -0.0075653791427612305, -0.007220029830932617, -0.006874680519104004, -0.006529331207275391, -0.006183981895446777, -0.005838632583618164, -0.005493283271789551, -0.0051479339599609375, -0.004802584648132324, -0.004457235336303711, -0.004111886024475098, -0.0037665367126464844, -0.003421187400817871, -0.003075838088989258, -0.0027304887771606445, -0.0023851394653320312, -0.002039790153503418, -0.0016944408416748047, -0.0013490915298461914, -0.0010037422180175781, -0.0006583929061889648, -0.00031304359436035156, 3.230571746826172e-05, 0.000377655029296875, 0.0007230043411254883, 0.0010683536529541016, 0.0014137029647827148, 0.0017590522766113281, 0.0021044015884399414, 0.0024497509002685547, 0.002795100212097168, 0.0031404495239257812, 0.0034857988357543945, 0.003831148147583008, 0.004176497459411621, 0.004521846771240234, 0.004867196083068848, 0.005212545394897461, 0.005557894706726074, 0.0059032440185546875, 0.006248593330383301, 0.006593942642211914, 0.006939291954040527, 0.007284641265869141, 0.007629990577697754, 0.007975339889526367, 0.00832068920135498, 0.008666038513183594, 0.009011387825012207, 0.00935673713684082, 0.009702086448669434, 0.010047435760498047, 0.01039278507232666, 0.010738134384155273, 0.011083483695983887, 0.0114288330078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 13.0, 10.0, 14.0, 22.0, 46.0, 63.0, 89.0, 148.0, 243.0, 383.0, 663.0, 1264.0, 2450.0, 5363.0, 12850.0, 36830.0, 135403.0, 596869.0, 180712.0, 47304.0, 15473.0, 6353.0, 2747.0, 1373.0, 757.0, 405.0, 270.0, 149.0, 80.0, 81.0, 45.0, 30.0, 18.0, 12.0, 7.0, 7.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0013113021850585938, -0.0012684464454650879, -0.001225590705871582, -0.0011827349662780762, -0.0011398792266845703, -0.0010970234870910645, -0.0010541677474975586, -0.0010113120079040527, -0.0009684562683105469, -0.000925600528717041, -0.0008827447891235352, -0.0008398890495300293, -0.0007970333099365234, -0.0007541775703430176, -0.0007113218307495117, -0.0006684660911560059, -0.0006256103515625, -0.0005827546119689941, -0.0005398988723754883, -0.0004970431327819824, -0.00045418739318847656, -0.0004113316535949707, -0.00036847591400146484, -0.000325620174407959, -0.0002827644348144531, -0.00023990869522094727, -0.0001970529556274414, -0.00015419721603393555, -0.00011134147644042969, -6.848573684692383e-05, -2.562999725341797e-05, 1.722574234008789e-05, 6.008148193359375e-05, 0.00010293722152709961, 0.00014579296112060547, 0.00018864870071411133, 0.0002315044403076172, 0.00027436017990112305, 0.0003172159194946289, 0.00036007165908813477, 0.0004029273986816406, 0.0004457831382751465, 0.0004886388778686523, 0.0005314946174621582, 0.0005743503570556641, 0.0006172060966491699, 0.0006600618362426758, 0.0007029175758361816, 0.0007457733154296875, 0.0007886290550231934, 0.0008314847946166992, 0.0008743405342102051, 0.0009171962738037109, 0.0009600520133972168, 0.0010029077529907227, 0.0010457634925842285, 0.0010886192321777344, 0.0011314749717712402, 0.001174330711364746, 0.001217186450958252, 0.0012600421905517578, 0.0013028979301452637, 0.0013457536697387695, 0.0013886094093322754, 0.0014314651489257812]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 1.0, 5.0, 13.0, 15.0, 17.0, 11.0, 22.0, 11.0, 27.0, 34.0, 37.0, 33.0, 42.0, 44.0, 23.0, 51.0, 50.0, 51.0, 63.0, 48.0, 50.0, 22.0, 55.0, 32.0, 32.0, 41.0, 23.0, 25.0, 12.0, 29.0, 19.0, 8.0, 11.0, 8.0, 4.0, 2.0, 7.0, 2.0, 6.0, 6.0, 1.0, 6.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.516674041748047e-06, -3.405846655368805e-06, -3.295019268989563e-06, -3.184191882610321e-06, -3.073364496231079e-06, -2.962537109851837e-06, -2.8517097234725952e-06, -2.7408823370933533e-06, -2.6300549507141113e-06, -2.5192275643348694e-06, -2.4084001779556274e-06, -2.2975727915763855e-06, -2.1867454051971436e-06, -2.0759180188179016e-06, -1.9650906324386597e-06, -1.8542632460594177e-06, -1.7434358596801758e-06, -1.6326084733009338e-06, -1.521781086921692e-06, -1.41095370054245e-06, -1.300126314163208e-06, -1.189298927783966e-06, -1.0784715414047241e-06, -9.676441550254822e-07, -8.568167686462402e-07, -7.459893822669983e-07, -6.351619958877563e-07, -5.243346095085144e-07, -4.1350722312927246e-07, -3.026798367500305e-07, -1.9185245037078857e-07, -8.102506399154663e-08, 2.9802322387695312e-08, 1.4062970876693726e-07, 2.514570951461792e-07, 3.6228448152542114e-07, 4.731118679046631e-07, 5.83939254283905e-07, 6.94766640663147e-07, 8.055940270423889e-07, 9.164214134216309e-07, 1.0272487998008728e-06, 1.1380761861801147e-06, 1.2489035725593567e-06, 1.3597309589385986e-06, 1.4705583453178406e-06, 1.5813857316970825e-06, 1.6922131180763245e-06, 1.8030405044555664e-06, 1.9138678908348083e-06, 2.0246952772140503e-06, 2.1355226635932922e-06, 2.246350049972534e-06, 2.357177436351776e-06, 2.468004822731018e-06, 2.57883220911026e-06, 2.689659595489502e-06, 2.800486981868744e-06, 2.911314368247986e-06, 3.0221417546272278e-06, 3.1329691410064697e-06, 3.2437965273857117e-06, 3.3546239137649536e-06, 3.4654513001441956e-06, 3.5762786865234375e-06]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 8.0, 9.0, 18.0, 16.0, 29.0, 32.0, 93.0, 148.0, 338.0, 736.0, 1945.0, 6300.0, 26188.0, 161684.0, 688880.0, 131252.0, 22221.0, 5483.0, 1798.0, 716.0, 308.0, 129.0, 82.0, 39.0, 32.0, 17.0, 16.0, 9.0, 7.0, 4.0, 4.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00225830078125, -0.002202466130256653, -0.0021466314792633057, -0.0020907968282699585, -0.0020349621772766113, -0.001979127526283264, -0.001923292875289917, -0.0018674582242965698, -0.0018116235733032227, -0.0017557889223098755, -0.0016999542713165283, -0.0016441196203231812, -0.001588284969329834, -0.0015324503183364868, -0.0014766156673431396, -0.0014207810163497925, -0.0013649463653564453, -0.0013091117143630981, -0.001253277063369751, -0.0011974424123764038, -0.0011416077613830566, -0.0010857731103897095, -0.0010299384593963623, -0.0009741038084030151, -0.000918269157409668, -0.0008624345064163208, -0.0008065998554229736, -0.0007507652044296265, -0.0006949305534362793, -0.0006390959024429321, -0.000583261251449585, -0.0005274266004562378, -0.0004715919494628906, -0.00041575729846954346, -0.0003599226474761963, -0.0003040879964828491, -0.00024825334548950195, -0.00019241869449615479, -0.00013658404350280762, -8.074939250946045e-05, -2.491474151611328e-05, 3.091990947723389e-05, 8.675456047058105e-05, 0.00014258921146392822, 0.0001984238624572754, 0.00025425851345062256, 0.0003100931644439697, 0.0003659278154373169, 0.00042176246643066406, 0.00047759711742401123, 0.0005334317684173584, 0.0005892664194107056, 0.0006451010704040527, 0.0007009357213973999, 0.0007567703723907471, 0.0008126050233840942, 0.0008684396743774414, 0.0009242743253707886, 0.0009801089763641357, 0.001035943627357483, 0.00109177827835083, 0.0011476129293441772, 0.0012034475803375244, 0.0012592822313308716, 0.0013151168823242188]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 10.0, 9.0, 17.0, 21.0, 21.0, 17.0, 26.0, 48.0, 56.0, 75.0, 84.0, 82.0, 89.0, 98.0, 78.0, 72.0, 50.0, 38.0, 33.0, 17.0, 15.0, 10.0, 14.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002483367919921875, -0.0024108588695526123, -0.0023383498191833496, -0.002265840768814087, -0.0021933317184448242, -0.0021208226680755615, -0.002048313617706299, -0.001975804567337036, -0.0019032955169677734, -0.0018307864665985107, -0.001758277416229248, -0.0016857683658599854, -0.0016132593154907227, -0.00154075026512146, -0.0014682412147521973, -0.0013957321643829346, -0.0013232231140136719, -0.0012507140636444092, -0.0011782050132751465, -0.0011056959629058838, -0.001033186912536621, -0.0009606778621673584, -0.0008881688117980957, -0.000815659761428833, -0.0007431507110595703, -0.0006706416606903076, -0.0005981326103210449, -0.0005256235599517822, -0.00045311450958251953, -0.00038060545921325684, -0.00030809640884399414, -0.00023558735847473145, -0.00016307830810546875, -9.056925773620605e-05, -1.806020736694336e-05, 5.4448843002319336e-05, 0.00012695789337158203, 0.00019946694374084473, 0.0002719759941101074, 0.0003444850444793701, 0.0004169940948486328, 0.0004895031452178955, 0.0005620121955871582, 0.0006345212459564209, 0.0007070302963256836, 0.0007795393466949463, 0.000852048397064209, 0.0009245574474334717, 0.0009970664978027344, 0.001069575548171997, 0.0011420845985412598, 0.0012145936489105225, 0.0012871026992797852, 0.0013596117496490479, 0.0014321208000183105, 0.0015046298503875732, 0.001577138900756836, 0.0016496479511260986, 0.0017221570014953613, 0.001794666051864624, 0.0018671751022338867, 0.0019396841526031494, 0.002012193202972412, 0.002084702253341675, 0.0021572113037109375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 9.0, 18.0, 31.0, 71.0, 220.0, 359.0, 181.0, 72.0, 24.0, 10.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04073881357908249, -0.03827570006251335, -0.035812586545944214, -0.033349473029375076, -0.03088635765016079, -0.028423244133591652, -0.025960128754377365, -0.023497015237808228, -0.02103390172123909, -0.018570788204669952, -0.016107674688100815, -0.013644559308886528, -0.01118144579231739, -0.008718332275748253, -0.006255217827856541, -0.0037921033799648285, -0.001328989863395691, 0.001134124118834734, 0.003597238101065159, 0.006060352083295584, 0.008523466065526009, 0.010986579582095146, 0.013449694029986858, 0.01591280847787857, 0.018375921994447708, 0.020839035511016846, 0.023302149027585983, 0.02576526440680027, 0.028228377923369408, 0.030691491439938545, 0.03315460681915283, 0.03561772033572197, 0.03808082640171051, 0.04054393991827965, 0.043007053434848785, 0.04547016695141792, 0.04793328046798706, 0.0503963977098465, 0.052859511226415634, 0.05532262474298477, 0.05778573825955391, 0.06024885177612305, 0.06271196901798248, 0.06517507880926132, 0.06763819605112076, 0.0701013058423996, 0.07256442308425903, 0.07502754032611847, 0.07749065011739731, 0.07995376735925674, 0.08241687715053558, 0.08487999439239502, 0.08734310418367386, 0.0898062214255333, 0.09226933121681213, 0.09473244845867157, 0.097195565700531, 0.09965868294239044, 0.10212179273366928, 0.10458490997552872, 0.10704801976680756, 0.10951113700866699, 0.11197424679994583, 0.11443736404180527, 0.1169004738330841]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 1.0, 4.0, 7.0, 3.0, 6.0, 5.0, 10.0, 15.0, 10.0, 16.0, 13.0, 15.0, 22.0, 27.0, 29.0, 25.0, 20.0, 31.0, 41.0, 41.0, 58.0, 60.0, 69.0, 56.0, 61.0, 35.0, 38.0, 30.0, 33.0, 14.0, 23.0, 21.0, 17.0, 18.0, 24.0, 11.0, 13.0, 14.0, 8.0, 7.0, 7.0, 5.0, 7.0, 10.0, 3.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.03861534595489502, -0.03742838278412819, -0.03624141961336136, -0.03505445271730423, -0.0338674895465374, -0.03268052637577057, -0.03149355947971344, -0.03030659630894661, -0.02911963313817978, -0.02793266996741295, -0.02674570493400097, -0.02555873990058899, -0.02437177672982216, -0.02318481355905533, -0.02199784852564335, -0.02081088349223137, -0.01962392032146454, -0.018436957150697708, -0.01724999211728573, -0.01606302708387375, -0.014876063913106918, -0.013689099811017513, -0.012502135708928108, -0.011315171606838703, -0.010128207504749298, -0.008941243402659893, -0.007754279300570488, -0.006567315198481083, -0.005380351096391678, -0.004193386994302273, -0.0030064228922128677, -0.0018194587901234627, -0.0006324946880340576, 0.0005544694140553474, 0.0017414335161447525, 0.0029283976182341576, 0.004115361720323563, 0.005302325822412968, 0.006489289924502373, 0.007676254026591778, 0.008863218128681183, 0.010050182230770588, 0.011237146332859993, 0.012424110434949398, 0.013611074537038803, 0.014798038639128208, 0.015985002741217613, 0.017171967774629593, 0.018358930945396423, 0.019545894116163254, 0.020732859149575233, 0.021919824182987213, 0.023106787353754044, 0.024293750524520874, 0.025480715557932854, 0.026667680591344833, 0.027854643762111664, 0.029041606932878494, 0.030228571966290474, 0.031415536999702454, 0.032602500170469284, 0.033789463341236115, 0.03497643023729324, 0.036163393408060074, 0.037350356578826904]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 6.0, 11.0, 9.0, 17.0, 41.0, 97.0, 197.0, 310.0, 518.0, 972.0, 1897.0, 3573.0, 7771.0, 21326.0, 95203.0, 709223.0, 2688535.0, 556991.0, 79129.0, 17740.0, 5568.0, 2523.0, 1288.0, 658.0, 350.0, 143.0, 66.0, 42.0, 20.0, 16.0, 8.0, 11.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0032825469970703125, -0.0031899213790893555, -0.0030972957611083984, -0.0030046701431274414, -0.0029120445251464844, -0.0028194189071655273, -0.0027267932891845703, -0.0026341676712036133, -0.0025415420532226562, -0.0024489164352416992, -0.002356290817260742, -0.002263665199279785, -0.002171039581298828, -0.002078413963317871, -0.001985788345336914, -0.001893162727355957, -0.001800537109375, -0.001707911491394043, -0.001615285873413086, -0.001522660255432129, -0.0014300346374511719, -0.0013374090194702148, -0.0012447834014892578, -0.0011521577835083008, -0.0010595321655273438, -0.0009669065475463867, -0.0008742809295654297, -0.0007816553115844727, -0.0006890296936035156, -0.0005964040756225586, -0.0005037784576416016, -0.00041115283966064453, -0.0003185272216796875, -0.00022590160369873047, -0.00013327598571777344, -4.0650367736816406e-05, 5.1975250244140625e-05, 0.00014460086822509766, 0.0002372264862060547, 0.0003298521041870117, 0.00042247772216796875, 0.0005151033401489258, 0.0006077289581298828, 0.0007003545761108398, 0.0007929801940917969, 0.0008856058120727539, 0.000978231430053711, 0.001070857048034668, 0.001163482666015625, 0.001256108283996582, 0.001348733901977539, 0.001441359519958496, 0.0015339851379394531, 0.0016266107559204102, 0.0017192363739013672, 0.0018118619918823242, 0.0019044876098632812, 0.0019971132278442383, 0.0020897388458251953, 0.0021823644638061523, 0.0022749900817871094, 0.0023676156997680664, 0.0024602413177490234, 0.0025528669357299805, 0.0026454925537109375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 7.0, 5.0, 6.0, 13.0, 19.0, 28.0, 46.0, 78.0, 109.0, 109.0, 139.0, 137.0, 106.0, 82.0, 33.0, 35.0, 25.0, 11.0, 7.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007293701171875, -0.007038474082946777, -0.006783246994018555, -0.006528019905090332, -0.006272792816162109, -0.006017565727233887, -0.005762338638305664, -0.005507111549377441, -0.005251884460449219, -0.004996657371520996, -0.0047414302825927734, -0.004486203193664551, -0.004230976104736328, -0.0039757490158081055, -0.003720521926879883, -0.00346529483795166, -0.0032100677490234375, -0.002954840660095215, -0.002699613571166992, -0.0024443864822387695, -0.002189159393310547, -0.0019339323043823242, -0.0016787052154541016, -0.001423478126525879, -0.0011682510375976562, -0.0009130239486694336, -0.0006577968597412109, -0.0004025697708129883, -0.00014734268188476562, 0.00010788440704345703, 0.0003631114959716797, 0.0006183385848999023, 0.000873565673828125, 0.0011287927627563477, 0.0013840198516845703, 0.001639246940612793, 0.0018944740295410156, 0.0021497011184692383, 0.002404928207397461, 0.0026601552963256836, 0.0029153823852539062, 0.003170609474182129, 0.0034258365631103516, 0.0036810636520385742, 0.003936290740966797, 0.0041915178298950195, 0.004446744918823242, 0.004701972007751465, 0.0049571990966796875, 0.00521242618560791, 0.005467653274536133, 0.0057228803634643555, 0.005978107452392578, 0.006233334541320801, 0.0064885616302490234, 0.006743788719177246, 0.006999015808105469, 0.007254242897033691, 0.007509469985961914, 0.007764697074890137, 0.00801992416381836, 0.008275151252746582, 0.008530378341674805, 0.008785605430603027, 0.00904083251953125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 15.0, 25.0, 37.0, 87.0, 159.0, 312.0, 12087.0, 4179898.0, 1242.0, 205.0, 120.0, 57.0, 29.0, 12.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0291595458984375, -0.028197050094604492, -0.027234554290771484, -0.026272058486938477, -0.02530956268310547, -0.02434706687927246, -0.023384571075439453, -0.022422075271606445, -0.021459579467773438, -0.02049708366394043, -0.019534587860107422, -0.018572092056274414, -0.017609596252441406, -0.0166471004486084, -0.01568460464477539, -0.014722108840942383, -0.013759613037109375, -0.012797117233276367, -0.01183462142944336, -0.010872125625610352, -0.009909629821777344, -0.008947134017944336, -0.007984638214111328, -0.00702214241027832, -0.0060596466064453125, -0.005097150802612305, -0.004134654998779297, -0.003172159194946289, -0.0022096633911132812, -0.0012471675872802734, -0.0002846717834472656, 0.0006778240203857422, 0.00164031982421875, 0.002602815628051758, 0.0035653114318847656, 0.0045278072357177734, 0.005490303039550781, 0.006452798843383789, 0.007415294647216797, 0.008377790451049805, 0.009340286254882812, 0.01030278205871582, 0.011265277862548828, 0.012227773666381836, 0.013190269470214844, 0.014152765274047852, 0.01511526107788086, 0.016077756881713867, 0.017040252685546875, 0.018002748489379883, 0.01896524429321289, 0.0199277400970459, 0.020890235900878906, 0.021852731704711914, 0.022815227508544922, 0.02377772331237793, 0.024740219116210938, 0.025702714920043945, 0.026665210723876953, 0.02762770652770996, 0.02859020233154297, 0.029552698135375977, 0.030515193939208984, 0.03147768974304199, 0.032440185546875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 10.0, 19.0, 55.0, 239.0, 1018.0, 1830.0, 701.0, 142.0, 33.0, 11.0, 8.0, 7.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.018707275390625, -0.01834315061569214, -0.017979025840759277, -0.017614901065826416, -0.017250776290893555, -0.016886651515960693, -0.016522526741027832, -0.01615840196609497, -0.01579427719116211, -0.015430152416229248, -0.015066027641296387, -0.014701902866363525, -0.014337778091430664, -0.013973653316497803, -0.013609528541564941, -0.01324540376663208, -0.012881278991699219, -0.012517154216766357, -0.012153029441833496, -0.011788904666900635, -0.011424779891967773, -0.011060655117034912, -0.01069653034210205, -0.01033240556716919, -0.009968280792236328, -0.009604156017303467, -0.009240031242370605, -0.008875906467437744, -0.008511781692504883, -0.008147656917572021, -0.00778353214263916, -0.007419407367706299, -0.0070552825927734375, -0.006691157817840576, -0.006327033042907715, -0.0059629082679748535, -0.005598783493041992, -0.005234658718109131, -0.0048705339431762695, -0.004506409168243408, -0.004142284393310547, -0.0037781596183776855, -0.0034140348434448242, -0.003049910068511963, -0.0026857852935791016, -0.0023216605186462402, -0.001957535743713379, -0.0015934109687805176, -0.0012292861938476562, -0.0008651614189147949, -0.0005010366439819336, -0.00013691186904907227, 0.00022721290588378906, 0.0005913376808166504, 0.0009554624557495117, 0.001319587230682373, 0.0016837120056152344, 0.0020478367805480957, 0.002411961555480957, 0.0027760863304138184, 0.0031402111053466797, 0.003504335880279541, 0.0038684606552124023, 0.004232585430145264, 0.004596710205078125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 11.0, 8.0, 11.0, 19.0, 36.0, 68.0, 128.0, 164.0, 197.0, 157.0, 95.0, 61.0, 22.0, 10.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05580972880125046, -0.054664552211761475, -0.05351937562227249, -0.05237419903278351, -0.051229022443294525, -0.05008384585380554, -0.04893866926431656, -0.047793492674827576, -0.04664831608533859, -0.04550313949584961, -0.044357962906360626, -0.04321278631687164, -0.04206760972738266, -0.04092243313789368, -0.039777256548404694, -0.03863207995891571, -0.03748689964413643, -0.036341723054647446, -0.03519654646515846, -0.03405136987566948, -0.032906193286180496, -0.03176101669669151, -0.03061583824455738, -0.029470661655068398, -0.028325485065579414, -0.02718030847609043, -0.026035131886601448, -0.024889955297112465, -0.023744776844978333, -0.02259960025548935, -0.021454423666000366, -0.020309247076511383, -0.0191640704870224, -0.018018893897533417, -0.016873717308044434, -0.01572854071855545, -0.014583363197743893, -0.01343818660825491, -0.012293009087443352, -0.011147832497954369, -0.010002655908465385, -0.008857479318976402, -0.007712302263826132, -0.006567125208675861, -0.005421948619186878, -0.004276772029697895, -0.0031315949745476246, -0.001986417919397354, -0.000841241329908371, 0.00030393549241125584, 0.0014491123147308826, 0.0025942891370505095, 0.0037394659593701363, 0.004884642548859119, 0.00602981960400939, 0.00717499665915966, 0.008320173248648643, 0.009465349838137627, 0.01061052642762661, 0.011755703948438168, 0.01290088053792715, 0.014046057127416134, 0.015191234648227692, 0.016336411237716675, 0.017481587827205658]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 8.0, 8.0, 8.0, 7.0, 10.0, 8.0, 11.0, 17.0, 22.0, 25.0, 30.0, 26.0, 42.0, 27.0, 44.0, 31.0, 37.0, 51.0, 38.0, 36.0, 45.0, 43.0, 45.0, 50.0, 43.0, 45.0, 34.0, 28.0, 40.0, 21.0, 17.0, 19.0, 19.0, 14.0, 10.0, 13.0, 10.0, 12.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.02270883321762085, -0.022083088755607605, -0.02145734243094921, -0.020831596106290817, -0.020205851644277573, -0.019580107182264328, -0.018954360857605934, -0.01832861453294754, -0.017702870070934296, -0.01707712560892105, -0.016451379284262657, -0.015825632959604263, -0.015199888497591019, -0.0145741431042552, -0.01394839771091938, -0.013322652317583561, -0.012696906924247742, -0.012071161530911922, -0.011445416137576103, -0.010819670744240284, -0.010193925350904465, -0.009568179957568645, -0.008942434564232826, -0.008316689170897007, -0.007690943777561188, -0.0070651983842253685, -0.006439452990889549, -0.00581370759755373, -0.005187962204217911, -0.0045622168108820915, -0.003936471417546272, -0.003310726024210453, -0.002684980630874634, -0.0020592352375388145, -0.0014334898442029953, -0.0008077444508671761, -0.0001819990575313568, 0.00044374633580446243, 0.0010694917291402817, 0.001695237122476101, 0.00232098251581192, 0.0029467279091477394, 0.0035724733024835587, 0.004198218695819378, 0.004823964089155197, 0.005449709482491016, 0.006075454875826836, 0.006701200269162655, 0.007326945662498474, 0.007952691055834293, 0.008578436449170113, 0.009204181842505932, 0.009829927235841751, 0.01045567262917757, 0.01108141802251339, 0.011707163415849209, 0.012332908809185028, 0.012958654202520847, 0.013584399595856667, 0.014210144989192486, 0.014835890382528305, 0.015461635775864124, 0.016087381169199944, 0.016713127493858337, 0.017338871955871582]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 3.0, 13.0, 7.0, 18.0, 18.0, 34.0, 36.0, 57.0, 65.0, 91.0, 173.0, 249.0, 342.0, 497.0, 899.0, 1542.0, 3028.0, 6425.0, 15433.0, 44192.0, 142244.0, 395205.0, 295419.0, 91313.0, 29675.0, 10919.0, 4808.0, 2374.0, 1247.0, 782.0, 458.0, 339.0, 186.0, 117.0, 108.0, 64.0, 49.0, 29.0, 32.0, 23.0, 12.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.004314422607421875, -0.004178822040557861, -0.004043221473693848, -0.003907620906829834, -0.0037720203399658203, -0.0036364197731018066, -0.003500819206237793, -0.0033652186393737793, -0.0032296180725097656, -0.003094017505645752, -0.0029584169387817383, -0.0028228163719177246, -0.002687215805053711, -0.0025516152381896973, -0.0024160146713256836, -0.00228041410446167, -0.0021448135375976562, -0.0020092129707336426, -0.001873612403869629, -0.0017380118370056152, -0.0016024112701416016, -0.0014668107032775879, -0.0013312101364135742, -0.0011956095695495605, -0.0010600090026855469, -0.0009244084358215332, -0.0007888078689575195, -0.0006532073020935059, -0.0005176067352294922, -0.0003820061683654785, -0.00024640560150146484, -0.00011080503463745117, 2.47955322265625e-05, 0.00016039609909057617, 0.00029599666595458984, 0.0004315972328186035, 0.0005671977996826172, 0.0007027983665466309, 0.0008383989334106445, 0.0009739995002746582, 0.0011096000671386719, 0.0012452006340026855, 0.0013808012008666992, 0.0015164017677307129, 0.0016520023345947266, 0.0017876029014587402, 0.001923203468322754, 0.0020588040351867676, 0.0021944046020507812, 0.002330005168914795, 0.0024656057357788086, 0.0026012063026428223, 0.002736806869506836, 0.0028724074363708496, 0.0030080080032348633, 0.003143608570098877, 0.0032792091369628906, 0.0034148097038269043, 0.003550410270690918, 0.0036860108375549316, 0.0038216114044189453, 0.003957211971282959, 0.004092812538146973, 0.004228413105010986, 0.004364013671875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 13.0, 20.0, 27.0, 58.0, 80.0, 99.0, 120.0, 138.0, 139.0, 105.0, 59.0, 42.0, 35.0, 23.0, 12.0, 13.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007266998291015625, -0.007012307643890381, -0.006757616996765137, -0.006502926349639893, -0.0062482357025146484, -0.005993545055389404, -0.00573885440826416, -0.005484163761138916, -0.005229473114013672, -0.004974782466888428, -0.004720091819763184, -0.0044654011726379395, -0.004210710525512695, -0.003956019878387451, -0.003701329231262207, -0.003446638584136963, -0.0031919479370117188, -0.0029372572898864746, -0.0026825666427612305, -0.0024278759956359863, -0.002173185348510742, -0.001918494701385498, -0.001663804054260254, -0.0014091134071350098, -0.0011544227600097656, -0.0008997321128845215, -0.0006450414657592773, -0.0003903508186340332, -0.00013566017150878906, 0.00011903047561645508, 0.0003737211227416992, 0.0006284117698669434, 0.0008831024169921875, 0.0011377930641174316, 0.0013924837112426758, 0.00164717435836792, 0.001901865005493164, 0.002156555652618408, 0.0024112462997436523, 0.0026659369468688965, 0.0029206275939941406, 0.0031753182411193848, 0.003430008888244629, 0.003684699535369873, 0.003939390182495117, 0.004194080829620361, 0.0044487714767456055, 0.00470346212387085, 0.004958152770996094, 0.005212843418121338, 0.005467534065246582, 0.005722224712371826, 0.00597691535949707, 0.0062316060066223145, 0.006486296653747559, 0.006740987300872803, 0.006995677947998047, 0.007250368595123291, 0.007505059242248535, 0.007759749889373779, 0.008014440536499023, 0.008269131183624268, 0.008523821830749512, 0.008778512477874756, 0.009033203125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 9.0, 4.0, 9.0, 12.0, 14.0, 26.0, 35.0, 66.0, 76.0, 91.0, 144.0, 215.0, 297.0, 525.0, 1034.0, 2885.0, 14107.0, 100670.0, 700285.0, 195442.0, 25053.0, 4567.0, 1388.0, 597.0, 387.0, 210.0, 112.0, 83.0, 66.0, 53.0, 27.0, 24.0, 10.0, 11.0, 9.0, 2.0, 4.0, 2.0, 2.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007518768310546875, -0.007265269756317139, -0.007011771202087402, -0.006758272647857666, -0.00650477409362793, -0.006251275539398193, -0.005997776985168457, -0.005744278430938721, -0.005490779876708984, -0.005237281322479248, -0.004983782768249512, -0.004730284214019775, -0.004476785659790039, -0.004223287105560303, -0.003969788551330566, -0.00371628999710083, -0.0034627914428710938, -0.0032092928886413574, -0.002955794334411621, -0.0027022957801818848, -0.0024487972259521484, -0.002195298671722412, -0.0019418001174926758, -0.0016883015632629395, -0.0014348030090332031, -0.0011813044548034668, -0.0009278059005737305, -0.0006743073463439941, -0.0004208087921142578, -0.00016731023788452148, 8.618831634521484e-05, 0.00033968687057495117, 0.0005931854248046875, 0.0008466839790344238, 0.0011001825332641602, 0.0013536810874938965, 0.0016071796417236328, 0.0018606781959533691, 0.0021141767501831055, 0.002367675304412842, 0.002621173858642578, 0.0028746724128723145, 0.0031281709671020508, 0.003381669521331787, 0.0036351680755615234, 0.0038886666297912598, 0.004142165184020996, 0.004395663738250732, 0.004649162292480469, 0.004902660846710205, 0.005156159400939941, 0.005409657955169678, 0.005663156509399414, 0.00591665506362915, 0.006170153617858887, 0.006423652172088623, 0.006677150726318359, 0.006930649280548096, 0.007184147834777832, 0.007437646389007568, 0.007691144943237305, 0.007944643497467041, 0.008198142051696777, 0.008451640605926514, 0.00870513916015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 6.0, 4.0, 9.0, 8.0, 13.0, 15.0, 21.0, 16.0, 18.0, 33.0, 27.0, 34.0, 47.0, 61.0, 56.0, 40.0, 59.0, 55.0, 71.0, 53.0, 52.0, 53.0, 33.0, 40.0, 38.0, 37.0, 26.0, 23.0, 11.0, 12.0, 9.0, 9.0, 4.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01279449462890625, -0.01235342025756836, -0.011912345886230469, -0.011471271514892578, -0.011030197143554688, -0.010589122772216797, -0.010148048400878906, -0.009706974029541016, -0.009265899658203125, -0.008824825286865234, -0.008383750915527344, -0.007942676544189453, -0.0075016021728515625, -0.007060527801513672, -0.006619453430175781, -0.006178379058837891, -0.0057373046875, -0.005296230316162109, -0.004855155944824219, -0.004414081573486328, -0.0039730072021484375, -0.003531932830810547, -0.0030908584594726562, -0.0026497840881347656, -0.002208709716796875, -0.0017676353454589844, -0.0013265609741210938, -0.0008854866027832031, -0.0004444122314453125, -3.337860107421875e-06, 0.00043773651123046875, 0.0008788108825683594, 0.00131988525390625, 0.0017609596252441406, 0.0022020339965820312, 0.002643108367919922, 0.0030841827392578125, 0.003525257110595703, 0.003966331481933594, 0.004407405853271484, 0.004848480224609375, 0.005289554595947266, 0.005730628967285156, 0.006171703338623047, 0.0066127777099609375, 0.007053852081298828, 0.007494926452636719, 0.00793600082397461, 0.0083770751953125, 0.00881814956665039, 0.009259223937988281, 0.009700298309326172, 0.010141372680664062, 0.010582447052001953, 0.011023521423339844, 0.011464595794677734, 0.011905670166015625, 0.012346744537353516, 0.012787818908691406, 0.013228893280029297, 0.013669967651367188, 0.014111042022705078, 0.014552116394042969, 0.01499319076538086, 0.01543426513671875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 6.0, 10.0, 16.0, 12.0, 12.0, 27.0, 40.0, 65.0, 85.0, 119.0, 225.0, 319.0, 563.0, 975.0, 1988.0, 4015.0, 9436.0, 23828.0, 69410.0, 240658.0, 544790.0, 97648.0, 31869.0, 11990.0, 5115.0, 2319.0, 1245.0, 690.0, 382.0, 219.0, 141.0, 93.0, 62.0, 43.0, 38.0, 27.0, 14.0, 12.0, 14.0, 11.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010242462158203125, -0.0009913593530654907, -0.0009584724903106689, -0.0009255856275558472, -0.0008926987648010254, -0.0008598119020462036, -0.0008269250392913818, -0.0007940381765365601, -0.0007611513137817383, -0.0007282644510269165, -0.0006953775882720947, -0.000662490725517273, -0.0006296038627624512, -0.0005967170000076294, -0.0005638301372528076, -0.0005309432744979858, -0.0004980564117431641, -0.0004651695489883423, -0.0004322826862335205, -0.00039939582347869873, -0.00036650896072387695, -0.0003336220979690552, -0.0003007352352142334, -0.0002678483724594116, -0.00023496150970458984, -0.00020207464694976807, -0.0001691877841949463, -0.0001363009214401245, -0.00010341405868530273, -7.052719593048096e-05, -3.764033317565918e-05, -4.753470420837402e-06, 2.8133392333984375e-05, 6.102025508880615e-05, 9.390711784362793e-05, 0.0001267939805984497, 0.00015968084335327148, 0.00019256770610809326, 0.00022545456886291504, 0.0002583414316177368, 0.0002912282943725586, 0.00032411515712738037, 0.00035700201988220215, 0.0003898888826370239, 0.0004227757453918457, 0.0004556626081466675, 0.0004885494709014893, 0.000521436333656311, 0.0005543231964111328, 0.0005872100591659546, 0.0006200969219207764, 0.0006529837846755981, 0.0006858706474304199, 0.0007187575101852417, 0.0007516443729400635, 0.0007845312356948853, 0.000817418098449707, 0.0008503049612045288, 0.0008831918239593506, 0.0009160786867141724, 0.0009489655494689941, 0.000981852412223816, 0.0010147392749786377, 0.0010476261377334595, 0.0010805130004882812]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 5.0, 7.0, 2.0, 11.0, 12.0, 6.0, 13.0, 18.0, 18.0, 28.0, 27.0, 19.0, 17.0, 37.0, 40.0, 29.0, 51.0, 37.0, 53.0, 21.0, 51.0, 49.0, 34.0, 48.0, 53.0, 33.0, 30.0, 39.0, 46.0, 9.0, 33.0, 24.0, 10.0, 19.0, 19.0, 14.0, 11.0, 9.0, 8.0, 2.0, 6.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.2782554626464844e-06, -3.1767413020133972e-06, -3.07522714138031e-06, -2.973712980747223e-06, -2.8721988201141357e-06, -2.7706846594810486e-06, -2.6691704988479614e-06, -2.5676563382148743e-06, -2.466142177581787e-06, -2.3646280169487e-06, -2.263113856315613e-06, -2.1615996956825256e-06, -2.0600855350494385e-06, -1.9585713744163513e-06, -1.8570572137832642e-06, -1.755543053150177e-06, -1.6540288925170898e-06, -1.5525147318840027e-06, -1.4510005712509155e-06, -1.3494864106178284e-06, -1.2479722499847412e-06, -1.146458089351654e-06, -1.044943928718567e-06, -9.434297680854797e-07, -8.419156074523926e-07, -7.404014468193054e-07, -6.388872861862183e-07, -5.373731255531311e-07, -4.3585896492004395e-07, -3.343448042869568e-07, -2.3283064365386963e-07, -1.3131648302078247e-07, -2.9802322387695312e-08, 7.171183824539185e-08, 1.73225998878479e-07, 2.7474015951156616e-07, 3.762543201446533e-07, 4.777684807777405e-07, 5.792826414108276e-07, 6.807968020439148e-07, 7.82310962677002e-07, 8.838251233100891e-07, 9.853392839431763e-07, 1.0868534445762634e-06, 1.1883676052093506e-06, 1.2898817658424377e-06, 1.391395926475525e-06, 1.492910087108612e-06, 1.5944242477416992e-06, 1.6959384083747864e-06, 1.7974525690078735e-06, 1.8989667296409607e-06, 2.000480890274048e-06, 2.101995050907135e-06, 2.203509211540222e-06, 2.3050233721733093e-06, 2.4065375328063965e-06, 2.5080516934394836e-06, 2.609565854072571e-06, 2.711080014705658e-06, 2.812594175338745e-06, 2.9141083359718323e-06, 3.0156224966049194e-06, 3.1171366572380066e-06, 3.2186508178710938e-06]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 11.0, 10.0, 11.0, 14.0, 15.0, 23.0, 24.0, 41.0, 48.0, 74.0, 134.0, 160.0, 263.0, 422.0, 743.0, 1444.0, 3156.0, 7919.0, 21241.0, 65472.0, 242010.0, 556248.0, 99473.0, 30298.0, 10812.0, 4184.0, 1892.0, 950.0, 512.0, 307.0, 197.0, 121.0, 86.0, 60.0, 46.0, 33.0, 20.0, 16.0, 18.0, 8.0, 9.0, 9.0, 8.0, 6.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.0011358261108398438, -0.0011025816202163696, -0.0010693371295928955, -0.0010360926389694214, -0.0010028481483459473, -0.0009696036577224731, -0.000936359167098999, -0.0009031146764755249, -0.0008698701858520508, -0.0008366256952285767, -0.0008033812046051025, -0.0007701367139816284, -0.0007368922233581543, -0.0007036477327346802, -0.0006704032421112061, -0.0006371587514877319, -0.0006039142608642578, -0.0005706697702407837, -0.0005374252796173096, -0.0005041807889938354, -0.00047093629837036133, -0.0004376918077468872, -0.0004044473171234131, -0.00037120282649993896, -0.00033795833587646484, -0.0003047138452529907, -0.0002714693546295166, -0.00023822486400604248, -0.00020498037338256836, -0.00017173588275909424, -0.00013849139213562012, -0.000105246901512146, -7.200241088867188e-05, -3.8757920265197754e-05, -5.513429641723633e-06, 2.7731060981750488e-05, 6.097555160522461e-05, 9.422004222869873e-05, 0.00012746453285217285, 0.00016070902347564697, 0.0001939535140991211, 0.00022719800472259521, 0.00026044249534606934, 0.00029368698596954346, 0.0003269314765930176, 0.0003601759672164917, 0.0003934204578399658, 0.00042666494846343994, 0.00045990943908691406, 0.0004931539297103882, 0.0005263984203338623, 0.0005596429109573364, 0.0005928874015808105, 0.0006261318922042847, 0.0006593763828277588, 0.0006926208734512329, 0.000725865364074707, 0.0007591098546981812, 0.0007923543453216553, 0.0008255988359451294, 0.0008588433265686035, 0.0008920878171920776, 0.0009253323078155518, 0.0009585767984390259, 0.0009918212890625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 6.0, 7.0, 5.0, 10.0, 6.0, 10.0, 11.0, 20.0, 23.0, 31.0, 25.0, 43.0, 47.0, 50.0, 53.0, 76.0, 71.0, 64.0, 64.0, 52.0, 62.0, 49.0, 39.0, 41.0, 25.0, 18.0, 16.0, 8.0, 10.0, 9.0, 9.0, 5.0, 2.0, 7.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013856887817382812, -0.0013398975133895874, -0.0012941062450408936, -0.0012483149766921997, -0.0012025237083435059, -0.001156732439994812, -0.0011109411716461182, -0.0010651499032974243, -0.0010193586349487305, -0.0009735673666000366, -0.0009277760982513428, -0.0008819848299026489, -0.0008361935615539551, -0.0007904022932052612, -0.0007446110248565674, -0.0006988197565078735, -0.0006530284881591797, -0.0006072372198104858, -0.000561445951461792, -0.0005156546831130981, -0.0004698634147644043, -0.00042407214641571045, -0.0003782808780670166, -0.00033248960971832275, -0.0002866983413696289, -0.00024090707302093506, -0.0001951158046722412, -0.00014932453632354736, -0.00010353326797485352, -5.774199962615967e-05, -1.195073127746582e-05, 3.384053707122803e-05, 7.963180541992188e-05, 0.00012542307376861572, 0.00017121434211730957, 0.00021700561046600342, 0.00026279687881469727, 0.0003085881471633911, 0.00035437941551208496, 0.0004001706838607788, 0.00044596195220947266, 0.0004917532205581665, 0.0005375444889068604, 0.0005833357572555542, 0.000629127025604248, 0.0006749182939529419, 0.0007207095623016357, 0.0007665008306503296, 0.0008122920989990234, 0.0008580833673477173, 0.0009038746356964111, 0.000949665904045105, 0.0009954571723937988, 0.0010412484407424927, 0.0010870397090911865, 0.0011328309774398804, 0.0011786222457885742, 0.001224413514137268, 0.001270204782485962, 0.0013159960508346558, 0.0013617873191833496, 0.0014075785875320435, 0.0014533698558807373, 0.0014991611242294312, 0.001544952392578125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 14.0, 16.0, 31.0, 56.0, 79.0, 132.0, 238.0, 179.0, 91.0, 56.0, 39.0, 18.0, 13.0, 9.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05052497237920761, -0.04925081506371498, -0.04797666147351265, -0.04670250415802002, -0.04542835056781769, -0.04415419325232506, -0.04288003593683243, -0.041605882346630096, -0.040331725031137466, -0.039057567715644836, -0.037783414125442505, -0.036509256809949875, -0.03523510321974754, -0.03396094590425491, -0.03268679231405258, -0.03141263499855995, -0.03013847954571247, -0.02886432409286499, -0.02759016864001751, -0.02631601318717003, -0.0250418558716774, -0.023767700418829918, -0.022493544965982437, -0.021219387650489807, -0.019945234060287476, -0.018671078607439995, -0.017396923154592514, -0.016122765839099884, -0.014848610386252403, -0.013574454933404922, -0.012300299480557442, -0.011026143096387386, -0.00975198857486248, -0.008477833122015, -0.007203676737844944, -0.005929521284997463, -0.004655365366488695, -0.003381209447979927, -0.0021070539951324463, -0.0008328976109623909, 0.0004412578418850899, 0.0017154136439785361, 0.0029895694460719824, 0.004263725131750107, 0.005537881050258875, 0.006812036968767643, 0.008086192421615124, 0.00936034880578518, 0.01063450425863266, 0.01190865971148014, 0.013182816095650196, 0.014456971548497677, 0.015731127932667732, 0.017005283385515213, 0.018279438838362694, 0.019553594291210175, 0.020827751606702805, 0.022101907059550285, 0.023376062512397766, 0.024650219827890396, 0.025924375280737877, 0.027198530733585358, 0.02847268618643284, 0.02974684163928032, 0.0310209970921278]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 6.0, 5.0, 5.0, 9.0, 11.0, 13.0, 15.0, 15.0, 11.0, 22.0, 16.0, 29.0, 30.0, 34.0, 21.0, 32.0, 30.0, 34.0, 66.0, 93.0, 81.0, 57.0, 31.0, 39.0, 22.0, 32.0, 31.0, 21.0, 19.0, 19.0, 19.0, 16.0, 20.0, 12.0, 12.0, 4.0, 13.0, 7.0, 7.0, 6.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03422337770462036, -0.03304683044552803, -0.0318702831864357, -0.03069373220205307, -0.02951718494296074, -0.028340637683868408, -0.027164088562130928, -0.025987539440393448, -0.024810992181301117, -0.023634444922208786, -0.022457895800471306, -0.021281346678733826, -0.020104799419641495, -0.018928252160549164, -0.017751703038811684, -0.016575153917074203, -0.015398606657981873, -0.014222058467566967, -0.013045510277152061, -0.011868962086737156, -0.01069241389632225, -0.009515865705907345, -0.00833931751549244, -0.007162769325077534, -0.005986221134662628, -0.004809672944247723, -0.003633124753832817, -0.0024565765634179115, -0.001280028373003006, -0.00010348018258810043, 0.0010730680078268051, 0.0022496161982417107, 0.003426164388656616, 0.004602712579071522, 0.005779260769486427, 0.006955808959901333, 0.008132357150316238, 0.009308905340731144, 0.01048545353114605, 0.011662001721560955, 0.01283854991197586, 0.014015098102390766, 0.015191646292805672, 0.016368195414543152, 0.017544742673635483, 0.018721289932727814, 0.019897839054465294, 0.021074388176202774, 0.022250935435295105, 0.023427482694387436, 0.024604031816124916, 0.025780580937862396, 0.026957128196954727, 0.028133675456047058, 0.02931022457778454, 0.03048677369952202, 0.03166332095861435, 0.03283986821770668, 0.03401641547679901, 0.03519296646118164, 0.03636951372027397, 0.0375460609793663, 0.03872261196374893, 0.03989915922284126, 0.041075706481933594]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 12.0, 9.0, 15.0, 26.0, 44.0, 61.0, 79.0, 132.0, 212.0, 393.0, 1208.0, 3823.0, 18501.0, 398648.0, 3593385.0, 164107.0, 9893.0, 2313.0, 603.0, 288.0, 157.0, 123.0, 77.0, 58.0, 33.0, 20.0, 21.0, 12.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00762176513671875, -0.007393479347229004, -0.007165193557739258, -0.006936907768249512, -0.006708621978759766, -0.0064803361892700195, -0.0062520503997802734, -0.006023764610290527, -0.005795478820800781, -0.005567193031311035, -0.005338907241821289, -0.005110621452331543, -0.004882335662841797, -0.004654049873352051, -0.004425764083862305, -0.004197478294372559, -0.0039691925048828125, -0.0037409067153930664, -0.0035126209259033203, -0.0032843351364135742, -0.003056049346923828, -0.002827763557434082, -0.002599477767944336, -0.00237119197845459, -0.0021429061889648438, -0.0019146203994750977, -0.0016863346099853516, -0.0014580488204956055, -0.0012297630310058594, -0.0010014772415161133, -0.0007731914520263672, -0.0005449056625366211, -0.000316619873046875, -8.83340835571289e-05, 0.0001399517059326172, 0.0003682374954223633, 0.0005965232849121094, 0.0008248090744018555, 0.0010530948638916016, 0.0012813806533813477, 0.0015096664428710938, 0.0017379522323608398, 0.001966238021850586, 0.002194523811340332, 0.002422809600830078, 0.0026510953903198242, 0.0028793811798095703, 0.0031076669692993164, 0.0033359527587890625, 0.0035642385482788086, 0.0037925243377685547, 0.004020810127258301, 0.004249095916748047, 0.004477381706237793, 0.004705667495727539, 0.004933953285217285, 0.005162239074707031, 0.005390524864196777, 0.0056188106536865234, 0.0058470964431762695, 0.006075382232666016, 0.006303668022155762, 0.006531953811645508, 0.006760239601135254, 0.006988525390625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 10.0, 9.0, 9.0, 23.0, 27.0, 60.0, 67.0, 85.0, 126.0, 152.0, 116.0, 97.0, 90.0, 49.0, 26.0, 22.0, 16.0, 9.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007266998291015625, -0.007013142108917236, -0.006759285926818848, -0.006505429744720459, -0.00625157356262207, -0.005997717380523682, -0.005743861198425293, -0.005490005016326904, -0.005236148834228516, -0.004982292652130127, -0.004728436470031738, -0.00447458028793335, -0.004220724105834961, -0.003966867923736572, -0.0037130117416381836, -0.003459155559539795, -0.0032052993774414062, -0.0029514431953430176, -0.002697587013244629, -0.0024437308311462402, -0.0021898746490478516, -0.0019360184669494629, -0.0016821622848510742, -0.0014283061027526855, -0.0011744499206542969, -0.0009205937385559082, -0.0006667375564575195, -0.00041288137435913086, -0.0001590251922607422, 9.483098983764648e-05, 0.00034868717193603516, 0.0006025433540344238, 0.0008563995361328125, 0.0011102557182312012, 0.0013641119003295898, 0.0016179680824279785, 0.0018718242645263672, 0.002125680446624756, 0.0023795366287231445, 0.002633392810821533, 0.002887248992919922, 0.0031411051750183105, 0.0033949613571166992, 0.003648817539215088, 0.0039026737213134766, 0.004156529903411865, 0.004410386085510254, 0.004664242267608643, 0.004918098449707031, 0.00517195463180542, 0.005425810813903809, 0.005679666996002197, 0.005933523178100586, 0.006187379360198975, 0.006441235542297363, 0.006695091724395752, 0.006948947906494141, 0.007202804088592529, 0.007456660270690918, 0.007710516452789307, 0.007964372634887695, 0.008218228816986084, 0.008472084999084473, 0.008725941181182861, 0.00897979736328125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 5.0, 4.0, 3.0, 5.0, 16.0, 23.0, 44.0, 70.0, 164.0, 297.0, 724.0, 2481.0, 22229.0, 3891278.0, 268545.0, 6138.0, 1291.0, 457.0, 227.0, 134.0, 58.0, 33.0, 26.0, 11.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.01273345947265625, -0.01239621639251709, -0.01205897331237793, -0.01172173023223877, -0.01138448715209961, -0.01104724407196045, -0.010710000991821289, -0.010372757911682129, -0.010035514831542969, -0.009698271751403809, -0.009361028671264648, -0.009023785591125488, -0.008686542510986328, -0.008349299430847168, -0.008012056350708008, -0.007674813270568848, -0.0073375701904296875, -0.007000327110290527, -0.006663084030151367, -0.006325840950012207, -0.005988597869873047, -0.005651354789733887, -0.0053141117095947266, -0.004976868629455566, -0.004639625549316406, -0.004302382469177246, -0.003965139389038086, -0.0036278963088989258, -0.0032906532287597656, -0.0029534101486206055, -0.0026161670684814453, -0.002278923988342285, -0.001941680908203125, -0.0016044378280639648, -0.0012671947479248047, -0.0009299516677856445, -0.0005927085876464844, -0.0002554655075073242, 8.177757263183594e-05, 0.0004190206527709961, 0.0007562637329101562, 0.0010935068130493164, 0.0014307498931884766, 0.0017679929733276367, 0.002105236053466797, 0.002442479133605957, 0.002779722213745117, 0.0031169652938842773, 0.0034542083740234375, 0.0037914514541625977, 0.004128694534301758, 0.004465937614440918, 0.004803180694580078, 0.005140423774719238, 0.0054776668548583984, 0.005814909934997559, 0.006152153015136719, 0.006489396095275879, 0.006826639175415039, 0.007163882255554199, 0.007501125335693359, 0.00783836841583252, 0.00817561149597168, 0.00851285457611084, 0.00885009765625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 5.0, 10.0, 18.0, 26.0, 57.0, 144.0, 342.0, 728.0, 1090.0, 849.0, 464.0, 176.0, 73.0, 30.0, 29.0, 14.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005584716796875, -0.005314230918884277, -0.005043745040893555, -0.004773259162902832, -0.004502773284912109, -0.004232287406921387, -0.003961801528930664, -0.0036913156509399414, -0.0034208297729492188, -0.003150343894958496, -0.0028798580169677734, -0.0026093721389770508, -0.002338886260986328, -0.0020684003829956055, -0.0017979145050048828, -0.0015274286270141602, -0.0012569427490234375, -0.0009864568710327148, -0.0007159709930419922, -0.00044548511505126953, -0.00017499923706054688, 9.548664093017578e-05, 0.00036597251892089844, 0.0006364583969116211, 0.0009069442749023438, 0.0011774301528930664, 0.001447916030883789, 0.0017184019088745117, 0.0019888877868652344, 0.002259373664855957, 0.0025298595428466797, 0.0028003454208374023, 0.003070831298828125, 0.0033413171768188477, 0.0036118030548095703, 0.003882288932800293, 0.004152774810791016, 0.004423260688781738, 0.004693746566772461, 0.004964232444763184, 0.005234718322753906, 0.005505204200744629, 0.0057756900787353516, 0.006046175956726074, 0.006316661834716797, 0.0065871477127075195, 0.006857633590698242, 0.007128119468688965, 0.0073986053466796875, 0.00766909122467041, 0.007939577102661133, 0.008210062980651855, 0.008480548858642578, 0.0087510347366333, 0.009021520614624023, 0.009292006492614746, 0.009562492370605469, 0.009832978248596191, 0.010103464126586914, 0.010373950004577637, 0.01064443588256836, 0.010914921760559082, 0.011185407638549805, 0.011455893516540527, 0.01172637939453125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 5.0, 8.0, 21.0, 22.0, 41.0, 64.0, 93.0, 107.0, 163.0, 130.0, 92.0, 92.0, 42.0, 42.0, 18.0, 17.0, 4.0, 14.0, 5.0, 1.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.02202855423092842, -0.020994314923882484, -0.0199600737541914, -0.018925834447145462, -0.017891593277454376, -0.01685735397040844, -0.015823114663362503, -0.014788874424993992, -0.01375463418662548, -0.01272039394825697, -0.011686153709888458, -0.010651914402842522, -0.00961767416447401, -0.0085834339261055, -0.007549194153398275, -0.0065149543806910515, -0.00548071414232254, -0.004446473903954029, -0.003412234131246805, -0.0023779941257089376, -0.00134375412017107, -0.0003095138818025589, 0.000724725890904665, 0.0017589656636118889, 0.0027932059019804, 0.0038274459075182676, 0.004861685913056135, 0.005895925685763359, 0.00693016592413187, 0.007964406162500381, 0.008998645469546318, 0.01003288570791483, 0.011067129671573639, 0.01210136990994215, 0.013135610148310661, 0.014169849455356598, 0.015204089693725109, 0.01623832993209362, 0.017272569239139557, 0.018306810408830643, 0.01934104971587658, 0.020375289022922516, 0.0214095301926136, 0.02244376949965954, 0.023478008806705475, 0.02451224997639656, 0.025546489283442497, 0.026580728590488434, 0.02761496976017952, 0.028649209067225456, 0.029683450236916542, 0.03071768954396248, 0.031751930713653564, 0.03278616815805435, 0.03382040932774544, 0.03485465049743652, 0.03588888794183731, 0.0369231291115284, 0.037957366555929184, 0.03899160772562027, 0.040025848895311356, 0.04106009006500244, 0.04209432750940323, 0.043128568679094315, 0.0441628098487854]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 5.0, 10.0, 7.0, 12.0, 8.0, 12.0, 17.0, 17.0, 17.0, 20.0, 25.0, 34.0, 24.0, 41.0, 51.0, 57.0, 36.0, 45.0, 57.0, 60.0, 48.0, 45.0, 50.0, 40.0, 43.0, 34.0, 24.0, 26.0, 10.0, 16.0, 13.0, 14.0, 17.0, 10.0, 9.0, 10.0, 10.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.019015789031982422, -0.01829322800040245, -0.01757066510617733, -0.01684810221195221, -0.016125541180372238, -0.015402979217469692, -0.014680417254567146, -0.0139578552916646, -0.013235293328762054, -0.012512731365859509, -0.011790169402956963, -0.011067607440054417, -0.01034504547715187, -0.009622483514249325, -0.008899921551346779, -0.008177359588444233, -0.007454797625541687, -0.006732235662639141, -0.006009673699736595, -0.005287111736834049, -0.004564549773931503, -0.0038419878110289574, -0.0031194258481264114, -0.0023968638852238655, -0.0016743019223213196, -0.0009517399594187737, -0.00022917799651622772, 0.0004933839663863182, 0.0012159459292888641, 0.00193850789219141, 0.002661069855093956, 0.003383631817996502, 0.004106193780899048, 0.004828755743801594, 0.00555131770670414, 0.006273879669606686, 0.006996441632509232, 0.0077190035954117775, 0.008441565558314323, 0.00916412752121687, 0.009886689484119415, 0.010609251447021961, 0.011331813409924507, 0.012054375372827053, 0.012776937335729599, 0.013499499298632145, 0.01422206126153469, 0.014944623224437237, 0.015667185187339783, 0.016389746218919754, 0.017112309113144875, 0.017834872007369995, 0.018557433038949966, 0.019279994070529938, 0.02000255696475506, 0.02072511985898018, 0.02144768089056015, 0.02217024192214012, 0.022892804816365242, 0.023615367710590363, 0.024337928742170334, 0.025060489773750305, 0.025783052667975426, 0.026505615562200546, 0.027228176593780518]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 2.0, 7.0, 5.0, 8.0, 14.0, 18.0, 24.0, 18.0, 52.0, 57.0, 93.0, 137.0, 195.0, 366.0, 717.0, 1382.0, 3015.0, 7844.0, 24992.0, 107828.0, 497145.0, 316374.0, 61892.0, 16169.0, 5405.0, 2276.0, 1053.0, 585.0, 302.0, 194.0, 124.0, 74.0, 55.0, 36.0, 27.0, 13.0, 16.0, 14.0, 9.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.007717132568359375, -0.00748896598815918, -0.007260799407958984, -0.007032632827758789, -0.006804466247558594, -0.0065762996673583984, -0.006348133087158203, -0.006119966506958008, -0.0058917999267578125, -0.005663633346557617, -0.005435466766357422, -0.0052073001861572266, -0.004979133605957031, -0.004750967025756836, -0.004522800445556641, -0.004294633865356445, -0.00406646728515625, -0.0038383007049560547, -0.0036101341247558594, -0.003381967544555664, -0.0031538009643554688, -0.0029256343841552734, -0.002697467803955078, -0.002469301223754883, -0.0022411346435546875, -0.002012968063354492, -0.0017848014831542969, -0.0015566349029541016, -0.0013284683227539062, -0.001100301742553711, -0.0008721351623535156, -0.0006439685821533203, -0.000415802001953125, -0.0001876354217529297, 4.0531158447265625e-05, 0.00026869773864746094, 0.0004968643188476562, 0.0007250308990478516, 0.0009531974792480469, 0.0011813640594482422, 0.0014095306396484375, 0.0016376972198486328, 0.0018658638000488281, 0.0020940303802490234, 0.0023221969604492188, 0.002550363540649414, 0.0027785301208496094, 0.0030066967010498047, 0.00323486328125, 0.0034630298614501953, 0.0036911964416503906, 0.003919363021850586, 0.004147529602050781, 0.0043756961822509766, 0.004603862762451172, 0.004832029342651367, 0.0050601959228515625, 0.005288362503051758, 0.005516529083251953, 0.0057446956634521484, 0.005972862243652344, 0.006201028823852539, 0.006429195404052734, 0.00665736198425293, 0.006885528564453125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 5.0, 15.0, 20.0, 33.0, 64.0, 81.0, 116.0, 96.0, 143.0, 119.0, 101.0, 69.0, 63.0, 20.0, 17.0, 19.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007251739501953125, -0.006996810436248779, -0.006741881370544434, -0.006486952304840088, -0.006232023239135742, -0.0059770941734313965, -0.005722165107727051, -0.005467236042022705, -0.005212306976318359, -0.004957377910614014, -0.004702448844909668, -0.004447519779205322, -0.0041925907135009766, -0.003937661647796631, -0.003682732582092285, -0.0034278035163879395, -0.0031728744506835938, -0.002917945384979248, -0.0026630163192749023, -0.0024080872535705566, -0.002153158187866211, -0.0018982291221618652, -0.0016433000564575195, -0.0013883709907531738, -0.0011334419250488281, -0.0008785128593444824, -0.0006235837936401367, -0.000368654727935791, -0.00011372566223144531, 0.0001412034034729004, 0.0003961324691772461, 0.0006510615348815918, 0.0009059906005859375, 0.0011609196662902832, 0.001415848731994629, 0.0016707777976989746, 0.0019257068634033203, 0.002180635929107666, 0.0024355649948120117, 0.0026904940605163574, 0.002945423126220703, 0.003200352191925049, 0.0034552812576293945, 0.0037102103233337402, 0.003965139389038086, 0.004220068454742432, 0.004474997520446777, 0.004729926586151123, 0.004984855651855469, 0.0052397847175598145, 0.00549471378326416, 0.005749642848968506, 0.0060045719146728516, 0.006259500980377197, 0.006514430046081543, 0.006769359111785889, 0.007024288177490234, 0.00727921724319458, 0.007534146308898926, 0.0077890753746032715, 0.008044004440307617, 0.008298933506011963, 0.008553862571716309, 0.008808791637420654, 0.009063720703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 2.0, 9.0, 12.0, 9.0, 10.0, 16.0, 23.0, 27.0, 50.0, 50.0, 101.0, 120.0, 173.0, 314.0, 499.0, 798.0, 1657.0, 4854.0, 23852.0, 219051.0, 724908.0, 57892.0, 8941.0, 2410.0, 1124.0, 619.0, 342.0, 210.0, 139.0, 94.0, 64.0, 41.0, 38.0, 25.0, 21.0, 21.0, 12.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00908660888671875, -0.008795499801635742, -0.008504390716552734, -0.008213281631469727, -0.007922172546386719, -0.007631063461303711, -0.007339954376220703, -0.007048845291137695, -0.0067577362060546875, -0.00646662712097168, -0.006175518035888672, -0.005884408950805664, -0.005593299865722656, -0.0053021907806396484, -0.005011081695556641, -0.004719972610473633, -0.004428863525390625, -0.004137754440307617, -0.0038466453552246094, -0.0035555362701416016, -0.0032644271850585938, -0.002973318099975586, -0.002682209014892578, -0.0023910999298095703, -0.0020999908447265625, -0.0018088817596435547, -0.0015177726745605469, -0.001226663589477539, -0.0009355545043945312, -0.0006444454193115234, -0.0003533363342285156, -6.222724914550781e-05, 0.0002288818359375, 0.0005199909210205078, 0.0008111000061035156, 0.0011022090911865234, 0.0013933181762695312, 0.001684427261352539, 0.001975536346435547, 0.0022666454315185547, 0.0025577545166015625, 0.0028488636016845703, 0.003139972686767578, 0.003431081771850586, 0.0037221908569335938, 0.0040132999420166016, 0.004304409027099609, 0.004595518112182617, 0.004886627197265625, 0.005177736282348633, 0.005468845367431641, 0.0057599544525146484, 0.006051063537597656, 0.006342172622680664, 0.006633281707763672, 0.00692439079284668, 0.0072154998779296875, 0.007506608963012695, 0.007797718048095703, 0.008088827133178711, 0.008379936218261719, 0.008671045303344727, 0.008962154388427734, 0.009253263473510742, 0.00954437255859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 2.0, 6.0, 4.0, 7.0, 13.0, 9.0, 18.0, 30.0, 30.0, 44.0, 32.0, 44.0, 69.0, 70.0, 61.0, 61.0, 65.0, 62.0, 58.0, 50.0, 55.0, 45.0, 31.0, 29.0, 22.0, 21.0, 16.0, 10.0, 9.0, 4.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01593017578125, -0.0154496431350708, -0.014969110488891602, -0.014488577842712402, -0.014008045196533203, -0.013527512550354004, -0.013046979904174805, -0.012566447257995605, -0.012085914611816406, -0.011605381965637207, -0.011124849319458008, -0.010644316673278809, -0.01016378402709961, -0.00968325138092041, -0.009202718734741211, -0.008722186088562012, -0.008241653442382812, -0.007761120796203613, -0.007280588150024414, -0.006800055503845215, -0.006319522857666016, -0.005838990211486816, -0.005358457565307617, -0.004877924919128418, -0.004397392272949219, -0.0039168596267700195, -0.0034363269805908203, -0.002955794334411621, -0.002475261688232422, -0.0019947290420532227, -0.0015141963958740234, -0.0010336637496948242, -0.000553131103515625, -7.259845733642578e-05, 0.00040793418884277344, 0.0008884668350219727, 0.0013689994812011719, 0.001849532127380371, 0.0023300647735595703, 0.0028105974197387695, 0.0032911300659179688, 0.003771662712097168, 0.004252195358276367, 0.004732728004455566, 0.005213260650634766, 0.005693793296813965, 0.006174325942993164, 0.006654858589172363, 0.0071353912353515625, 0.007615923881530762, 0.008096456527709961, 0.00857698917388916, 0.00905752182006836, 0.009538054466247559, 0.010018587112426758, 0.010499119758605957, 0.010979652404785156, 0.011460185050964355, 0.011940717697143555, 0.012421250343322754, 0.012901782989501953, 0.013382315635681152, 0.013862848281860352, 0.01434338092803955, 0.01482391357421875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 5.0, 8.0, 5.0, 9.0, 16.0, 23.0, 42.0, 52.0, 70.0, 140.0, 235.0, 419.0, 814.0, 2102.0, 6603.0, 29399.0, 224223.0, 710576.0, 57515.0, 10814.0, 3096.0, 1150.0, 513.0, 258.0, 185.0, 86.0, 59.0, 35.0, 28.0, 12.0, 12.0, 16.0, 6.0, 6.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.001682281494140625, -0.0016330629587173462, -0.0015838444232940674, -0.0015346258878707886, -0.0014854073524475098, -0.001436188817024231, -0.0013869702816009521, -0.0013377517461776733, -0.0012885332107543945, -0.0012393146753311157, -0.001190096139907837, -0.001140877604484558, -0.0010916590690612793, -0.0010424405336380005, -0.0009932219982147217, -0.0009440034627914429, -0.0008947849273681641, -0.0008455663919448853, -0.0007963478565216064, -0.0007471293210983276, -0.0006979107856750488, -0.00064869225025177, -0.0005994737148284912, -0.0005502551794052124, -0.0005010366439819336, -0.0004518181085586548, -0.000402599573135376, -0.00035338103771209717, -0.00030416250228881836, -0.00025494396686553955, -0.00020572543144226074, -0.00015650689601898193, -0.00010728836059570312, -5.8069825172424316e-05, -8.851289749145508e-06, 4.03672456741333e-05, 8.958578109741211e-05, 0.00013880431652069092, 0.00018802285194396973, 0.00023724138736724854, 0.00028645992279052734, 0.00033567845821380615, 0.00038489699363708496, 0.00043411552906036377, 0.0004833340644836426, 0.0005325525999069214, 0.0005817711353302002, 0.000630989670753479, 0.0006802082061767578, 0.0007294267416000366, 0.0007786452770233154, 0.0008278638124465942, 0.000877082347869873, 0.0009263008832931519, 0.0009755194187164307, 0.0010247379541397095, 0.0010739564895629883, 0.001123175024986267, 0.001172393560409546, 0.0012216120958328247, 0.0012708306312561035, 0.0013200491666793823, 0.0013692677021026611, 0.00141848623752594, 0.0014677047729492188]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 2.0, 5.0, 2.0, 5.0, 8.0, 8.0, 8.0, 20.0, 11.0, 18.0, 15.0, 21.0, 16.0, 37.0, 33.0, 50.0, 30.0, 76.0, 43.0, 80.0, 55.0, 56.0, 69.0, 43.0, 53.0, 27.0, 32.0, 27.0, 42.0, 20.0, 13.0, 19.0, 9.0, 9.0, 9.0, 6.0, 9.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.708766937255859e-06, -4.560686647891998e-06, -4.412606358528137e-06, -4.264526069164276e-06, -4.116445779800415e-06, -3.968365490436554e-06, -3.820285201072693e-06, -3.6722049117088318e-06, -3.5241246223449707e-06, -3.3760443329811096e-06, -3.2279640436172485e-06, -3.0798837542533875e-06, -2.9318034648895264e-06, -2.7837231755256653e-06, -2.635642886161804e-06, -2.487562596797943e-06, -2.339482307434082e-06, -2.191402018070221e-06, -2.04332172870636e-06, -1.8952414393424988e-06, -1.7471611499786377e-06, -1.5990808606147766e-06, -1.4510005712509155e-06, -1.3029202818870544e-06, -1.1548399925231934e-06, -1.0067597031593323e-06, -8.586794137954712e-07, -7.105991244316101e-07, -5.62518835067749e-07, -4.1443854570388794e-07, -2.6635825634002686e-07, -1.1827796697616577e-07, 2.9802322387695312e-08, 1.778826117515564e-07, 3.259629011154175e-07, 4.7404319047927856e-07, 6.221234798431396e-07, 7.702037692070007e-07, 9.182840585708618e-07, 1.066364347934723e-06, 1.214444637298584e-06, 1.362524926662445e-06, 1.5106052160263062e-06, 1.6586855053901672e-06, 1.8067657947540283e-06, 1.9548460841178894e-06, 2.1029263734817505e-06, 2.2510066628456116e-06, 2.3990869522094727e-06, 2.5471672415733337e-06, 2.695247530937195e-06, 2.843327820301056e-06, 2.991408109664917e-06, 3.139488399028778e-06, 3.287568688392639e-06, 3.4356489777565002e-06, 3.5837292671203613e-06, 3.7318095564842224e-06, 3.8798898458480835e-06, 4.027970135211945e-06, 4.176050424575806e-06, 4.324130713939667e-06, 4.472211003303528e-06, 4.620291292667389e-06, 4.76837158203125e-06]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 4.0, 0.0, 7.0, 5.0, 24.0, 11.0, 27.0, 31.0, 44.0, 77.0, 85.0, 140.0, 253.0, 427.0, 916.0, 2108.0, 5885.0, 22629.0, 155876.0, 756513.0, 81469.0, 14421.0, 4229.0, 1631.0, 722.0, 398.0, 210.0, 131.0, 72.0, 61.0, 49.0, 27.0, 24.0, 14.0, 11.0, 4.0, 8.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001369476318359375, -0.0013243556022644043, -0.0012792348861694336, -0.0012341141700744629, -0.0011889934539794922, -0.0011438727378845215, -0.0010987520217895508, -0.00105363130569458, -0.0010085105895996094, -0.0009633898735046387, -0.000918269157409668, -0.0008731484413146973, -0.0008280277252197266, -0.0007829070091247559, -0.0007377862930297852, -0.0006926655769348145, -0.0006475448608398438, -0.000602424144744873, -0.0005573034286499023, -0.0005121827125549316, -0.00046706199645996094, -0.00042194128036499023, -0.00037682056427001953, -0.00033169984817504883, -0.0002865791320800781, -0.00024145841598510742, -0.00019633769989013672, -0.00015121698379516602, -0.00010609626770019531, -6.097555160522461e-05, -1.5854835510253906e-05, 2.9265880584716797e-05, 7.43865966796875e-05, 0.0001195073127746582, 0.0001646280288696289, 0.0002097487449645996, 0.0002548694610595703, 0.000299990177154541, 0.0003451108932495117, 0.0003902316093444824, 0.0004353523254394531, 0.00048047304153442383, 0.0005255937576293945, 0.0005707144737243652, 0.0006158351898193359, 0.0006609559059143066, 0.0007060766220092773, 0.000751197338104248, 0.0007963180541992188, 0.0008414387702941895, 0.0008865594863891602, 0.0009316802024841309, 0.0009768009185791016, 0.0010219216346740723, 0.001067042350769043, 0.0011121630668640137, 0.0011572837829589844, 0.001202404499053955, 0.0012475252151489258, 0.0012926459312438965, 0.0013377666473388672, 0.0013828873634338379, 0.0014280080795288086, 0.0014731287956237793, 0.00151824951171875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 8.0, 10.0, 16.0, 25.0, 23.0, 36.0, 57.0, 69.0, 75.0, 95.0, 108.0, 93.0, 76.0, 74.0, 56.0, 44.0, 36.0, 19.0, 11.0, 20.0, 11.0, 10.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0020904541015625, -0.0020330101251602173, -0.0019755661487579346, -0.0019181221723556519, -0.0018606781959533691, -0.0018032342195510864, -0.0017457902431488037, -0.001688346266746521, -0.0016309022903442383, -0.0015734583139419556, -0.0015160143375396729, -0.0014585703611373901, -0.0014011263847351074, -0.0013436824083328247, -0.001286238431930542, -0.0012287944555282593, -0.0011713504791259766, -0.0011139065027236938, -0.0010564625263214111, -0.0009990185499191284, -0.0009415745735168457, -0.000884130597114563, -0.0008266866207122803, -0.0007692426443099976, -0.0007117986679077148, -0.0006543546915054321, -0.0005969107151031494, -0.0005394667387008667, -0.000482022762298584, -0.00042457878589630127, -0.00036713480949401855, -0.00030969083309173584, -0.0002522468566894531, -0.0001948028802871704, -0.0001373589038848877, -7.991492748260498e-05, -2.2470951080322266e-05, 3.497302532196045e-05, 9.241700172424316e-05, 0.00014986097812652588, 0.0002073049545288086, 0.0002647489309310913, 0.000322192907333374, 0.00037963688373565674, 0.00043708086013793945, 0.0004945248365402222, 0.0005519688129425049, 0.0006094127893447876, 0.0006668567657470703, 0.000724300742149353, 0.0007817447185516357, 0.0008391886949539185, 0.0008966326713562012, 0.0009540766477584839, 0.0010115206241607666, 0.0010689646005630493, 0.001126408576965332, 0.0011838525533676147, 0.0012412965297698975, 0.0012987405061721802, 0.0013561844825744629, 0.0014136284589767456, 0.0014710724353790283, 0.001528516411781311, 0.0015859603881835938]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 9.0, 26.0, 86.0, 198.0, 421.0, 166.0, 56.0, 19.0, 15.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0683184489607811, -0.06560777872800827, -0.06289711594581604, -0.06018644571304321, -0.057475775480270386, -0.05476510524749756, -0.05205443874001503, -0.0493437722325325, -0.046633101999759674, -0.04392243176698685, -0.04121176525950432, -0.03850109875202179, -0.03579042851924896, -0.033079758286476135, -0.030369091778993607, -0.02765842340886593, -0.02494775503873825, -0.022237086668610573, -0.019526418298482895, -0.016815749928355217, -0.014105081558227539, -0.011394413188099861, -0.008683744817972183, -0.005973076447844505, -0.0032624080777168274, -0.0005517397075891495, 0.0021589286625385284, 0.004869597032666206, 0.007580265402793884, 0.010290933772921562, 0.01300160214304924, 0.015712270513176918, 0.018422946333885193, 0.02113361470401287, 0.02384428307414055, 0.026554951444268227, 0.029265619814395905, 0.03197629004716873, 0.03468695655465126, 0.03739762306213379, 0.040108293294906616, 0.04281896352767944, 0.04552963003516197, 0.0482402965426445, 0.05095096677541733, 0.053661637008190155, 0.056372303515672684, 0.05908297002315521, 0.06179364025592804, 0.06450431048870087, 0.0672149807214737, 0.06992564350366592, 0.07263631373643875, 0.07534698396921158, 0.07805764675140381, 0.08076831698417664, 0.08347898721694946, 0.08618965744972229, 0.08890032768249512, 0.09161099046468735, 0.09432166069746017, 0.097032330930233, 0.09974299371242523, 0.10245366394519806, 0.10516433417797089]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 3.0, 5.0, 6.0, 12.0, 13.0, 14.0, 18.0, 26.0, 26.0, 26.0, 31.0, 29.0, 42.0, 77.0, 135.0, 154.0, 87.0, 38.0, 41.0, 33.0, 28.0, 24.0, 18.0, 21.0, 19.0, 17.0, 6.0, 14.0, 8.0, 7.0, 8.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05504107475280762, -0.053425658494234085, -0.05181024223566055, -0.05019482597708702, -0.04857940971851349, -0.04696399345993996, -0.045348577201366425, -0.04373316094279289, -0.04211774468421936, -0.04050232842564583, -0.038886912167072296, -0.037271495908498764, -0.03565607964992523, -0.0340406633913517, -0.03242524713277817, -0.030809830874204636, -0.029194414615631104, -0.02757899835705757, -0.02596358209848404, -0.024348165839910507, -0.022732749581336975, -0.021117333322763443, -0.01950191706418991, -0.01788650080561638, -0.016271084547042847, -0.014655668288469315, -0.013040252029895782, -0.01142483577132225, -0.009809419512748718, -0.008194003254175186, -0.006578586995601654, -0.004963170737028122, -0.00334775447845459, -0.0017323382198810577, -0.00011692196130752563, 0.0014984942972660065, 0.0031139105558395386, 0.004729326814413071, 0.006344743072986603, 0.007960159331560135, 0.009575575590133667, 0.011190991848707199, 0.012806408107280731, 0.014421824365854263, 0.016037240624427795, 0.017652656883001328, 0.01926807314157486, 0.02088348940014839, 0.022498905658721924, 0.024114321917295456, 0.025729738175868988, 0.02734515443444252, 0.028960570693016052, 0.030575986951589584, 0.032191403210163116, 0.03380681946873665, 0.03542223572731018, 0.03703765198588371, 0.038653068244457245, 0.04026848450303078, 0.04188390076160431, 0.04349931702017784, 0.04511473327875137, 0.046730149537324905, 0.04834556579589844]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 4.0, 7.0, 7.0, 10.0, 24.0, 28.0, 42.0, 55.0, 118.0, 270.0, 865.0, 1957.0, 4809.0, 15930.0, 95622.0, 1290094.0, 2515807.0, 236186.0, 22266.0, 6579.0, 2199.0, 700.0, 307.0, 129.0, 93.0, 61.0, 31.0, 24.0, 18.0, 20.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005218505859375, -0.005026519298553467, -0.004834532737731934, -0.0046425461769104, -0.004450559616088867, -0.004258573055267334, -0.004066586494445801, -0.0038745999336242676, -0.0036826133728027344, -0.003490626811981201, -0.003298640251159668, -0.0031066536903381348, -0.0029146671295166016, -0.0027226805686950684, -0.002530694007873535, -0.002338707447052002, -0.0021467208862304688, -0.0019547343254089355, -0.0017627477645874023, -0.0015707612037658691, -0.001378774642944336, -0.0011867880821228027, -0.0009948015213012695, -0.0008028149604797363, -0.0006108283996582031, -0.0004188418388366699, -0.00022685527801513672, -3.4868717193603516e-05, 0.0001571178436279297, 0.0003491044044494629, 0.0005410909652709961, 0.0007330775260925293, 0.0009250640869140625, 0.0011170506477355957, 0.001309037208557129, 0.0015010237693786621, 0.0016930103302001953, 0.0018849968910217285, 0.0020769834518432617, 0.002268970012664795, 0.002460956573486328, 0.0026529431343078613, 0.0028449296951293945, 0.0030369162559509277, 0.003228902816772461, 0.003420889377593994, 0.0036128759384155273, 0.0038048624992370605, 0.003996849060058594, 0.004188835620880127, 0.00438082218170166, 0.004572808742523193, 0.0047647953033447266, 0.00495678186416626, 0.005148768424987793, 0.005340754985809326, 0.005532741546630859, 0.005724728107452393, 0.005916714668273926, 0.006108701229095459, 0.006300687789916992, 0.006492674350738525, 0.006684660911560059, 0.006876647472381592, 0.007068634033203125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 13.0, 4.0, 13.0, 17.0, 45.0, 63.0, 90.0, 116.0, 125.0, 125.0, 110.0, 95.0, 62.0, 42.0, 31.0, 23.0, 17.0, 7.0, 6.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007251739501953125, -0.00699537992477417, -0.006739020347595215, -0.00648266077041626, -0.006226301193237305, -0.00596994161605835, -0.0057135820388793945, -0.0054572224617004395, -0.005200862884521484, -0.004944503307342529, -0.004688143730163574, -0.004431784152984619, -0.004175424575805664, -0.003919064998626709, -0.003662705421447754, -0.003406345844268799, -0.0031499862670898438, -0.0028936266899108887, -0.0026372671127319336, -0.0023809075355529785, -0.0021245479583740234, -0.0018681883811950684, -0.0016118288040161133, -0.0013554692268371582, -0.0010991096496582031, -0.000842750072479248, -0.000586390495300293, -0.0003300309181213379, -7.367134094238281e-05, 0.00018268823623657227, 0.00043904781341552734, 0.0006954073905944824, 0.0009517669677734375, 0.0012081265449523926, 0.0014644861221313477, 0.0017208456993103027, 0.001977205276489258, 0.002233564853668213, 0.002489924430847168, 0.002746284008026123, 0.003002643585205078, 0.003259003162384033, 0.0035153627395629883, 0.0037717223167419434, 0.0040280818939208984, 0.0042844414710998535, 0.004540801048278809, 0.004797160625457764, 0.005053520202636719, 0.005309879779815674, 0.005566239356994629, 0.005822598934173584, 0.006078958511352539, 0.006335318088531494, 0.006591677665710449, 0.006848037242889404, 0.007104396820068359, 0.0073607563972473145, 0.0076171159744262695, 0.007873475551605225, 0.00812983512878418, 0.008386194705963135, 0.00864255428314209, 0.008898913860321045, 0.0091552734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 8.0, 17.0, 32.0, 72.0, 196.0, 613.0, 3480.0, 4065049.0, 122162.0, 1904.0, 456.0, 157.0, 62.0, 37.0, 12.0, 13.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038604736328125, -0.03726673126220703, -0.03592872619628906, -0.034590721130371094, -0.033252716064453125, -0.031914710998535156, -0.030576705932617188, -0.02923870086669922, -0.02790069580078125, -0.02656269073486328, -0.025224685668945312, -0.023886680603027344, -0.022548675537109375, -0.021210670471191406, -0.019872665405273438, -0.01853466033935547, -0.0171966552734375, -0.01585865020751953, -0.014520645141601562, -0.013182640075683594, -0.011844635009765625, -0.010506629943847656, -0.009168624877929688, -0.007830619812011719, -0.00649261474609375, -0.005154609680175781, -0.0038166046142578125, -0.0024785995483398438, -0.001140594482421875, 0.00019741058349609375, 0.0015354156494140625, 0.0028734207153320312, 0.00421142578125, 0.005549430847167969, 0.0068874359130859375, 0.008225440979003906, 0.009563446044921875, 0.010901451110839844, 0.012239456176757812, 0.013577461242675781, 0.01491546630859375, 0.01625347137451172, 0.017591476440429688, 0.018929481506347656, 0.020267486572265625, 0.021605491638183594, 0.022943496704101562, 0.02428150177001953, 0.0256195068359375, 0.02695751190185547, 0.028295516967773438, 0.029633522033691406, 0.030971527099609375, 0.032309532165527344, 0.03364753723144531, 0.03498554229736328, 0.03632354736328125, 0.03766155242919922, 0.03899955749511719, 0.040337562561035156, 0.041675567626953125, 0.043013572692871094, 0.04435157775878906, 0.04568958282470703, 0.047027587890625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 5.0, 9.0, 10.0, 12.0, 24.0, 36.0, 61.0, 114.0, 225.0, 490.0, 1115.0, 1069.0, 459.0, 216.0, 102.0, 62.0, 24.0, 17.0, 11.0, 5.0, 11.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0099945068359375, -0.009407281875610352, -0.008820056915283203, -0.008232831954956055, -0.007645606994628906, -0.007058382034301758, -0.006471157073974609, -0.005883932113647461, -0.0052967071533203125, -0.004709482192993164, -0.004122257232666016, -0.003535032272338867, -0.0029478073120117188, -0.0023605823516845703, -0.0017733573913574219, -0.0011861324310302734, -0.000598907470703125, -1.1682510375976562e-05, 0.0005755424499511719, 0.0011627674102783203, 0.0017499923706054688, 0.002337217330932617, 0.0029244422912597656, 0.003511667251586914, 0.0040988922119140625, 0.004686117172241211, 0.005273342132568359, 0.005860567092895508, 0.006447792053222656, 0.007035017013549805, 0.007622241973876953, 0.008209466934204102, 0.00879669189453125, 0.009383916854858398, 0.009971141815185547, 0.010558366775512695, 0.011145591735839844, 0.011732816696166992, 0.01232004165649414, 0.012907266616821289, 0.013494491577148438, 0.014081716537475586, 0.014668941497802734, 0.015256166458129883, 0.01584339141845703, 0.01643061637878418, 0.017017841339111328, 0.017605066299438477, 0.018192291259765625, 0.018779516220092773, 0.019366741180419922, 0.01995396614074707, 0.02054119110107422, 0.021128416061401367, 0.021715641021728516, 0.022302865982055664, 0.022890090942382812, 0.02347731590270996, 0.02406454086303711, 0.024651765823364258, 0.025238990783691406, 0.025826215744018555, 0.026413440704345703, 0.02700066566467285, 0.027587890625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 4.0, 4.0, 7.0, 15.0, 46.0, 83.0, 135.0, 236.0, 208.0, 111.0, 63.0, 29.0, 14.0, 5.0, 10.0, 8.0, 4.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0895826444029808, -0.08583042770624161, -0.08207820355892181, -0.07832598686218262, -0.07457377016544342, -0.07082155346870422, -0.06706933677196503, -0.06331711262464523, -0.059564895927906036, -0.05581267923116684, -0.052060458809137344, -0.04830823838710785, -0.04455602169036865, -0.040803804993629456, -0.03705158457159996, -0.033299364149570465, -0.02954714745283127, -0.025794928893446922, -0.022042710334062576, -0.01829049177467823, -0.014538273215293884, -0.010786054655909538, -0.007033836096525192, -0.0032816175371408463, 0.00047060102224349976, 0.004222819581627846, 0.007975038141012192, 0.011727256700396538, 0.015479475259780884, 0.01923169381916523, 0.022983912378549576, 0.026736130937933922, 0.03048834204673767, 0.03424055874347687, 0.03799277916550636, 0.04174499958753586, 0.045497216284275055, 0.04924943298101425, 0.05300165340304375, 0.05675387382507324, 0.06050609052181244, 0.06425830721855164, 0.06801052391529083, 0.07176274806261063, 0.07551496475934982, 0.07926718145608902, 0.08301940560340881, 0.08677162230014801, 0.09052383899688721, 0.0942760556936264, 0.0980282723903656, 0.1017804965376854, 0.10553271323442459, 0.10928492993116379, 0.11303715407848358, 0.11678937077522278, 0.12054158747196198, 0.12429380416870117, 0.12804602086544037, 0.13179823756217957, 0.13555046916007996, 0.13930268585681915, 0.14305490255355835, 0.14680711925029755, 0.15055933594703674]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 9.0, 10.0, 21.0, 25.0, 21.0, 44.0, 46.0, 82.0, 83.0, 118.0, 125.0, 106.0, 79.0, 79.0, 50.0, 45.0, 17.0, 14.0, 12.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09496647119522095, -0.09070610255002975, -0.08644573390483856, -0.08218536525964737, -0.07792499661445618, -0.07366463541984558, -0.06940426677465439, -0.0651438981294632, -0.060883529484272, -0.05662316083908081, -0.05236279219388962, -0.048102427273988724, -0.04384205862879753, -0.03958168998360634, -0.035321325063705444, -0.03106095641851425, -0.02680058777332306, -0.022540219128131866, -0.018279852345585823, -0.014019484631717205, -0.009759116917848587, -0.005498748272657394, -0.001238381490111351, 0.0030219852924346924, 0.007282353937625885, 0.011542721651494503, 0.01580308936536312, 0.020063456147909164, 0.024323824793100357, 0.02858419343829155, 0.032844558358192444, 0.037104927003383636, 0.04136529564857483, 0.04562566429376602, 0.049886032938957214, 0.05414639785885811, 0.0584067665040493, 0.0626671314239502, 0.06692750006914139, 0.07118786871433258, 0.07544823735952377, 0.07970860600471497, 0.08396897464990616, 0.08822934329509735, 0.09248970448970795, 0.09675008058547974, 0.10101044178009033, 0.10527081042528152, 0.10953117907047272, 0.11379154771566391, 0.1180519163608551, 0.1223122850060463, 0.1265726536512375, 0.13083301484584808, 0.13509339094161987, 0.13935375213623047, 0.14361411333084106, 0.14787447452545166, 0.15213485062122345, 0.15639521181583405, 0.16065558791160583, 0.16491594910621643, 0.16917632520198822, 0.17343668639659882, 0.1776970624923706]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 3.0, 4.0, 3.0, 7.0, 7.0, 11.0, 12.0, 15.0, 20.0, 32.0, 36.0, 68.0, 103.0, 131.0, 219.0, 364.0, 719.0, 1394.0, 3265.0, 8669.0, 28501.0, 147383.0, 687477.0, 129846.0, 26105.0, 7989.0, 3097.0, 1374.0, 690.0, 358.0, 212.0, 141.0, 80.0, 47.0, 38.0, 33.0, 20.0, 13.0, 19.0, 13.0, 10.0, 2.0, 5.0, 2.0, 8.0, 1.0, 1.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00792694091796875, -0.00761568546295166, -0.00730443000793457, -0.0069931745529174805, -0.006681919097900391, -0.006370663642883301, -0.006059408187866211, -0.005748152732849121, -0.005436897277832031, -0.005125641822814941, -0.0048143863677978516, -0.004503130912780762, -0.004191875457763672, -0.003880620002746582, -0.003569364547729492, -0.0032581090927124023, -0.0029468536376953125, -0.0026355981826782227, -0.002324342727661133, -0.002013087272644043, -0.0017018318176269531, -0.0013905763626098633, -0.0010793209075927734, -0.0007680654525756836, -0.00045680999755859375, -0.0001455545425415039, 0.00016570091247558594, 0.0004769563674926758, 0.0007882118225097656, 0.0010994672775268555, 0.0014107227325439453, 0.0017219781875610352, 0.002033233642578125, 0.002344489097595215, 0.0026557445526123047, 0.0029670000076293945, 0.0032782554626464844, 0.0035895109176635742, 0.003900766372680664, 0.004212021827697754, 0.004523277282714844, 0.004834532737731934, 0.0051457881927490234, 0.005457043647766113, 0.005768299102783203, 0.006079554557800293, 0.006390810012817383, 0.006702065467834473, 0.0070133209228515625, 0.007324576377868652, 0.007635831832885742, 0.007947087287902832, 0.008258342742919922, 0.008569598197937012, 0.008880853652954102, 0.009192109107971191, 0.009503364562988281, 0.009814620018005371, 0.010125875473022461, 0.01043713092803955, 0.01074838638305664, 0.01105964183807373, 0.01137089729309082, 0.01168215274810791, 0.011993408203125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 9.0, 12.0, 21.0, 29.0, 42.0, 86.0, 135.0, 137.0, 142.0, 125.0, 87.0, 63.0, 38.0, 37.0, 27.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006771087646484375, -0.006403505802154541, -0.006035923957824707, -0.005668342113494873, -0.005300760269165039, -0.004933178424835205, -0.004565596580505371, -0.004198014736175537, -0.003830432891845703, -0.003462851047515869, -0.003095269203186035, -0.002727687358856201, -0.002360105514526367, -0.001992523670196533, -0.0016249418258666992, -0.0012573599815368652, -0.0008897781372070312, -0.0005221962928771973, -0.00015461444854736328, 0.0002129673957824707, 0.0005805492401123047, 0.0009481310844421387, 0.0013157129287719727, 0.0016832947731018066, 0.0020508766174316406, 0.0024184584617614746, 0.0027860403060913086, 0.0031536221504211426, 0.0035212039947509766, 0.0038887858390808105, 0.0042563676834106445, 0.0046239495277404785, 0.0049915313720703125, 0.0053591132164001465, 0.0057266950607299805, 0.0060942769050598145, 0.0064618587493896484, 0.006829440593719482, 0.007197022438049316, 0.00756460428237915, 0.007932186126708984, 0.008299767971038818, 0.008667349815368652, 0.009034931659698486, 0.00940251350402832, 0.009770095348358154, 0.010137677192687988, 0.010505259037017822, 0.010872840881347656, 0.01124042272567749, 0.011608004570007324, 0.011975586414337158, 0.012343168258666992, 0.012710750102996826, 0.01307833194732666, 0.013445913791656494, 0.013813495635986328, 0.014181077480316162, 0.014548659324645996, 0.01491624116897583, 0.015283823013305664, 0.015651404857635498, 0.016018986701965332, 0.016386568546295166, 0.016754150390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 6.0, 4.0, 5.0, 7.0, 12.0, 10.0, 16.0, 10.0, 18.0, 28.0, 36.0, 55.0, 72.0, 114.0, 174.0, 303.0, 557.0, 1200.0, 2994.0, 11970.0, 90059.0, 872751.0, 54890.0, 8494.0, 2533.0, 955.0, 509.0, 269.0, 153.0, 108.0, 66.0, 39.0, 25.0, 27.0, 21.0, 13.0, 11.0, 10.0, 8.0, 9.0, 0.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01068878173828125, -0.010348320007324219, -0.010007858276367188, -0.009667396545410156, -0.009326934814453125, -0.008986473083496094, -0.008646011352539062, -0.008305549621582031, -0.007965087890625, -0.007624626159667969, -0.0072841644287109375, -0.006943702697753906, -0.006603240966796875, -0.006262779235839844, -0.0059223175048828125, -0.005581855773925781, -0.00524139404296875, -0.004900932312011719, -0.0045604705810546875, -0.004220008850097656, -0.003879547119140625, -0.0035390853881835938, -0.0031986236572265625, -0.0028581619262695312, -0.0025177001953125, -0.0021772384643554688, -0.0018367767333984375, -0.0014963150024414062, -0.001155853271484375, -0.0008153915405273438, -0.0004749298095703125, -0.00013446807861328125, 0.00020599365234375, 0.0005464553833007812, 0.0008869171142578125, 0.0012273788452148438, 0.001567840576171875, 0.0019083023071289062, 0.0022487640380859375, 0.0025892257690429688, 0.0029296875, 0.0032701492309570312, 0.0036106109619140625, 0.003951072692871094, 0.004291534423828125, 0.004631996154785156, 0.0049724578857421875, 0.005312919616699219, 0.00565338134765625, 0.005993843078613281, 0.0063343048095703125, 0.006674766540527344, 0.007015228271484375, 0.007355690002441406, 0.0076961517333984375, 0.008036613464355469, 0.0083770751953125, 0.008717536926269531, 0.009057998657226562, 0.009398460388183594, 0.009738922119140625, 0.010079383850097656, 0.010419845581054688, 0.010760307312011719, 0.01110076904296875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 5.0, 1.0, 2.0, 7.0, 7.0, 6.0, 5.0, 6.0, 16.0, 11.0, 21.0, 19.0, 24.0, 28.0, 35.0, 55.0, 56.0, 69.0, 76.0, 86.0, 79.0, 62.0, 58.0, 40.0, 39.0, 40.0, 27.0, 24.0, 22.0, 13.0, 10.0, 13.0, 8.0, 5.0, 4.0, 6.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0196380615234375, -0.018996000289916992, -0.018353939056396484, -0.017711877822875977, -0.01706981658935547, -0.01642775535583496, -0.015785694122314453, -0.015143632888793945, -0.014501571655273438, -0.01385951042175293, -0.013217449188232422, -0.012575387954711914, -0.011933326721191406, -0.011291265487670898, -0.01064920425415039, -0.010007143020629883, -0.009365081787109375, -0.008723020553588867, -0.00808095932006836, -0.0074388980865478516, -0.006796836853027344, -0.006154775619506836, -0.005512714385986328, -0.00487065315246582, -0.0042285919189453125, -0.0035865306854248047, -0.002944469451904297, -0.002302408218383789, -0.0016603469848632812, -0.0010182857513427734, -0.0003762245178222656, 0.0002658367156982422, 0.00090789794921875, 0.0015499591827392578, 0.0021920204162597656, 0.0028340816497802734, 0.0034761428833007812, 0.004118204116821289, 0.004760265350341797, 0.005402326583862305, 0.0060443878173828125, 0.00668644905090332, 0.007328510284423828, 0.007970571517944336, 0.008612632751464844, 0.009254693984985352, 0.00989675521850586, 0.010538816452026367, 0.011180877685546875, 0.011822938919067383, 0.01246500015258789, 0.013107061386108398, 0.013749122619628906, 0.014391183853149414, 0.015033245086669922, 0.01567530632019043, 0.016317367553710938, 0.016959428787231445, 0.017601490020751953, 0.01824355125427246, 0.01888561248779297, 0.019527673721313477, 0.020169734954833984, 0.020811796188354492, 0.021453857421875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 9.0, 10.0, 7.0, 17.0, 25.0, 30.0, 62.0, 91.0, 191.0, 418.0, 1355.0, 6181.0, 137906.0, 889755.0, 9698.0, 1797.0, 500.0, 200.0, 96.0, 72.0, 40.0, 28.0, 24.0, 9.0, 6.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0046844482421875, -0.004538536071777344, -0.0043926239013671875, -0.004246711730957031, -0.004100799560546875, -0.003954887390136719, -0.0038089752197265625, -0.0036630630493164062, -0.00351715087890625, -0.0033712387084960938, -0.0032253265380859375, -0.0030794143676757812, -0.002933502197265625, -0.0027875900268554688, -0.0026416778564453125, -0.0024957656860351562, -0.002349853515625, -0.0022039413452148438, -0.0020580291748046875, -0.0019121170043945312, -0.001766204833984375, -0.0016202926635742188, -0.0014743804931640625, -0.0013284683227539062, -0.00118255615234375, -0.0010366439819335938, -0.0008907318115234375, -0.0007448196411132812, -0.000598907470703125, -0.00045299530029296875, -0.0003070831298828125, -0.00016117095947265625, -1.52587890625e-05, 0.00013065338134765625, 0.0002765655517578125, 0.00042247772216796875, 0.000568389892578125, 0.0007143020629882812, 0.0008602142333984375, 0.0010061264038085938, 0.00115203857421875, 0.0012979507446289062, 0.0014438629150390625, 0.0015897750854492188, 0.001735687255859375, 0.0018815994262695312, 0.0020275115966796875, 0.0021734237670898438, 0.0023193359375, 0.0024652481079101562, 0.0026111602783203125, 0.0027570724487304688, 0.002902984619140625, 0.0030488967895507812, 0.0031948089599609375, 0.0033407211303710938, 0.00348663330078125, 0.0036325454711914062, 0.0037784576416015625, 0.003924369812011719, 0.004070281982421875, 0.004216194152832031, 0.0043621063232421875, 0.004508018493652344, 0.0046539306640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 0.0, 4.0, 0.0, 7.0, 6.0, 7.0, 5.0, 7.0, 10.0, 13.0, 13.0, 11.0, 8.0, 24.0, 34.0, 37.0, 23.0, 47.0, 63.0, 41.0, 48.0, 33.0, 54.0, 94.0, 49.0, 33.0, 43.0, 31.0, 57.0, 34.0, 26.0, 17.0, 22.0, 22.0, 13.0, 13.0, 8.0, 9.0, 4.0, 6.0, 8.0, 5.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.410743713378906e-06, -4.279427230358124e-06, -4.148110747337341e-06, -4.016794264316559e-06, -3.885477781295776e-06, -3.754161298274994e-06, -3.6228448152542114e-06, -3.491528332233429e-06, -3.3602118492126465e-06, -3.228895366191864e-06, -3.0975788831710815e-06, -2.966262400150299e-06, -2.8349459171295166e-06, -2.703629434108734e-06, -2.5723129510879517e-06, -2.440996468067169e-06, -2.3096799850463867e-06, -2.1783635020256042e-06, -2.0470470190048218e-06, -1.9157305359840393e-06, -1.7844140529632568e-06, -1.6530975699424744e-06, -1.521781086921692e-06, -1.3904646039009094e-06, -1.259148120880127e-06, -1.1278316378593445e-06, -9.96515154838562e-07, -8.651986718177795e-07, -7.338821887969971e-07, -6.025657057762146e-07, -4.7124922275543213e-07, -3.3993273973464966e-07, -2.086162567138672e-07, -7.729977369308472e-08, 5.4016709327697754e-08, 1.8533319234848022e-07, 3.166496753692627e-07, 4.4796615839004517e-07, 5.792826414108276e-07, 7.105991244316101e-07, 8.419156074523926e-07, 9.73232090473175e-07, 1.1045485734939575e-06, 1.23586505651474e-06, 1.3671815395355225e-06, 1.498498022556305e-06, 1.6298145055770874e-06, 1.7611309885978699e-06, 1.8924474716186523e-06, 2.023763954639435e-06, 2.1550804376602173e-06, 2.2863969206809998e-06, 2.4177134037017822e-06, 2.5490298867225647e-06, 2.680346369743347e-06, 2.8116628527641296e-06, 2.942979335784912e-06, 3.0742958188056946e-06, 3.205612301826477e-06, 3.3369287848472595e-06, 3.468245267868042e-06, 3.5995617508888245e-06, 3.730878233909607e-06, 3.862194716930389e-06, 3.993511199951172e-06]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 7.0, 5.0, 13.0, 28.0, 47.0, 77.0, 89.0, 229.0, 357.0, 766.0, 1780.0, 5255.0, 22479.0, 733054.0, 256106.0, 20073.0, 4969.0, 1694.0, 728.0, 338.0, 173.0, 93.0, 58.0, 43.0, 21.0, 17.0, 16.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014171600341796875, -0.0013682395219802856, -0.0013193190097808838, -0.001270398497581482, -0.00122147798538208, -0.0011725574731826782, -0.0011236369609832764, -0.0010747164487838745, -0.0010257959365844727, -0.0009768754243850708, -0.0009279549121856689, -0.0008790343999862671, -0.0008301138877868652, -0.0007811933755874634, -0.0007322728633880615, -0.0006833523511886597, -0.0006344318389892578, -0.000585511326789856, -0.0005365908145904541, -0.00048767030239105225, -0.0004387497901916504, -0.00038982927799224854, -0.0003409087657928467, -0.0002919882535934448, -0.00024306774139404297, -0.0001941472291946411, -0.00014522671699523926, -9.63062047958374e-05, -4.738569259643555e-05, 1.5348196029663086e-06, 5.0455331802368164e-05, 9.937584400177002e-05, 0.00014829635620117188, 0.00019721686840057373, 0.0002461373805999756, 0.00029505789279937744, 0.0003439784049987793, 0.00039289891719818115, 0.000441819429397583, 0.0004907399415969849, 0.0005396604537963867, 0.0005885809659957886, 0.0006375014781951904, 0.0006864219903945923, 0.0007353425025939941, 0.000784263014793396, 0.0008331835269927979, 0.0008821040391921997, 0.0009310245513916016, 0.0009799450635910034, 0.0010288655757904053, 0.0010777860879898071, 0.001126706600189209, 0.0011756271123886108, 0.0012245476245880127, 0.0012734681367874146, 0.0013223886489868164, 0.0013713091611862183, 0.0014202296733856201, 0.001469150185585022, 0.0015180706977844238, 0.0015669912099838257, 0.0016159117221832275, 0.0016648322343826294, 0.0017137527465820312]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 9.0, 21.0, 14.0, 19.0, 45.0, 50.0, 118.0, 151.0, 175.0, 130.0, 101.0, 54.0, 36.0, 21.0, 10.0, 10.0, 17.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002475738525390625, -0.002370178699493408, -0.0022646188735961914, -0.0021590590476989746, -0.002053499221801758, -0.001947939395904541, -0.0018423795700073242, -0.0017368197441101074, -0.0016312599182128906, -0.0015257000923156738, -0.001420140266418457, -0.0013145804405212402, -0.0012090206146240234, -0.0011034607887268066, -0.0009979009628295898, -0.000892341136932373, -0.0007867813110351562, -0.0006812214851379395, -0.0005756616592407227, -0.00047010183334350586, -0.00036454200744628906, -0.00025898218154907227, -0.00015342235565185547, -4.786252975463867e-05, 5.7697296142578125e-05, 0.00016325712203979492, 0.0002688169479370117, 0.0003743767738342285, 0.0004799365997314453, 0.0005854964256286621, 0.0006910562515258789, 0.0007966160774230957, 0.0009021759033203125, 0.0010077357292175293, 0.001113295555114746, 0.0012188553810119629, 0.0013244152069091797, 0.0014299750328063965, 0.0015355348587036133, 0.00164109468460083, 0.0017466545104980469, 0.0018522143363952637, 0.0019577741622924805, 0.0020633339881896973, 0.002168893814086914, 0.002274453639984131, 0.0023800134658813477, 0.0024855732917785645, 0.0025911331176757812, 0.002696692943572998, 0.002802252769470215, 0.0029078125953674316, 0.0030133724212646484, 0.0031189322471618652, 0.003224492073059082, 0.003330051898956299, 0.0034356117248535156, 0.0035411715507507324, 0.0036467313766479492, 0.003752291202545166, 0.003857851028442383, 0.0039634108543396, 0.004068970680236816, 0.004174530506134033, 0.00428009033203125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 11.0, 10.0, 20.0, 50.0, 130.0, 588.0, 127.0, 47.0, 10.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.17189592123031616, -0.16756770014762878, -0.1632394641637802, -0.15891124308109283, -0.15458300709724426, -0.15025478601455688, -0.1459265649318695, -0.14159832894802094, -0.13727010786533356, -0.13294188678264618, -0.1286136507987976, -0.12428542971611023, -0.11995720118284225, -0.11562897264957428, -0.1113007515668869, -0.10697252303361893, -0.10264429450035095, -0.09831606596708298, -0.093987837433815, -0.08965961635112762, -0.08533138781785965, -0.08100315928459167, -0.0766749382019043, -0.07234670966863632, -0.06801848113536835, -0.06369025260210037, -0.059362027794122696, -0.05503380298614502, -0.050705574452877045, -0.04637734591960907, -0.04204912111163139, -0.03772089630365372, -0.033392660319805145, -0.02906443364918232, -0.024736206978559494, -0.02040798030793667, -0.016079753637313843, -0.011751526966691017, -0.0074233002960681915, -0.003095073625445366, 0.0012331530451774597, 0.005561379715800285, 0.009889606386423111, 0.014217833057045937, 0.018546059727668762, 0.022874286398291588, 0.027202513068914413, 0.03153073787689209, 0.035858966410160065, 0.04018719494342804, 0.044515419751405716, 0.04884364455938339, 0.05317187309265137, 0.05750010162591934, 0.06182832643389702, 0.0661565512418747, 0.07048477977514267, 0.07481300830841064, 0.07914122939109802, 0.083469457924366, 0.08779768645763397, 0.09212591499090195, 0.09645414352416992, 0.1007823646068573, 0.10511059314012527]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 9.0, 4.0, 6.0, 12.0, 17.0, 24.0, 26.0, 27.0, 26.0, 29.0, 44.0, 123.0, 300.0, 112.0, 38.0, 32.0, 25.0, 23.0, 22.0, 23.0, 14.0, 12.0, 9.0, 10.0, 4.0, 5.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07029181718826294, -0.06805931776762009, -0.06582681089639664, -0.06359431147575378, -0.06136180832982063, -0.05912930518388748, -0.05689680576324463, -0.05466430261731148, -0.052431799471378326, -0.050199296325445175, -0.047966793179512024, -0.04573429375886917, -0.04350179061293602, -0.04126928746700287, -0.039036788046360016, -0.036804284900426865, -0.03457178175449371, -0.03233927860856056, -0.03010677732527256, -0.027874276041984558, -0.025641772896051407, -0.023409269750118256, -0.021176768466830254, -0.01894426718354225, -0.0167117640376091, -0.014479261822998524, -0.012246759608387947, -0.01001425739377737, -0.007781755179166794, -0.005549252964556217, -0.0033167507499456406, -0.0010842494666576385, 0.0011482536792755127, 0.0033807558938860893, 0.005613258108496666, 0.007845760323107243, 0.01007826253771782, 0.012310764752328396, 0.014543266966938972, 0.016775768250226974, 0.019008271396160126, 0.021240774542093277, 0.02347327582538128, 0.02570577710866928, 0.027938280254602432, 0.030170783400535583, 0.032403282821178436, 0.03463578596711159, 0.03686828911304474, 0.03910079225897789, 0.04133329540491104, 0.043565794825553894, 0.045798297971487045, 0.0480308011174202, 0.05026330053806305, 0.0524958036839962, 0.05472830682992935, 0.0569608099758625, 0.059193313121795654, 0.06142581254243851, 0.06365831196308136, 0.06589081883430481, 0.06812331825494766, 0.07035581767559052, 0.07258832454681396]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 2.0, 3.0, 4.0, 7.0, 5.0, 10.0, 2.0, 6.0, 11.0, 20.0, 11.0, 16.0, 16.0, 23.0, 24.0, 44.0, 56.0, 117.0, 280.0, 92.0, 41.0, 47.0, 31.0, 29.0, 29.0, 16.0, 14.0, 7.0, 7.0, 9.0, 8.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00418853759765625, -0.004035472869873047, -0.0038824081420898438, -0.0037293434143066406, -0.0035762786865234375, -0.0034232139587402344, -0.0032701492309570312, -0.003117084503173828, -0.002964019775390625, -0.002810955047607422, -0.0026578903198242188, -0.0025048255920410156, -0.0023517608642578125, -0.0021986961364746094, -0.0020456314086914062, -0.0018925666809082031, -0.001739501953125, -0.0015864372253417969, -0.0014333724975585938, -0.0012803077697753906, -0.0011272430419921875, -0.0009741783142089844, -0.0008211135864257812, -0.0006680488586425781, -0.000514984130859375, -0.0003619194030761719, -0.00020885467529296875, -5.5789947509765625e-05, 9.72747802734375e-05, 0.0002503395080566406, 0.00040340423583984375, 0.0005564689636230469, 0.00070953369140625, 0.0008625984191894531, 0.0010156631469726562, 0.0011687278747558594, 0.0013217926025390625, 0.0014748573303222656, 0.0016279220581054688, 0.0017809867858886719, 0.001934051513671875, 0.002087116241455078, 0.0022401809692382812, 0.0023932456970214844, 0.0025463104248046875, 0.0026993751525878906, 0.0028524398803710938, 0.003005504608154297, 0.0031585693359375, 0.003311634063720703, 0.0034646987915039062, 0.0036177635192871094, 0.0037708282470703125, 0.003923892974853516, 0.004076957702636719, 0.004230022430419922, 0.004383087158203125, 0.004536151885986328, 0.004689216613769531, 0.004842281341552734, 0.0049953460693359375, 0.005148410797119141, 0.005301475524902344, 0.005454540252685547, 0.00560760498046875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 4.0, 20.0, 11.0, 5.0, 15.0, 36.0, 31.0, 44.0, 100.0, 252.0, 844.0, 7848.0, 8369648.0, 8293.0, 921.0, 238.0, 92.0, 76.0, 31.0, 13.0, 13.0, 14.0, 2.0, 6.0, 2.0, 3.0, 2.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.05763475224375725, -0.05601182579994202, -0.05438889563083649, -0.052765969187021255, -0.051143042743206024, -0.049520112574100494, -0.04789718613028526, -0.04627425968647003, -0.0446513332426548, -0.04302840679883957, -0.04140547662973404, -0.03978255018591881, -0.03815962374210358, -0.03653669357299805, -0.034913767129182816, -0.033290840685367584, -0.031667910516262054, -0.030044982209801674, -0.028422055765986443, -0.026799127459526062, -0.02517620101571083, -0.02355327270925045, -0.02193034440279007, -0.020307417958974838, -0.018684491515159607, -0.017061563208699226, -0.015438636764883995, -0.013815708458423615, -0.012192782014608383, -0.010569853708148003, -0.008946926333010197, -0.007323998957872391, -0.005701072514057159, -0.0040781451389193535, -0.002455217530950904, -0.0008322899229824543, 0.0007906374521553516, 0.002413565292954445, 0.004036492668092251, 0.005659420043230057, 0.007282347418367863, 0.008905274793505669, 0.010528202168643475, 0.01215112954378128, 0.013774057850241661, 0.015396985225379467, 0.017019912600517273, 0.018642839044332504, 0.020265767350792885, 0.021888695657253265, 0.023511622101068497, 0.025134550407528877, 0.02675747685134411, 0.02838040515780449, 0.03000333160161972, 0.03162626177072525, 0.03324918821454048, 0.03487211465835571, 0.03649504482746124, 0.038117971271276474, 0.039740897715091705, 0.041363827884197235, 0.042986754328012466, 0.0446096807718277, 0.04623260721564293]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 7.0, 2.0, 2.0, 4.0, 2.0, 9.0, 4.0, 7.0, 5.0, 8.0, 1.0, 5.0, 2.0, 4.0, 8.0, 2.0, 4.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023277707397937775, -0.022740105167031288, -0.0222025029361248, -0.021664900705218315, -0.02112729847431183, -0.020589694380760193, -0.020052092149853706, -0.01951448991894722, -0.018976887688040733, -0.018439285457134247, -0.01790168322622776, -0.017364080995321274, -0.016826476901769638, -0.01628887467086315, -0.015751272439956665, -0.015213670209050179, -0.014676067978143692, -0.014138465747237206, -0.013600863516330719, -0.013063260354101658, -0.012525658123195171, -0.011988055892288685, -0.011450452730059624, -0.010912850499153137, -0.01037524826824665, -0.009837646037340164, -0.009300043806433678, -0.008762440644204617, -0.00822483841329813, -0.0076872361823916435, -0.00714963348582387, -0.006612030789256096, -0.00607442669570446, -0.005536824464797974, -0.0049992217682302, -0.004461619071662426, -0.0039240168407559395, -0.0033864143770188093, -0.002848811913281679, -0.002311209449544549, -0.0017736069858074188, -0.0012360045220702887, -0.0006984020583331585, -0.00016079959459602833, 0.00037680286914110184, 0.000914405332878232, 0.0014520077966153622, 0.0019896102603524923, 0.0025272127240896225, 0.0030648151878267527, 0.003602417651563883, 0.004140020348131657, 0.004677622579038143, 0.00521522480994463, 0.0057528275065124035, 0.006290430203080177, 0.006828032433986664, 0.00736563466489315, 0.007903236895799637, 0.008440840058028698, 0.008978442288935184, 0.009516044519841671, 0.010053647682070732, 0.010591249912977219, 0.011128852143883705]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 2.0, 5.0, 9.0, 6.0, 21.0, 14.0, 36.0, 52.0, 96.0, 170.0, 224.0, 389.0, 819.0, 1722.0, 4031.0, 10191.0, 30030.0, 100196.0, 221675.0, 105560.0, 31341.0, 10403.0, 3885.0, 1545.0, 754.0, 375.0, 204.0, 162.0, 90.0, 60.0, 46.0, 38.0, 22.0, 17.0, 17.0, 14.0, 6.0, 9.0, 6.0, 4.0, 2.0, 7.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.0206298828125, -0.01995372772216797, -0.019277572631835938, -0.018601417541503906, -0.017925262451171875, -0.017249107360839844, -0.016572952270507812, -0.01589679718017578, -0.01522064208984375, -0.014544486999511719, -0.013868331909179688, -0.013192176818847656, -0.012516021728515625, -0.011839866638183594, -0.011163711547851562, -0.010487556457519531, -0.0098114013671875, -0.009135246276855469, -0.008459091186523438, -0.007782936096191406, -0.007106781005859375, -0.006430625915527344, -0.0057544708251953125, -0.005078315734863281, -0.00440216064453125, -0.0037260055541992188, -0.0030498504638671875, -0.0023736953735351562, -0.001697540283203125, -0.0010213851928710938, -0.0003452301025390625, 0.00033092498779296875, 0.001007080078125, 0.0016832351684570312, 0.0023593902587890625, 0.0030355453491210938, 0.003711700439453125, 0.004387855529785156, 0.0050640106201171875, 0.005740165710449219, 0.00641632080078125, 0.007092475891113281, 0.0077686309814453125, 0.008444786071777344, 0.009120941162109375, 0.009797096252441406, 0.010473251342773438, 0.011149406433105469, 0.0118255615234375, 0.012501716613769531, 0.013177871704101562, 0.013854026794433594, 0.014530181884765625, 0.015206336975097656, 0.015882492065429688, 0.01655864715576172, 0.01723480224609375, 0.01791095733642578, 0.018587112426757812, 0.019263267517089844, 0.019939422607421875, 0.020615577697753906, 0.021291732788085938, 0.02196788787841797, 0.02264404296875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 7.0, 7.0, 10.0, 38.0, 50.0, 87.0, 101.0, 161.0, 162.0, 159.0, 83.0, 61.0, 33.0, 23.0, 13.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006114959716796875, -0.005738317966461182, -0.005361676216125488, -0.004985034465789795, -0.0046083927154541016, -0.004231750965118408, -0.003855109214782715, -0.0034784674644470215, -0.003101825714111328, -0.0027251839637756348, -0.0023485422134399414, -0.001971900463104248, -0.0015952587127685547, -0.0012186169624328613, -0.000841975212097168, -0.0004653334617614746, -8.869171142578125e-05, 0.0002879500389099121, 0.0006645917892456055, 0.0010412335395812988, 0.0014178752899169922, 0.0017945170402526855, 0.002171158790588379, 0.0025478005409240723, 0.0029244422912597656, 0.003301084041595459, 0.0036777257919311523, 0.004054367542266846, 0.004431009292602539, 0.004807651042938232, 0.005184292793273926, 0.005560934543609619, 0.0059375762939453125, 0.006314218044281006, 0.006690859794616699, 0.007067501544952393, 0.007444143295288086, 0.00782078504562378, 0.008197426795959473, 0.008574068546295166, 0.00895071029663086, 0.009327352046966553, 0.009703993797302246, 0.01008063554763794, 0.010457277297973633, 0.010833919048309326, 0.01121056079864502, 0.011587202548980713, 0.011963844299316406, 0.0123404860496521, 0.012717127799987793, 0.013093769550323486, 0.01347041130065918, 0.013847053050994873, 0.014223694801330566, 0.01460033655166626, 0.014976978302001953, 0.015353620052337646, 0.01573026180267334, 0.016106903553009033, 0.016483545303344727, 0.01686018705368042, 0.017236828804016113, 0.017613470554351807, 0.0179901123046875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 5.0, 9.0, 6.0, 3.0, 15.0, 29.0, 126.0, 151.0, 75.0, 28.0, 9.0, 8.0, 8.0, 3.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03378673642873764, -0.03251172974705696, -0.031236721202731133, -0.029961712658405304, -0.028686705976724625, -0.027411699295043945, -0.026136690750718117, -0.024861682206392288, -0.02358667552471161, -0.02231166884303093, -0.0210366602987051, -0.019761651754379272, -0.018486645072698593, -0.017211638391017914, -0.015936629846692085, -0.014661622233688831, -0.013386614620685577, -0.012111607007682323, -0.01083659939467907, -0.009561591781675816, -0.008286584168672562, -0.007011576555669308, -0.005736568942666054, -0.0044615613296628, -0.003186553716659546, -0.001911546103656292, -0.000636538490653038, 0.0006384691223502159, 0.0019134767353534698, 0.003188484348356724, 0.004463491961359978, 0.005738499574363232, 0.007013507187366486, 0.00828851480036974, 0.009563522413372993, 0.010838530026376247, 0.012113537639379501, 0.013388545252382755, 0.01466355286538601, 0.015938561409711838, 0.017213568091392517, 0.018488574773073196, 0.019763583317399025, 0.021038591861724854, 0.022313598543405533, 0.023588605225086212, 0.02486361376941204, 0.02613862231373787, 0.02741362899541855, 0.028688635677099228, 0.029963644221425056, 0.031238652765750885, 0.032513659447431564, 0.033788666129112244, 0.03506367653608322, 0.0363386832177639, 0.03761368989944458, 0.03888869658112526, 0.04016370326280594, 0.041438713669776917, 0.042713720351457596, 0.043988727033138275, 0.04526373744010925, 0.04653874412178993, 0.04781375080347061]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 1.0, 2.0, 6.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 8.0, 12.0, 45.0, 106.0, 98.0, 80.0, 35.0, 14.0, 10.0, 4.0, 10.0, 7.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.031161367893218994, -0.030129114165902138, -0.02909686043858528, -0.028064606711268425, -0.02703235298395157, -0.026000099256634712, -0.024967845529317856, -0.023935591802001, -0.022903338074684143, -0.021871084347367287, -0.02083883062005043, -0.019806576892733574, -0.018774323165416718, -0.01774206943809986, -0.016709815710783005, -0.01567756198346615, -0.014645308256149292, -0.013613054528832436, -0.01258080080151558, -0.011548547074198723, -0.010516293346881866, -0.00948403961956501, -0.008451785892248154, -0.007419532164931297, -0.006387278437614441, -0.0053550247102975845, -0.004322770982980728, -0.0032905172556638718, -0.0022582635283470154, -0.001226009801030159, -0.0001937560737133026, 0.0008384976536035538, 0.0018707513809204102, 0.0029030051082372665, 0.003935258835554123, 0.004967512562870979, 0.005999766290187836, 0.007032020017504692, 0.008064273744821548, 0.009096527472138405, 0.010128781199455261, 0.011161034926772118, 0.012193288654088974, 0.01322554238140583, 0.014257796108722687, 0.015290049836039543, 0.0163223035633564, 0.017354557290673256, 0.018386811017990112, 0.01941906474530697, 0.020451318472623825, 0.02148357219994068, 0.022515825927257538, 0.023548079654574394, 0.02458033338189125, 0.025612587109208107, 0.026644840836524963, 0.02767709456384182, 0.028709348291158676, 0.029741602018475533, 0.03077385574579239, 0.031806111335754395, 0.0328383632004261, 0.03387061506509781, 0.034902870655059814]}, "eval/loss": 4.547459125518799, "eval/wer": 2.4429393097976995, "eval/runtime": 930.4687, "eval/samples_per_second": 2.839, "eval/steps_per_second": 0.238, "train/train_runtime": 6725.1387, "train/train_samples_per_second": 4.243, "train/train_steps_per_second": 0.177, "train/total_flos": 0.0, "train/train_loss": 4.647471772210753} \ No newline at end of file +{"train/loss": 5.1519, "train/learning_rate": 1.741654571843251e-06, "train/epoch": 1.0, "train/global_step": 1189, "_runtime": 8088, "_timestamp": 1646243983, "_step": 1192, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 39.0, 666.0, 303.0, 7.0, 1.0, 0.0, 1.0], "bins": [-403.2832946777344, -396.4258117675781, -389.5683288574219, -382.7108459472656, -375.8533630371094, -368.9958801269531, -362.138427734375, -355.28094482421875, -348.4234619140625, -341.56597900390625, -334.70849609375, -327.85101318359375, -320.9935302734375, -314.13604736328125, -307.278564453125, -300.42108154296875, -293.5635986328125, -286.70611572265625, -279.8486328125, -272.99114990234375, -266.1336669921875, -259.27618408203125, -252.41871643066406, -245.5612335205078, -238.70376586914062, -231.84628295898438, -224.98880004882812, -218.13131713867188, -211.2738494873047, -204.41636657714844, -197.5588836669922, -190.70140075683594, -183.84393310546875, -176.9864501953125, -170.12896728515625, -163.271484375, -156.4140167236328, -149.55653381347656, -142.6990509033203, -135.84156799316406, -128.9840850830078, -122.12660217285156, -115.26912689208984, -108.4116439819336, -101.55416107177734, -94.69668579101562, -87.83920288085938, -80.98171997070312, -74.12423706054688, -67.26675415039062, -60.40927505493164, -53.551795959472656, -46.694313049316406, -39.83683395385742, -32.97935485839844, -26.121871948242188, -19.264392852783203, -12.406911849975586, -5.549431800842285, 1.3080482482910156, 8.165529251098633, 15.02301025390625, 21.880489349365234, 28.737972259521484, 35.59545135498047]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 2.0, 4.0, 10.0, 8.0, 12.0, 10.0, 11.0, 23.0, 12.0, 16.0, 20.0, 30.0, 24.0, 30.0, 35.0, 37.0, 35.0, 57.0, 39.0, 42.0, 42.0, 43.0, 40.0, 36.0, 42.0, 36.0, 30.0, 32.0, 24.0, 31.0, 28.0, 17.0, 24.0, 21.0, 15.0, 14.0, 14.0, 13.0, 6.0, 5.0, 4.0, 8.0, 3.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-56.051300048828125, -54.218135833740234, -52.384971618652344, -50.55180740356445, -48.71864318847656, -46.88547897338867, -45.05231475830078, -43.21915054321289, -41.385986328125, -39.55282211303711, -37.71965789794922, -35.88649368286133, -34.05332946777344, -32.22016525268555, -30.387001037597656, -28.553836822509766, -26.720674514770508, -24.887510299682617, -23.054346084594727, -21.221181869506836, -19.388017654418945, -17.554855346679688, -15.72169017791748, -13.88852596282959, -12.0553617477417, -10.222197532653809, -8.389033317565918, -6.5558695793151855, -4.722705364227295, -2.8895416259765625, -1.0563774108886719, 0.7767868041992188, 2.6099510192871094, 4.443115234375, 6.276279449462891, 8.109443664550781, 9.942607879638672, 11.775771141052246, 13.608935356140137, 15.442099571228027, 17.275264739990234, 19.108428955078125, 20.941593170166016, 22.774757385253906, 24.607921600341797, 26.441085815429688, 28.274250030517578, 30.10741424560547, 31.940576553344727, 33.773738861083984, 35.606903076171875, 37.440067291259766, 39.273231506347656, 41.10639572143555, 42.93955993652344, 44.77272415161133, 46.60588836669922, 48.43905258178711, 50.272216796875, 52.10538101196289, 53.93854522705078, 55.77170944213867, 57.60487365722656, 59.43803787231445, 61.271202087402344]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 15.0, 13.0, 14.0, 33.0, 29.0, 41.0, 51.0, 70.0, 70.0, 74.0, 85.0, 77.0, 74.0, 68.0, 60.0, 59.0, 45.0, 45.0, 27.0, 15.0, 14.0, 7.0, 7.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.728515625, -3.641937255859375, -3.55535888671875, -3.468780517578125, -3.3822021484375, -3.295623779296875, -3.20904541015625, -3.122467041015625, -3.035888671875, -2.949310302734375, -2.86273193359375, -2.776153564453125, -2.6895751953125, -2.602996826171875, -2.51641845703125, -2.429840087890625, -2.34326171875, -2.256683349609375, -2.17010498046875, -2.083526611328125, -1.9969482421875, -1.910369873046875, -1.82379150390625, -1.737213134765625, -1.650634765625, -1.564056396484375, -1.47747802734375, -1.390899658203125, -1.3043212890625, -1.217742919921875, -1.13116455078125, -1.044586181640625, -0.9580078125, -0.871429443359375, -0.78485107421875, -0.698272705078125, -0.6116943359375, -0.525115966796875, -0.43853759765625, -0.351959228515625, -0.265380859375, -0.178802490234375, -0.09222412109375, -0.005645751953125, 0.0809326171875, 0.167510986328125, 0.25408935546875, 0.340667724609375, 0.42724609375, 0.513824462890625, 0.60040283203125, 0.686981201171875, 0.7735595703125, 0.860137939453125, 0.94671630859375, 1.033294677734375, 1.119873046875, 1.206451416015625, 1.29302978515625, 1.379608154296875, 1.4661865234375, 1.552764892578125, 1.63934326171875, 1.725921630859375, 1.8125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 0.0, 10.0, 11.0, 23.0, 29.0, 64.0, 77.0, 120.0, 228.0, 450.0, 833.0, 2069.0, 6217.0, 47833.0, 3781207.0, 334939.0, 14092.0, 3323.0, 1314.0, 631.0, 346.0, 189.0, 111.0, 59.0, 35.0, 33.0, 18.0, 9.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-24.46875, -23.882568359375, -23.29638671875, -22.710205078125, -22.1240234375, -21.537841796875, -20.95166015625, -20.365478515625, -19.779296875, -19.193115234375, -18.60693359375, -18.020751953125, -17.4345703125, -16.848388671875, -16.26220703125, -15.676025390625, -15.08984375, -14.503662109375, -13.91748046875, -13.331298828125, -12.7451171875, -12.158935546875, -11.57275390625, -10.986572265625, -10.400390625, -9.814208984375, -9.22802734375, -8.641845703125, -8.0556640625, -7.469482421875, -6.88330078125, -6.297119140625, -5.7109375, -5.124755859375, -4.53857421875, -3.952392578125, -3.3662109375, -2.780029296875, -2.19384765625, -1.607666015625, -1.021484375, -0.435302734375, 0.15087890625, 0.737060546875, 1.3232421875, 1.909423828125, 2.49560546875, 3.081787109375, 3.66796875, 4.254150390625, 4.84033203125, 5.426513671875, 6.0126953125, 6.598876953125, 7.18505859375, 7.771240234375, 8.357421875, 8.943603515625, 9.52978515625, 10.115966796875, 10.7021484375, 11.288330078125, 11.87451171875, 12.460693359375, 13.046875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 3.0, 6.0, 12.0, 23.0, 34.0, 64.0, 139.0, 237.0, 451.0, 822.0, 948.0, 613.0, 318.0, 179.0, 94.0, 63.0, 28.0, 21.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-17.90625, -17.5263671875, -17.146484375, -16.7666015625, -16.38671875, -16.0068359375, -15.626953125, -15.2470703125, -14.8671875, -14.4873046875, -14.107421875, -13.7275390625, -13.34765625, -12.9677734375, -12.587890625, -12.2080078125, -11.828125, -11.4482421875, -11.068359375, -10.6884765625, -10.30859375, -9.9287109375, -9.548828125, -9.1689453125, -8.7890625, -8.4091796875, -8.029296875, -7.6494140625, -7.26953125, -6.8896484375, -6.509765625, -6.1298828125, -5.75, -5.3701171875, -4.990234375, -4.6103515625, -4.23046875, -3.8505859375, -3.470703125, -3.0908203125, -2.7109375, -2.3310546875, -1.951171875, -1.5712890625, -1.19140625, -0.8115234375, -0.431640625, -0.0517578125, 0.328125, 0.7080078125, 1.087890625, 1.4677734375, 1.84765625, 2.2275390625, 2.607421875, 2.9873046875, 3.3671875, 3.7470703125, 4.126953125, 4.5068359375, 4.88671875, 5.2666015625, 5.646484375, 6.0263671875, 6.40625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 8.0, 9.0, 10.0, 27.0, 50.0, 123.0, 263.0, 691.0, 3128.0, 691723.0, 3491822.0, 4969.0, 883.0, 330.0, 129.0, 62.0, 27.0, 12.0, 8.0, 10.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.28125, -44.79248046875, -43.3037109375, -41.81494140625, -40.326171875, -38.83740234375, -37.3486328125, -35.85986328125, -34.37109375, -32.88232421875, -31.3935546875, -29.90478515625, -28.416015625, -26.92724609375, -25.4384765625, -23.94970703125, -22.4609375, -20.97216796875, -19.4833984375, -17.99462890625, -16.505859375, -15.01708984375, -13.5283203125, -12.03955078125, -10.55078125, -9.06201171875, -7.5732421875, -6.08447265625, -4.595703125, -3.10693359375, -1.6181640625, -0.12939453125, 1.359375, 2.84814453125, 4.3369140625, 5.82568359375, 7.314453125, 8.80322265625, 10.2919921875, 11.78076171875, 13.26953125, 14.75830078125, 16.2470703125, 17.73583984375, 19.224609375, 20.71337890625, 22.2021484375, 23.69091796875, 25.1796875, 26.66845703125, 28.1572265625, 29.64599609375, 31.134765625, 32.62353515625, 34.1123046875, 35.60107421875, 37.08984375, 38.57861328125, 40.0673828125, 41.55615234375, 43.044921875, 44.53369140625, 46.0224609375, 47.51123046875, 49.0]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 11.0, 67.0, 329.0, 452.0, 125.0, 25.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-148.87753295898438, -146.17604064941406, -143.47454833984375, -140.77305603027344, -138.07156372070312, -135.3700714111328, -132.6685791015625, -129.9670867919922, -127.26558685302734, -124.56409454345703, -121.86260223388672, -119.1611099243164, -116.4596176147461, -113.75811767578125, -111.05662536621094, -108.35513305664062, -105.65364074707031, -102.9521484375, -100.25065612792969, -97.54916381835938, -94.84767150878906, -92.14617919921875, -89.44468688964844, -86.7431869506836, -84.04170227050781, -81.3402099609375, -78.63871765136719, -75.93722534179688, -73.23573303222656, -70.53424072265625, -67.83274841308594, -65.1312484741211, -62.42975616455078, -59.72826385498047, -57.026771545410156, -54.325279235839844, -51.623783111572266, -48.92229080200195, -46.22079849243164, -43.51930236816406, -40.81781005859375, -38.11631774902344, -35.414825439453125, -32.71333312988281, -30.011837005615234, -27.310344696044922, -24.60885238647461, -21.907358169555664, -19.20586585998535, -16.50437355041504, -13.802879333496094, -11.101387023925781, -8.399893760681152, -5.698400497436523, -2.996908187866211, -0.2954139709472656, 2.406078338623047, 5.107571601867676, 7.8090643882751465, 10.510557174682617, 13.212050437927246, 15.913543701171875, 18.615036010742188, 21.316530227661133, 24.018022537231445]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 3.0, 8.0, 12.0, 7.0, 6.0, 13.0, 15.0, 12.0, 24.0, 22.0, 26.0, 29.0, 29.0, 27.0, 36.0, 46.0, 44.0, 44.0, 49.0, 51.0, 54.0, 36.0, 35.0, 48.0, 35.0, 30.0, 32.0, 35.0, 40.0, 24.0, 18.0, 22.0, 11.0, 18.0, 13.0, 15.0, 5.0, 7.0, 5.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0], "bins": [-29.539199829101562, -28.756149291992188, -27.973098754882812, -27.190048217773438, -26.406997680664062, -25.623945236206055, -24.84089469909668, -24.057844161987305, -23.27479362487793, -22.491743087768555, -21.70869255065918, -20.925642013549805, -20.142589569091797, -19.359539031982422, -18.576488494873047, -17.793437957763672, -17.010387420654297, -16.227336883544922, -15.444286346435547, -14.661234855651855, -13.87818431854248, -13.095133781433105, -12.312082290649414, -11.529031753540039, -10.745981216430664, -9.962930679321289, -9.179880142211914, -8.396828651428223, -7.613778114318848, -6.830727577209473, -6.0476765632629395, -5.264625549316406, -4.481575012207031, -3.698524236679077, -2.915473461151123, -2.132422685623169, -1.3493719100952148, -0.5663211345672607, 0.21672964096069336, 0.9997806549072266, 1.7828311920166016, 2.5658819675445557, 3.3489327430725098, 4.131983757019043, 4.915034294128418, 5.698084831237793, 6.481135845184326, 7.264186859130859, 8.047237396240234, 8.83028793334961, 9.613338470458984, 10.396389961242676, 11.17944049835205, 11.962491035461426, 12.745542526245117, 13.528593063354492, 14.311643600463867, 15.094694137573242, 15.877744674682617, 16.660795211791992, 17.44384765625, 18.226898193359375, 19.00994873046875, 19.792999267578125, 20.5760498046875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 7.0, 4.0, 4.0, 18.0, 14.0, 25.0, 21.0, 20.0, 31.0, 48.0, 49.0, 40.0, 65.0, 68.0, 56.0, 69.0, 63.0, 62.0, 65.0, 53.0, 43.0, 38.0, 40.0, 28.0, 22.0, 10.0, 17.0, 6.0, 10.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0], "bins": [-3.1328125, -3.0621490478515625, -2.991485595703125, -2.9208221435546875, -2.85015869140625, -2.7794952392578125, -2.708831787109375, -2.6381683349609375, -2.5675048828125, -2.4968414306640625, -2.426177978515625, -2.3555145263671875, -2.28485107421875, -2.2141876220703125, -2.143524169921875, -2.0728607177734375, -2.002197265625, -1.9315338134765625, -1.860870361328125, -1.7902069091796875, -1.71954345703125, -1.6488800048828125, -1.578216552734375, -1.5075531005859375, -1.4368896484375, -1.3662261962890625, -1.295562744140625, -1.2248992919921875, -1.15423583984375, -1.0835723876953125, -1.012908935546875, -0.9422454833984375, -0.87158203125, -0.8009185791015625, -0.730255126953125, -0.6595916748046875, -0.58892822265625, -0.5182647705078125, -0.447601318359375, -0.3769378662109375, -0.3062744140625, -0.2356109619140625, -0.164947509765625, -0.0942840576171875, -0.02362060546875, 0.0470428466796875, 0.117706298828125, 0.1883697509765625, 0.259033203125, 0.3296966552734375, 0.400360107421875, 0.4710235595703125, 0.54168701171875, 0.6123504638671875, 0.683013916015625, 0.7536773681640625, 0.8243408203125, 0.8950042724609375, 0.965667724609375, 1.0363311767578125, 1.10699462890625, 1.1776580810546875, 1.248321533203125, 1.3189849853515625, 1.3896484375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 6.0, 6.0, 8.0, 5.0, 8.0, 11.0, 9.0, 11.0, 25.0, 35.0, 64.0, 97.0, 178.0, 414.0, 866.0, 1655.0, 3606.0, 7591.0, 16643.0, 38682.0, 103024.0, 415424.0, 311612.0, 87079.0, 33793.0, 14710.0, 6696.0, 3208.0, 1515.0, 746.0, 369.0, 179.0, 80.0, 60.0, 41.0, 23.0, 11.0, 8.0, 10.0, 13.0, 6.0, 11.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0218048095703125, -0.02114248275756836, -0.02048015594482422, -0.019817829132080078, -0.019155502319335938, -0.018493175506591797, -0.017830848693847656, -0.017168521881103516, -0.016506195068359375, -0.015843868255615234, -0.015181541442871094, -0.014519214630126953, -0.013856887817382812, -0.013194561004638672, -0.012532234191894531, -0.01186990737915039, -0.01120758056640625, -0.01054525375366211, -0.009882926940917969, -0.009220600128173828, -0.008558273315429688, -0.007895946502685547, -0.007233619689941406, -0.006571292877197266, -0.005908966064453125, -0.005246639251708984, -0.004584312438964844, -0.003921985626220703, -0.0032596588134765625, -0.002597332000732422, -0.0019350051879882812, -0.0012726783752441406, -0.0006103515625, 5.1975250244140625e-05, 0.0007143020629882812, 0.0013766288757324219, 0.0020389556884765625, 0.002701282501220703, 0.0033636093139648438, 0.004025936126708984, 0.004688262939453125, 0.005350589752197266, 0.006012916564941406, 0.006675243377685547, 0.0073375701904296875, 0.007999897003173828, 0.008662223815917969, 0.00932455062866211, 0.00998687744140625, 0.01064920425415039, 0.011311531066894531, 0.011973857879638672, 0.012636184692382812, 0.013298511505126953, 0.013960838317871094, 0.014623165130615234, 0.015285491943359375, 0.015947818756103516, 0.016610145568847656, 0.017272472381591797, 0.017934799194335938, 0.018597126007080078, 0.01925945281982422, 0.01992177963256836, 0.0205841064453125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 4.0, 0.0, 3.0, 5.0, 4.0, 6.0, 2.0, 13.0, 15.0, 11.0, 20.0, 17.0, 14.0, 23.0, 20.0, 18.0, 30.0, 27.0, 31.0, 32.0, 51.0, 49.0, 46.0, 45.0, 1061.0, 42.0, 41.0, 41.0, 35.0, 42.0, 32.0, 36.0, 32.0, 28.0, 22.0, 16.0, 25.0, 18.0, 13.0, 9.0, 16.0, 8.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.97998046875, -0.9477157592773438, -0.9154510498046875, -0.8831863403320312, -0.850921630859375, -0.8186569213867188, -0.7863922119140625, -0.7541275024414062, -0.72186279296875, -0.6895980834960938, -0.6573333740234375, -0.6250686645507812, -0.592803955078125, -0.5605392456054688, -0.5282745361328125, -0.49600982666015625, -0.4637451171875, -0.43148040771484375, -0.3992156982421875, -0.36695098876953125, -0.334686279296875, -0.30242156982421875, -0.2701568603515625, -0.23789215087890625, -0.20562744140625, -0.17336273193359375, -0.1410980224609375, -0.10883331298828125, -0.076568603515625, -0.04430389404296875, -0.0120391845703125, 0.02022552490234375, 0.052490234375, 0.08475494384765625, 0.1170196533203125, 0.14928436279296875, 0.181549072265625, 0.21381378173828125, 0.2460784912109375, 0.27834320068359375, 0.31060791015625, 0.34287261962890625, 0.3751373291015625, 0.40740203857421875, 0.439666748046875, 0.47193145751953125, 0.5041961669921875, 0.5364608764648438, 0.5687255859375, 0.6009902954101562, 0.6332550048828125, 0.6655197143554688, 0.697784423828125, 0.7300491333007812, 0.7623138427734375, 0.7945785522460938, 0.82684326171875, 0.8591079711914062, 0.8913726806640625, 0.9236373901367188, 0.955902099609375, 0.9881668090820312, 1.0204315185546875, 1.0526962280273438, 1.0849609375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 11.0, 28.0, 25.0, 39.0, 62.0, 109.0, 153.0, 231.0, 326.0, 383.0, 684.0, 969.0, 1480.0, 2228.0, 3402.0, 5230.0, 8127.0, 12528.0, 20118.0, 32612.0, 54585.0, 100946.0, 231085.0, 1334619.0, 122295.0, 63595.0, 37380.0, 23019.0, 14390.0, 9155.0, 5922.0, 3817.0, 2544.0, 1692.0, 1116.0, 682.0, 471.0, 355.0, 230.0, 133.0, 108.0, 74.0, 47.0, 40.0, 20.0, 26.0, 9.0, 9.0, 7.0, 5.0, 0.0, 3.0, 5.0], "bins": [-0.006641387939453125, -0.00644683837890625, -0.006252288818359375, -0.0060577392578125, -0.005863189697265625, -0.00566864013671875, -0.005474090576171875, -0.005279541015625, -0.005084991455078125, -0.00489044189453125, -0.004695892333984375, -0.0045013427734375, -0.004306793212890625, -0.00411224365234375, -0.003917694091796875, -0.00372314453125, -0.003528594970703125, -0.00333404541015625, -0.003139495849609375, -0.0029449462890625, -0.002750396728515625, -0.00255584716796875, -0.002361297607421875, -0.002166748046875, -0.001972198486328125, -0.00177764892578125, -0.001583099365234375, -0.0013885498046875, -0.001194000244140625, -0.00099945068359375, -0.000804901123046875, -0.0006103515625, -0.000415802001953125, -0.00022125244140625, -2.6702880859375e-05, 0.0001678466796875, 0.000362396240234375, 0.00055694580078125, 0.000751495361328125, 0.000946044921875, 0.001140594482421875, 0.00133514404296875, 0.001529693603515625, 0.0017242431640625, 0.001918792724609375, 0.00211334228515625, 0.002307891845703125, 0.00250244140625, 0.002696990966796875, 0.00289154052734375, 0.003086090087890625, 0.0032806396484375, 0.003475189208984375, 0.00366973876953125, 0.003864288330078125, 0.004058837890625, 0.004253387451171875, 0.00444793701171875, 0.004642486572265625, 0.0048370361328125, 0.005031585693359375, 0.00522613525390625, 0.005420684814453125, 0.005615234375, 0.005809783935546875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1005.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [6.0, 1.0, 0.0, 3.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 2222.0, 0.0, 1043919.0, 2264.0, 0.0, 40.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 3.0, 0.0, 2.0, 10.0], "bins": [-1.0728836059570312e-06, -1.039355993270874e-06, -1.0058283805847168e-06, -9.723007678985596e-07, -9.387731552124023e-07, -9.052455425262451e-07, -8.717179298400879e-07, -8.381903171539307e-07, -8.046627044677734e-07, -7.711350917816162e-07, -7.37607479095459e-07, -7.040798664093018e-07, -6.705522537231445e-07, -6.370246410369873e-07, -6.034970283508301e-07, -5.699694156646729e-07, -5.364418029785156e-07, -5.029141902923584e-07, -4.6938657760620117e-07, -4.3585896492004395e-07, -4.023313522338867e-07, -3.688037395477295e-07, -3.3527612686157227e-07, -3.0174851417541504e-07, -2.682209014892578e-07, -2.3469328880310059e-07, -2.0116567611694336e-07, -1.6763806343078613e-07, -1.341104507446289e-07, -1.0058283805847168e-07, -6.705522537231445e-08, -3.3527612686157227e-08, 0.0, 3.3527612686157227e-08, 6.705522537231445e-08, 1.0058283805847168e-07, 1.341104507446289e-07, 1.6763806343078613e-07, 2.0116567611694336e-07, 2.3469328880310059e-07, 2.682209014892578e-07, 3.0174851417541504e-07, 3.3527612686157227e-07, 3.688037395477295e-07, 4.023313522338867e-07, 4.3585896492004395e-07, 4.6938657760620117e-07, 5.029141902923584e-07, 5.364418029785156e-07, 5.699694156646729e-07, 6.034970283508301e-07, 6.370246410369873e-07, 6.705522537231445e-07, 7.040798664093018e-07, 7.37607479095459e-07, 7.711350917816162e-07, 8.046627044677734e-07, 8.381903171539307e-07, 8.717179298400879e-07, 9.052455425262451e-07, 9.387731552124023e-07, 9.723007678985596e-07, 1.0058283805847168e-06, 1.039355993270874e-06, 1.0728836059570312e-06]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 7.0, 4.0, 4.0, 18.0, 14.0, 25.0, 21.0, 20.0, 31.0, 48.0, 49.0, 40.0, 65.0, 68.0, 56.0, 69.0, 63.0, 62.0, 65.0, 53.0, 43.0, 38.0, 40.0, 28.0, 22.0, 10.0, 17.0, 6.0, 10.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0], "bins": [-3.1328125, -3.0621490478515625, -2.991485595703125, -2.9208221435546875, -2.85015869140625, -2.7794952392578125, -2.708831787109375, -2.6381683349609375, -2.5675048828125, -2.4968414306640625, -2.426177978515625, -2.3555145263671875, -2.28485107421875, -2.2141876220703125, -2.143524169921875, -2.0728607177734375, -2.002197265625, -1.9315338134765625, -1.860870361328125, -1.7902069091796875, -1.71954345703125, -1.6488800048828125, -1.578216552734375, -1.5075531005859375, -1.4368896484375, -1.3662261962890625, -1.295562744140625, -1.2248992919921875, -1.15423583984375, -1.0835723876953125, -1.012908935546875, -0.9422454833984375, -0.87158203125, -0.8009185791015625, -0.730255126953125, -0.6595916748046875, -0.58892822265625, -0.5182647705078125, -0.447601318359375, -0.3769378662109375, -0.3062744140625, -0.2356109619140625, -0.164947509765625, -0.0942840576171875, -0.02362060546875, 0.0470428466796875, 0.117706298828125, 0.1883697509765625, 0.259033203125, 0.3296966552734375, 0.400360107421875, 0.4710235595703125, 0.54168701171875, 0.6123504638671875, 0.683013916015625, 0.7536773681640625, 0.8243408203125, 0.8950042724609375, 0.965667724609375, 1.0363311767578125, 1.10699462890625, 1.1776580810546875, 1.248321533203125, 1.3189849853515625, 1.3896484375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 6.0, 7.0, 13.0, 14.0, 19.0, 30.0, 55.0, 75.0, 110.0, 193.0, 329.0, 510.0, 819.0, 1398.0, 2368.0, 4388.0, 8947.0, 22532.0, 128773.0, 746617.0, 93907.0, 19680.0, 8056.0, 4058.0, 2233.0, 1332.0, 792.0, 437.0, 307.0, 182.0, 127.0, 70.0, 48.0, 34.0, 27.0, 16.0, 11.0, 5.0, 6.0, 3.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0], "bins": [-9.8984375, -9.62677001953125, -9.3551025390625, -9.08343505859375, -8.811767578125, -8.54010009765625, -8.2684326171875, -7.99676513671875, -7.72509765625, -7.45343017578125, -7.1817626953125, -6.91009521484375, -6.638427734375, -6.36676025390625, -6.0950927734375, -5.82342529296875, -5.5517578125, -5.28009033203125, -5.0084228515625, -4.73675537109375, -4.465087890625, -4.19342041015625, -3.9217529296875, -3.65008544921875, -3.37841796875, -3.10675048828125, -2.8350830078125, -2.56341552734375, -2.291748046875, -2.02008056640625, -1.7484130859375, -1.47674560546875, -1.205078125, -0.93341064453125, -0.6617431640625, -0.39007568359375, -0.118408203125, 0.15325927734375, 0.4249267578125, 0.69659423828125, 0.96826171875, 1.23992919921875, 1.5115966796875, 1.78326416015625, 2.054931640625, 2.32659912109375, 2.5982666015625, 2.86993408203125, 3.1416015625, 3.41326904296875, 3.6849365234375, 3.95660400390625, 4.228271484375, 4.49993896484375, 4.7716064453125, 5.04327392578125, 5.31494140625, 5.58660888671875, 5.8582763671875, 6.12994384765625, 6.401611328125, 6.67327880859375, 6.9449462890625, 7.21661376953125, 7.48828125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 5.0, 1.0, 7.0, 17.0, 11.0, 12.0, 17.0, 24.0, 26.0, 19.0, 29.0, 25.0, 28.0, 36.0, 30.0, 45.0, 43.0, 73.0, 134.0, 1474.0, 376.0, 144.0, 58.0, 58.0, 52.0, 40.0, 42.0, 29.0, 31.0, 19.0, 19.0, 18.0, 20.0, 20.0, 16.0, 8.0, 8.0, 7.0, 12.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.70703125, -4.5640869140625, -4.421142578125, -4.2781982421875, -4.13525390625, -3.9923095703125, -3.849365234375, -3.7064208984375, -3.5634765625, -3.4205322265625, -3.277587890625, -3.1346435546875, -2.99169921875, -2.8487548828125, -2.705810546875, -2.5628662109375, -2.419921875, -2.2769775390625, -2.134033203125, -1.9910888671875, -1.84814453125, -1.7052001953125, -1.562255859375, -1.4193115234375, -1.2763671875, -1.1334228515625, -0.990478515625, -0.8475341796875, -0.70458984375, -0.5616455078125, -0.418701171875, -0.2757568359375, -0.1328125, 0.0101318359375, 0.153076171875, 0.2960205078125, 0.43896484375, 0.5819091796875, 0.724853515625, 0.8677978515625, 1.0107421875, 1.1536865234375, 1.296630859375, 1.4395751953125, 1.58251953125, 1.7254638671875, 1.868408203125, 2.0113525390625, 2.154296875, 2.2972412109375, 2.440185546875, 2.5831298828125, 2.72607421875, 2.8690185546875, 3.011962890625, 3.1549072265625, 3.2978515625, 3.4407958984375, 3.583740234375, 3.7266845703125, 3.86962890625, 4.0125732421875, 4.155517578125, 4.2984619140625, 4.44140625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 12.0, 7.0, 8.0, 7.0, 10.0, 18.0, 16.0, 12.0, 19.0, 21.0, 22.0, 24.0, 42.0, 45.0, 65.0, 107.0, 213.0, 723.0, 9179.0, 3094224.0, 39200.0, 965.0, 284.0, 113.0, 73.0, 54.0, 28.0, 25.0, 22.0, 23.0, 25.0, 23.0, 20.0, 16.0, 8.0, 14.0, 11.0, 5.0, 2.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.734375, -19.068359375, -18.40234375, -17.736328125, -17.0703125, -16.404296875, -15.73828125, -15.072265625, -14.40625, -13.740234375, -13.07421875, -12.408203125, -11.7421875, -11.076171875, -10.41015625, -9.744140625, -9.078125, -8.412109375, -7.74609375, -7.080078125, -6.4140625, -5.748046875, -5.08203125, -4.416015625, -3.75, -3.083984375, -2.41796875, -1.751953125, -1.0859375, -0.419921875, 0.24609375, 0.912109375, 1.578125, 2.244140625, 2.91015625, 3.576171875, 4.2421875, 4.908203125, 5.57421875, 6.240234375, 6.90625, 7.572265625, 8.23828125, 8.904296875, 9.5703125, 10.236328125, 10.90234375, 11.568359375, 12.234375, 12.900390625, 13.56640625, 14.232421875, 14.8984375, 15.564453125, 16.23046875, 16.896484375, 17.5625, 18.228515625, 18.89453125, 19.560546875, 20.2265625, 20.892578125, 21.55859375, 22.224609375, 22.890625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 197.0, 784.0, 33.0, 1.0, 1.0, 0.0, 1.0], "bins": [-141.17442321777344, -138.7506103515625, -136.3267822265625, -133.90296936035156, -131.47914123535156, -129.05532836914062, -126.63150024414062, -124.20768737792969, -121.78385925292969, -119.36003875732422, -116.93621826171875, -114.51239776611328, -112.08857727050781, -109.66475677490234, -107.24093627929688, -104.81712341308594, -102.39330291748047, -99.969482421875, -97.54566192626953, -95.12184143066406, -92.6980209350586, -90.27420043945312, -87.85037994384766, -85.42655944824219, -83.00274658203125, -80.57892608642578, -78.15510559082031, -75.73128509521484, -73.30746459960938, -70.8836441040039, -68.45982360839844, -66.0360107421875, -63.612186431884766, -61.1883659362793, -58.76454544067383, -56.34072494506836, -53.916908264160156, -51.49308776855469, -49.06926727294922, -46.64544677734375, -44.22162628173828, -41.79780578613281, -39.373985290527344, -36.950164794921875, -34.526344299316406, -32.10252380371094, -29.678707122802734, -27.254886627197266, -24.831066131591797, -22.407245635986328, -19.98342514038086, -17.559606552124023, -15.135786056518555, -12.711965560913086, -10.288146018981934, -7.864326477050781, -5.440506935119629, -3.0166869163513184, -0.5928668975830078, 1.8309531211853027, 4.254773139953613, 6.678593635559082, 9.102413177490234, 11.526232719421387, 13.950053215026855]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 9.0, 3.0, 5.0, 7.0, 17.0, 15.0, 32.0, 19.0, 26.0, 19.0, 23.0, 30.0, 35.0, 31.0, 32.0, 36.0, 44.0, 34.0, 47.0, 35.0, 42.0, 42.0, 45.0, 36.0, 27.0, 32.0, 35.0, 31.0, 31.0, 22.0, 22.0, 24.0, 20.0, 16.0, 15.0, 9.0, 10.0, 12.0, 7.0, 8.0, 5.0, 1.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.92745590209961, -16.432964324951172, -15.938474655151367, -15.443984031677246, -14.949493408203125, -14.455002784729004, -13.960512161254883, -13.466020584106445, -12.97153091430664, -12.47704029083252, -11.982549667358398, -11.488059043884277, -10.993568420410156, -10.499077796936035, -10.004587173461914, -9.510095596313477, -9.015604972839355, -8.521114349365234, -8.026623725891113, -7.532133102416992, -7.037642478942871, -6.54315185546875, -6.048660755157471, -5.55417013168335, -5.0596795082092285, -4.565188884735107, -4.070698261260986, -3.576207399368286, -3.081716775894165, -2.587226152420044, -2.0927352905273438, -1.5982446670532227, -1.1037540435791016, -0.6092633605003357, -0.11477267742156982, 0.3797180652618408, 0.8742086887359619, 1.368699312210083, 1.8631901741027832, 2.3576807975769043, 2.8521714210510254, 3.3466620445251465, 3.8411526679992676, 4.335643768310547, 4.830134391784668, 5.324625015258789, 5.81911563873291, 6.313606262207031, 6.808096885681152, 7.302587509155273, 7.7970781326293945, 8.291568756103516, 8.786059379577637, 9.280550003051758, 9.775041580200195, 10.26953125, 10.764022827148438, 11.258513450622559, 11.75300407409668, 12.2474946975708, 12.741985321044922, 13.236475944519043, 13.730966567993164, 14.225458145141602, 14.719947814941406]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 6.0, 14.0, 12.0, 24.0, 18.0, 22.0, 15.0, 42.0, 42.0, 48.0, 58.0, 61.0, 57.0, 55.0, 70.0, 70.0, 68.0, 52.0, 51.0, 37.0, 44.0, 35.0, 22.0, 20.0, 16.0, 11.0, 12.0, 5.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0], "bins": [-3.15234375, -3.080780029296875, -3.00921630859375, -2.937652587890625, -2.8660888671875, -2.794525146484375, -2.72296142578125, -2.651397705078125, -2.579833984375, -2.508270263671875, -2.43670654296875, -2.365142822265625, -2.2935791015625, -2.222015380859375, -2.15045166015625, -2.078887939453125, -2.00732421875, -1.935760498046875, -1.86419677734375, -1.792633056640625, -1.7210693359375, -1.649505615234375, -1.57794189453125, -1.506378173828125, -1.434814453125, -1.363250732421875, -1.29168701171875, -1.220123291015625, -1.1485595703125, -1.076995849609375, -1.00543212890625, -0.933868408203125, -0.8623046875, -0.790740966796875, -0.71917724609375, -0.647613525390625, -0.5760498046875, -0.504486083984375, -0.43292236328125, -0.361358642578125, -0.289794921875, -0.218231201171875, -0.14666748046875, -0.075103759765625, -0.0035400390625, 0.068023681640625, 0.13958740234375, 0.211151123046875, 0.28271484375, 0.354278564453125, 0.42584228515625, 0.497406005859375, 0.5689697265625, 0.640533447265625, 0.71209716796875, 0.783660888671875, 0.855224609375, 0.926788330078125, 0.99835205078125, 1.069915771484375, 1.1414794921875, 1.213043212890625, 1.28460693359375, 1.356170654296875, 1.427734375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 8.0, 8.0, 5.0, 17.0, 17.0, 38.0, 31.0, 61.0, 92.0, 162.0, 315.0, 552.0, 1474.0, 7353.0, 115096.0, 3709689.0, 341748.0, 13941.0, 2092.0, 704.0, 353.0, 197.0, 120.0, 78.0, 40.0, 25.0, 33.0, 18.0, 8.0, 3.0, 2.0, 6.0, 5.0, 3.0, 1.0, 1.0], "bins": [-20.015625, -19.5570068359375, -19.098388671875, -18.6397705078125, -18.18115234375, -17.7225341796875, -17.263916015625, -16.8052978515625, -16.3466796875, -15.8880615234375, -15.429443359375, -14.9708251953125, -14.51220703125, -14.0535888671875, -13.594970703125, -13.1363525390625, -12.677734375, -12.2191162109375, -11.760498046875, -11.3018798828125, -10.84326171875, -10.3846435546875, -9.926025390625, -9.4674072265625, -9.0087890625, -8.5501708984375, -8.091552734375, -7.6329345703125, -7.17431640625, -6.7156982421875, -6.257080078125, -5.7984619140625, -5.33984375, -4.8812255859375, -4.422607421875, -3.9639892578125, -3.50537109375, -3.0467529296875, -2.588134765625, -2.1295166015625, -1.6708984375, -1.2122802734375, -0.753662109375, -0.2950439453125, 0.16357421875, 0.6221923828125, 1.080810546875, 1.5394287109375, 1.998046875, 2.4566650390625, 2.915283203125, 3.3739013671875, 3.83251953125, 4.2911376953125, 4.749755859375, 5.2083740234375, 5.6669921875, 6.1256103515625, 6.584228515625, 7.0428466796875, 7.50146484375, 7.9600830078125, 8.418701171875, 8.8773193359375, 9.3359375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 4.0, 6.0, 16.0, 29.0, 21.0, 57.0, 75.0, 160.0, 235.0, 375.0, 573.0, 760.0, 631.0, 420.0, 290.0, 179.0, 104.0, 63.0, 30.0, 12.0, 15.0, 1.0, 6.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.78125, -8.494384765625, -8.20751953125, -7.920654296875, -7.6337890625, -7.346923828125, -7.06005859375, -6.773193359375, -6.486328125, -6.199462890625, -5.91259765625, -5.625732421875, -5.3388671875, -5.052001953125, -4.76513671875, -4.478271484375, -4.19140625, -3.904541015625, -3.61767578125, -3.330810546875, -3.0439453125, -2.757080078125, -2.47021484375, -2.183349609375, -1.896484375, -1.609619140625, -1.32275390625, -1.035888671875, -0.7490234375, -0.462158203125, -0.17529296875, 0.111572265625, 0.3984375, 0.685302734375, 0.97216796875, 1.259033203125, 1.5458984375, 1.832763671875, 2.11962890625, 2.406494140625, 2.693359375, 2.980224609375, 3.26708984375, 3.553955078125, 3.8408203125, 4.127685546875, 4.41455078125, 4.701416015625, 4.98828125, 5.275146484375, 5.56201171875, 5.848876953125, 6.1357421875, 6.422607421875, 6.70947265625, 6.996337890625, 7.283203125, 7.570068359375, 7.85693359375, 8.143798828125, 8.4306640625, 8.717529296875, 9.00439453125, 9.291259765625, 9.578125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 4.0, 9.0, 13.0, 12.0, 29.0, 29.0, 38.0, 68.0, 93.0, 150.0, 276.0, 541.0, 1037.0, 2743.0, 14790.0, 260557.0, 3580244.0, 311548.0, 16687.0, 2978.0, 1072.0, 569.0, 291.0, 188.0, 102.0, 85.0, 44.0, 28.0, 22.0, 18.0, 9.0, 7.0, 6.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.421875, -15.84619140625, -15.2705078125, -14.69482421875, -14.119140625, -13.54345703125, -12.9677734375, -12.39208984375, -11.81640625, -11.24072265625, -10.6650390625, -10.08935546875, -9.513671875, -8.93798828125, -8.3623046875, -7.78662109375, -7.2109375, -6.63525390625, -6.0595703125, -5.48388671875, -4.908203125, -4.33251953125, -3.7568359375, -3.18115234375, -2.60546875, -2.02978515625, -1.4541015625, -0.87841796875, -0.302734375, 0.27294921875, 0.8486328125, 1.42431640625, 2.0, 2.57568359375, 3.1513671875, 3.72705078125, 4.302734375, 4.87841796875, 5.4541015625, 6.02978515625, 6.60546875, 7.18115234375, 7.7568359375, 8.33251953125, 8.908203125, 9.48388671875, 10.0595703125, 10.63525390625, 11.2109375, 11.78662109375, 12.3623046875, 12.93798828125, 13.513671875, 14.08935546875, 14.6650390625, 15.24072265625, 15.81640625, 16.39208984375, 16.9677734375, 17.54345703125, 18.119140625, 18.69482421875, 19.2705078125, 19.84619140625, 20.421875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 10.0, 32.0, 162.0, 313.0, 323.0, 133.0, 34.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.589736938476562, -16.253463745117188, -13.91718864440918, -11.580914497375488, -9.244640350341797, -6.9083662033081055, -4.572092056274414, -2.2358169555664062, 0.10045623779296875, 2.43673038482666, 4.773004531860352, 7.109278678894043, 9.445552825927734, 11.781826972961426, 14.118101119995117, 16.454376220703125, 18.7906494140625, 21.126922607421875, 23.463197708129883, 25.79947280883789, 28.135746002197266, 30.47201919555664, 32.80829620361328, 35.144569396972656, 37.48084259033203, 39.817115783691406, 42.15338897705078, 44.48966598510742, 46.8259391784668, 49.16221237182617, 51.49848937988281, 53.83476257324219, 56.17103576660156, 58.50730895996094, 60.84358215332031, 63.17985916137695, 65.51612854003906, 67.85240936279297, 70.18868255615234, 72.52495574951172, 74.8612289428711, 77.19750213623047, 79.53377532958984, 81.87004852294922, 84.20632934570312, 86.5426025390625, 88.87887573242188, 91.21514892578125, 93.55142211914062, 95.8876953125, 98.22396850585938, 100.56024169921875, 102.89651489257812, 105.23279571533203, 107.5690689086914, 109.90534210205078, 112.24161529541016, 114.57788848876953, 116.9141616821289, 119.25043487548828, 121.58671569824219, 123.92298889160156, 126.25926208496094, 128.5955352783203, 130.9318084716797]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 8.0, 9.0, 6.0, 10.0, 17.0, 10.0, 26.0, 10.0, 20.0, 21.0, 22.0, 35.0, 26.0, 34.0, 32.0, 34.0, 33.0, 54.0, 39.0, 34.0, 37.0, 34.0, 40.0, 36.0, 40.0, 35.0, 36.0, 28.0, 33.0, 24.0, 21.0, 18.0, 17.0, 15.0, 17.0, 16.0, 11.0, 8.0, 14.0, 6.0, 9.0, 5.0, 3.0, 5.0, 4.0, 1.0, 2.0, 3.0, 3.0], "bins": [-20.789962768554688, -20.206619262695312, -19.623275756835938, -19.03993034362793, -18.456586837768555, -17.87324333190918, -17.289897918701172, -16.706554412841797, -16.123210906982422, -15.539867401123047, -14.956522941589355, -14.373178482055664, -13.789834976196289, -13.206491470336914, -12.623147010803223, -12.039802551269531, -11.456459045410156, -10.873115539550781, -10.28977108001709, -9.706426620483398, -9.123083114624023, -8.539739608764648, -7.956395149230957, -7.373051166534424, -6.789707183837891, -6.206363201141357, -5.623019218444824, -5.039675235748291, -4.456331253051758, -3.8729872703552246, -3.2896432876586914, -2.706299304962158, -2.122955322265625, -1.5396113395690918, -0.9562673568725586, -0.3729233741760254, 0.2104206085205078, 0.793764591217041, 1.3771085739135742, 1.9604525566101074, 2.5437965393066406, 3.127140522003174, 3.710484504699707, 4.29382848739624, 4.877172470092773, 5.460516452789307, 6.04386043548584, 6.627204418182373, 7.210548400878906, 7.7938923835754395, 8.377236366271973, 8.960580825805664, 9.543924331665039, 10.127267837524414, 10.710612297058105, 11.293956756591797, 11.877300262451172, 12.460643768310547, 13.043988227844238, 13.62733268737793, 14.210676193237305, 14.79401969909668, 15.377364158630371, 15.960708618164062, 16.544052124023438]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 10.0, 12.0, 12.0, 16.0, 25.0, 25.0, 38.0, 35.0, 37.0, 43.0, 43.0, 69.0, 64.0, 67.0, 59.0, 62.0, 67.0, 55.0, 39.0, 42.0, 41.0, 29.0, 24.0, 16.0, 20.0, 13.0, 8.0, 5.0, 10.0, 2.0, 3.0, 4.0, 0.0, 0.0, 4.0], "bins": [-3.064453125, -2.99285888671875, -2.9212646484375, -2.84967041015625, -2.778076171875, -2.70648193359375, -2.6348876953125, -2.56329345703125, -2.49169921875, -2.42010498046875, -2.3485107421875, -2.27691650390625, -2.205322265625, -2.13372802734375, -2.0621337890625, -1.99053955078125, -1.9189453125, -1.84735107421875, -1.7757568359375, -1.70416259765625, -1.632568359375, -1.56097412109375, -1.4893798828125, -1.41778564453125, -1.34619140625, -1.27459716796875, -1.2030029296875, -1.13140869140625, -1.059814453125, -0.98822021484375, -0.9166259765625, -0.84503173828125, -0.7734375, -0.70184326171875, -0.6302490234375, -0.55865478515625, -0.487060546875, -0.41546630859375, -0.3438720703125, -0.27227783203125, -0.20068359375, -0.12908935546875, -0.0574951171875, 0.01409912109375, 0.085693359375, 0.15728759765625, 0.2288818359375, 0.30047607421875, 0.3720703125, 0.44366455078125, 0.5152587890625, 0.58685302734375, 0.658447265625, 0.73004150390625, 0.8016357421875, 0.87322998046875, 0.94482421875, 1.01641845703125, 1.0880126953125, 1.15960693359375, 1.231201171875, 1.30279541015625, 1.3743896484375, 1.44598388671875, 1.517578125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 5.0, 12.0, 14.0, 18.0, 29.0, 48.0, 85.0, 144.0, 277.0, 450.0, 980.0, 1990.0, 4413.0, 10226.0, 24121.0, 61967.0, 190593.0, 522948.0, 144393.0, 50174.0, 19938.0, 8507.0, 3760.0, 1698.0, 797.0, 428.0, 220.0, 123.0, 67.0, 48.0, 18.0, 16.0, 15.0, 4.0, 5.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.023162841796875, -0.02250838279724121, -0.021853923797607422, -0.021199464797973633, -0.020545005798339844, -0.019890546798706055, -0.019236087799072266, -0.018581628799438477, -0.017927169799804688, -0.0172727108001709, -0.01661825180053711, -0.01596379280090332, -0.015309333801269531, -0.014654874801635742, -0.014000415802001953, -0.013345956802368164, -0.012691497802734375, -0.012037038803100586, -0.011382579803466797, -0.010728120803833008, -0.010073661804199219, -0.00941920280456543, -0.00876474380493164, -0.008110284805297852, -0.0074558258056640625, -0.0068013668060302734, -0.006146907806396484, -0.005492448806762695, -0.004837989807128906, -0.004183530807495117, -0.003529071807861328, -0.002874612808227539, -0.00222015380859375, -0.001565694808959961, -0.0009112358093261719, -0.0002567768096923828, 0.00039768218994140625, 0.0010521411895751953, 0.0017066001892089844, 0.0023610591888427734, 0.0030155181884765625, 0.0036699771881103516, 0.004324436187744141, 0.00497889518737793, 0.005633354187011719, 0.006287813186645508, 0.006942272186279297, 0.007596731185913086, 0.008251190185546875, 0.008905649185180664, 0.009560108184814453, 0.010214567184448242, 0.010869026184082031, 0.01152348518371582, 0.01217794418334961, 0.012832403182983398, 0.013486862182617188, 0.014141321182250977, 0.014795780181884766, 0.015450239181518555, 0.016104698181152344, 0.016759157180786133, 0.017413616180419922, 0.01806807518005371, 0.0187225341796875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 4.0, 4.0, 10.0, 7.0, 13.0, 8.0, 21.0, 25.0, 12.0, 17.0, 25.0, 30.0, 31.0, 34.0, 33.0, 27.0, 28.0, 49.0, 41.0, 49.0, 1061.0, 48.0, 42.0, 33.0, 41.0, 25.0, 33.0, 34.0, 31.0, 32.0, 30.0, 30.0, 15.0, 20.0, 11.0, 13.0, 15.0, 5.0, 7.0, 11.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0], "bins": [-1.1044921875, -1.0704803466796875, -1.036468505859375, -1.0024566650390625, -0.96844482421875, -0.9344329833984375, -0.900421142578125, -0.8664093017578125, -0.8323974609375, -0.7983856201171875, -0.764373779296875, -0.7303619384765625, -0.69635009765625, -0.6623382568359375, -0.628326416015625, -0.5943145751953125, -0.560302734375, -0.5262908935546875, -0.492279052734375, -0.4582672119140625, -0.42425537109375, -0.3902435302734375, -0.356231689453125, -0.3222198486328125, -0.2882080078125, -0.2541961669921875, -0.220184326171875, -0.1861724853515625, -0.15216064453125, -0.1181488037109375, -0.084136962890625, -0.0501251220703125, -0.01611328125, 0.0178985595703125, 0.051910400390625, 0.0859222412109375, 0.11993408203125, 0.1539459228515625, 0.187957763671875, 0.2219696044921875, 0.2559814453125, 0.2899932861328125, 0.324005126953125, 0.3580169677734375, 0.39202880859375, 0.4260406494140625, 0.460052490234375, 0.4940643310546875, 0.528076171875, 0.5620880126953125, 0.596099853515625, 0.6301116943359375, 0.66412353515625, 0.6981353759765625, 0.732147216796875, 0.7661590576171875, 0.8001708984375, 0.8341827392578125, 0.868194580078125, 0.9022064208984375, 0.93621826171875, 0.9702301025390625, 1.004241943359375, 1.0382537841796875, 1.072265625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 6.0, 0.0, 1.0, 7.0, 5.0, 6.0, 19.0, 35.0, 42.0, 58.0, 71.0, 142.0, 201.0, 291.0, 394.0, 648.0, 994.0, 1505.0, 2182.0, 3416.0, 5195.0, 8100.0, 13052.0, 20452.0, 32921.0, 54282.0, 92404.0, 202912.0, 1345625.0, 129312.0, 69463.0, 42111.0, 25838.0, 16266.0, 10303.0, 6585.0, 4212.0, 2731.0, 1811.0, 1121.0, 802.0, 558.0, 358.0, 219.0, 125.0, 117.0, 93.0, 51.0, 37.0, 25.0, 9.0, 8.0, 14.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006343841552734375, -0.0061408281326293945, -0.005937814712524414, -0.005734801292419434, -0.005531787872314453, -0.005328774452209473, -0.005125761032104492, -0.004922747611999512, -0.004719734191894531, -0.004516720771789551, -0.00431370735168457, -0.00411069393157959, -0.003907680511474609, -0.003704667091369629, -0.0035016536712646484, -0.003298640251159668, -0.0030956268310546875, -0.002892613410949707, -0.0026895999908447266, -0.002486586570739746, -0.0022835731506347656, -0.002080559730529785, -0.0018775463104248047, -0.0016745328903198242, -0.0014715194702148438, -0.0012685060501098633, -0.0010654926300048828, -0.0008624792098999023, -0.0006594657897949219, -0.0004564523696899414, -0.00025343894958496094, -5.042552947998047e-05, 0.000152587890625, 0.00035560131072998047, 0.0005586147308349609, 0.0007616281509399414, 0.0009646415710449219, 0.0011676549911499023, 0.0013706684112548828, 0.0015736818313598633, 0.0017766952514648438, 0.0019797086715698242, 0.0021827220916748047, 0.002385735511779785, 0.0025887489318847656, 0.002791762351989746, 0.0029947757720947266, 0.003197789192199707, 0.0034008026123046875, 0.003603816032409668, 0.0038068294525146484, 0.004009842872619629, 0.004212856292724609, 0.00441586971282959, 0.00461888313293457, 0.004821896553039551, 0.005024909973144531, 0.005227923393249512, 0.005430936813354492, 0.005633950233459473, 0.005836963653564453, 0.006039977073669434, 0.006242990493774414, 0.0064460039138793945, 0.006649017333984375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [18.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 990.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 0.0, 13.0, 0.0, 29.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.0, 0.0, 486.0, 0.0, 7355.0, 0.0, 1032694.0, 0.0, 7334.0, 0.0, 505.0, 0.0, 45.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 28.0, 0.0, 10.0, 0.0, 6.0, 4.0], "bins": [-9.5367431640625e-07, -9.238719940185547e-07, -8.940696716308594e-07, -8.642673492431641e-07, -8.344650268554688e-07, -8.046627044677734e-07, -7.748603820800781e-07, -7.450580596923828e-07, -7.152557373046875e-07, -6.854534149169922e-07, -6.556510925292969e-07, -6.258487701416016e-07, -5.960464477539062e-07, -5.662441253662109e-07, -5.364418029785156e-07, -5.066394805908203e-07, -4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07, 8.642673492431641e-07, 8.940696716308594e-07, 9.238719940185547e-07, 9.5367431640625e-07]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 10.0, 12.0, 12.0, 16.0, 25.0, 25.0, 38.0, 35.0, 37.0, 43.0, 43.0, 69.0, 64.0, 67.0, 59.0, 62.0, 67.0, 55.0, 39.0, 42.0, 41.0, 29.0, 24.0, 16.0, 20.0, 13.0, 8.0, 5.0, 10.0, 2.0, 3.0, 4.0, 0.0, 0.0, 4.0], "bins": [-3.064453125, -2.99285888671875, -2.9212646484375, -2.84967041015625, -2.778076171875, -2.70648193359375, -2.6348876953125, -2.56329345703125, -2.49169921875, -2.42010498046875, -2.3485107421875, -2.27691650390625, -2.205322265625, -2.13372802734375, -2.0621337890625, -1.99053955078125, -1.9189453125, -1.84735107421875, -1.7757568359375, -1.70416259765625, -1.632568359375, -1.56097412109375, -1.4893798828125, -1.41778564453125, -1.34619140625, -1.27459716796875, -1.2030029296875, -1.13140869140625, -1.059814453125, -0.98822021484375, -0.9166259765625, -0.84503173828125, -0.7734375, -0.70184326171875, -0.6302490234375, -0.55865478515625, -0.487060546875, -0.41546630859375, -0.3438720703125, -0.27227783203125, -0.20068359375, -0.12908935546875, -0.0574951171875, 0.01409912109375, 0.085693359375, 0.15728759765625, 0.2288818359375, 0.30047607421875, 0.3720703125, 0.44366455078125, 0.5152587890625, 0.58685302734375, 0.658447265625, 0.73004150390625, 0.8016357421875, 0.87322998046875, 0.94482421875, 1.01641845703125, 1.0880126953125, 1.15960693359375, 1.231201171875, 1.30279541015625, 1.3743896484375, 1.44598388671875, 1.517578125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 8.0, 8.0, 15.0, 24.0, 41.0, 57.0, 93.0, 157.0, 272.0, 451.0, 959.0, 1876.0, 4531.0, 14526.0, 58368.0, 308742.0, 528354.0, 96148.0, 22376.0, 6573.0, 2444.0, 1158.0, 540.0, 328.0, 217.0, 117.0, 63.0, 41.0, 31.0, 14.0, 10.0, 9.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.59765625, -2.5295867919921875, -2.461517333984375, -2.3934478759765625, -2.32537841796875, -2.2573089599609375, -2.189239501953125, -2.1211700439453125, -2.0531005859375, -1.9850311279296875, -1.916961669921875, -1.8488922119140625, -1.78082275390625, -1.7127532958984375, -1.644683837890625, -1.5766143798828125, -1.508544921875, -1.4404754638671875, -1.372406005859375, -1.3043365478515625, -1.23626708984375, -1.1681976318359375, -1.100128173828125, -1.0320587158203125, -0.9639892578125, -0.8959197998046875, -0.827850341796875, -0.7597808837890625, -0.69171142578125, -0.6236419677734375, -0.555572509765625, -0.4875030517578125, -0.41943359375, -0.3513641357421875, -0.283294677734375, -0.2152252197265625, -0.14715576171875, -0.0790863037109375, -0.011016845703125, 0.0570526123046875, 0.1251220703125, 0.1931915283203125, 0.261260986328125, 0.3293304443359375, 0.39739990234375, 0.4654693603515625, 0.533538818359375, 0.6016082763671875, 0.669677734375, 0.7377471923828125, 0.805816650390625, 0.8738861083984375, 0.94195556640625, 1.0100250244140625, 1.078094482421875, 1.1461639404296875, 1.2142333984375, 1.2823028564453125, 1.350372314453125, 1.4184417724609375, 1.48651123046875, 1.5545806884765625, 1.622650146484375, 1.6907196044921875, 1.7587890625]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 7.0, 7.0, 7.0, 10.0, 9.0, 13.0, 21.0, 19.0, 17.0, 25.0, 22.0, 23.0, 29.0, 35.0, 33.0, 32.0, 51.0, 57.0, 89.0, 371.0, 1608.0, 103.0, 44.0, 46.0, 47.0, 39.0, 41.0, 40.0, 25.0, 38.0, 20.0, 32.0, 9.0, 13.0, 20.0, 12.0, 10.0, 9.0, 7.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08984375, -4.9150390625, -4.740234375, -4.5654296875, -4.390625, -4.2158203125, -4.041015625, -3.8662109375, -3.69140625, -3.5166015625, -3.341796875, -3.1669921875, -2.9921875, -2.8173828125, -2.642578125, -2.4677734375, -2.29296875, -2.1181640625, -1.943359375, -1.7685546875, -1.59375, -1.4189453125, -1.244140625, -1.0693359375, -0.89453125, -0.7197265625, -0.544921875, -0.3701171875, -0.1953125, -0.0205078125, 0.154296875, 0.3291015625, 0.50390625, 0.6787109375, 0.853515625, 1.0283203125, 1.203125, 1.3779296875, 1.552734375, 1.7275390625, 1.90234375, 2.0771484375, 2.251953125, 2.4267578125, 2.6015625, 2.7763671875, 2.951171875, 3.1259765625, 3.30078125, 3.4755859375, 3.650390625, 3.8251953125, 4.0, 4.1748046875, 4.349609375, 4.5244140625, 4.69921875, 4.8740234375, 5.048828125, 5.2236328125, 5.3984375, 5.5732421875, 5.748046875, 5.9228515625, 6.09765625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 6.0, 4.0, 9.0, 8.0, 12.0, 21.0, 10.0, 11.0, 19.0, 20.0, 27.0, 37.0, 39.0, 39.0, 79.0, 72.0, 136.0, 224.0, 537.0, 1478.0, 14793.0, 3044403.0, 79553.0, 2659.0, 671.0, 280.0, 129.0, 91.0, 73.0, 48.0, 38.0, 23.0, 25.0, 20.0, 15.0, 21.0, 13.0, 21.0, 10.0, 6.0, 9.0, 5.0, 5.0, 8.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.546875, -11.2138671875, -10.880859375, -10.5478515625, -10.21484375, -9.8818359375, -9.548828125, -9.2158203125, -8.8828125, -8.5498046875, -8.216796875, -7.8837890625, -7.55078125, -7.2177734375, -6.884765625, -6.5517578125, -6.21875, -5.8857421875, -5.552734375, -5.2197265625, -4.88671875, -4.5537109375, -4.220703125, -3.8876953125, -3.5546875, -3.2216796875, -2.888671875, -2.5556640625, -2.22265625, -1.8896484375, -1.556640625, -1.2236328125, -0.890625, -0.5576171875, -0.224609375, 0.1083984375, 0.44140625, 0.7744140625, 1.107421875, 1.4404296875, 1.7734375, 2.1064453125, 2.439453125, 2.7724609375, 3.10546875, 3.4384765625, 3.771484375, 4.1044921875, 4.4375, 4.7705078125, 5.103515625, 5.4365234375, 5.76953125, 6.1025390625, 6.435546875, 6.7685546875, 7.1015625, 7.4345703125, 7.767578125, 8.1005859375, 8.43359375, 8.7666015625, 9.099609375, 9.4326171875, 9.765625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 19.0, 375.0, 598.0, 23.0, 0.0, 0.0, 2.0], "bins": [-67.957275390625, -66.80784606933594, -65.65841674804688, -64.50898742675781, -63.35955810546875, -62.21012878417969, -61.060699462890625, -59.91127014160156, -58.7618408203125, -57.61241149902344, -56.462982177734375, -55.31355285644531, -54.16412353515625, -53.01469421386719, -51.865264892578125, -50.71583557128906, -49.56640625, -48.41697692871094, -47.267547607421875, -46.11811828613281, -44.96868896484375, -43.81925964355469, -42.669830322265625, -41.52040100097656, -40.370967864990234, -39.22153854370117, -38.07210922241211, -36.92267990112305, -35.773250579833984, -34.62382125854492, -33.47439193725586, -32.3249626159668, -31.175533294677734, -30.026103973388672, -28.87667465209961, -27.727245330810547, -26.577816009521484, -25.428386688232422, -24.27895736694336, -23.129528045654297, -21.980098724365234, -20.830669403076172, -19.68124008178711, -18.531810760498047, -17.382381439208984, -16.232952117919922, -15.083521842956543, -13.93409252166748, -12.784662246704102, -11.635232925415039, -10.485803604125977, -9.336374282836914, -8.186944961547852, -7.037515163421631, -5.88808536529541, -4.738656044006348, -3.589226722717285, -2.4397974014282227, -1.290367841720581, -0.14093828201293945, 1.008491039276123, 2.1579203605651855, 3.3073501586914062, 4.456779479980469, 5.606208801269531]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 7.0, 8.0, 10.0, 6.0, 8.0, 13.0, 25.0, 20.0, 23.0, 18.0, 21.0, 32.0, 34.0, 33.0, 37.0, 40.0, 44.0, 44.0, 39.0, 41.0, 35.0, 36.0, 43.0, 39.0, 41.0, 40.0, 33.0, 40.0, 38.0, 25.0, 21.0, 21.0, 17.0, 16.0, 15.0, 13.0, 10.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-20.0784969329834, -19.500879287719727, -18.923263549804688, -18.345645904541016, -17.768030166625977, -17.190412521362305, -16.612796783447266, -16.035179138183594, -15.457562446594238, -14.879945755004883, -14.302329063415527, -13.724712371826172, -13.1470947265625, -12.569478988647461, -11.991861343383789, -11.414244651794434, -10.836627960205078, -10.259011268615723, -9.681394577026367, -9.103777885437012, -8.526161193847656, -7.948544025421143, -7.370926856994629, -6.793310165405273, -6.215693473815918, -5.6380767822265625, -5.060460090637207, -4.482842922210693, -3.905226230621338, -3.3276095390319824, -2.749992609024048, -2.1723756790161133, -1.594757080078125, -1.01714026927948, -0.43952345848083496, 0.13809335231781006, 0.7157101631164551, 1.2933268547058105, 1.8709437847137451, 2.4485607147216797, 3.026177406311035, 3.6037940979003906, 4.181410789489746, 4.75902795791626, 5.336644649505615, 5.914261341094971, 6.491878509521484, 7.06949520111084, 7.647111892700195, 8.22472858428955, 8.802345275878906, 9.379961967468262, 9.957578659057617, 10.535196304321289, 11.112812995910645, 11.6904296875, 12.268046379089355, 12.845663070678711, 13.423279762268066, 14.000896453857422, 14.578514099121094, 15.156129837036133, 15.733747482299805, 16.311363220214844, 16.888980865478516]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 8.0, 4.0, 10.0, 7.0, 16.0, 13.0, 17.0, 31.0, 30.0, 31.0, 41.0, 28.0, 46.0, 53.0, 65.0, 68.0, 54.0, 64.0, 70.0, 63.0, 48.0, 37.0, 47.0, 36.0, 25.0, 25.0, 14.0, 19.0, 13.0, 4.0, 8.0, 9.0, 1.0, 5.0, 1.0, 0.0, 1.0, 3.0], "bins": [-3.08203125, -3.0094451904296875, -2.936859130859375, -2.8642730712890625, -2.79168701171875, -2.7191009521484375, -2.646514892578125, -2.5739288330078125, -2.5013427734375, -2.4287567138671875, -2.356170654296875, -2.2835845947265625, -2.21099853515625, -2.1384124755859375, -2.065826416015625, -1.9932403564453125, -1.920654296875, -1.8480682373046875, -1.775482177734375, -1.7028961181640625, -1.63031005859375, -1.5577239990234375, -1.485137939453125, -1.4125518798828125, -1.3399658203125, -1.2673797607421875, -1.194793701171875, -1.1222076416015625, -1.04962158203125, -0.9770355224609375, -0.904449462890625, -0.8318634033203125, -0.75927734375, -0.6866912841796875, -0.614105224609375, -0.5415191650390625, -0.46893310546875, -0.3963470458984375, -0.323760986328125, -0.2511749267578125, -0.1785888671875, -0.1060028076171875, -0.033416748046875, 0.0391693115234375, 0.11175537109375, 0.1843414306640625, 0.256927490234375, 0.3295135498046875, 0.402099609375, 0.4746856689453125, 0.547271728515625, 0.6198577880859375, 0.69244384765625, 0.7650299072265625, 0.837615966796875, 0.9102020263671875, 0.9827880859375, 1.0553741455078125, 1.127960205078125, 1.2005462646484375, 1.27313232421875, 1.3457183837890625, 1.418304443359375, 1.4908905029296875, 1.5634765625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 10.0, 15.0, 25.0, 29.0, 27.0, 42.0, 60.0, 82.0, 174.0, 237.0, 595.0, 1720.0, 9327.0, 87901.0, 2223289.0, 1786588.0, 73295.0, 8084.0, 1585.0, 544.0, 219.0, 140.0, 88.0, 62.0, 37.0, 32.0, 18.0, 16.0, 10.0, 8.0, 4.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-12.921875, -12.6064453125, -12.291015625, -11.9755859375, -11.66015625, -11.3447265625, -11.029296875, -10.7138671875, -10.3984375, -10.0830078125, -9.767578125, -9.4521484375, -9.13671875, -8.8212890625, -8.505859375, -8.1904296875, -7.875, -7.5595703125, -7.244140625, -6.9287109375, -6.61328125, -6.2978515625, -5.982421875, -5.6669921875, -5.3515625, -5.0361328125, -4.720703125, -4.4052734375, -4.08984375, -3.7744140625, -3.458984375, -3.1435546875, -2.828125, -2.5126953125, -2.197265625, -1.8818359375, -1.56640625, -1.2509765625, -0.935546875, -0.6201171875, -0.3046875, 0.0107421875, 0.326171875, 0.6416015625, 0.95703125, 1.2724609375, 1.587890625, 1.9033203125, 2.21875, 2.5341796875, 2.849609375, 3.1650390625, 3.48046875, 3.7958984375, 4.111328125, 4.4267578125, 4.7421875, 5.0576171875, 5.373046875, 5.6884765625, 6.00390625, 6.3193359375, 6.634765625, 6.9501953125, 7.265625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 4.0, 11.0, 9.0, 19.0, 36.0, 77.0, 132.0, 248.0, 413.0, 608.0, 821.0, 647.0, 451.0, 262.0, 142.0, 83.0, 47.0, 28.0, 19.0, 11.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.06640625, -6.75360107421875, -6.4407958984375, -6.12799072265625, -5.815185546875, -5.50238037109375, -5.1895751953125, -4.87677001953125, -4.56396484375, -4.25115966796875, -3.9383544921875, -3.62554931640625, -3.312744140625, -2.99993896484375, -2.6871337890625, -2.37432861328125, -2.0615234375, -1.74871826171875, -1.4359130859375, -1.12310791015625, -0.810302734375, -0.49749755859375, -0.1846923828125, 0.12811279296875, 0.44091796875, 0.75372314453125, 1.0665283203125, 1.37933349609375, 1.692138671875, 2.00494384765625, 2.3177490234375, 2.63055419921875, 2.943359375, 3.25616455078125, 3.5689697265625, 3.88177490234375, 4.194580078125, 4.50738525390625, 4.8201904296875, 5.13299560546875, 5.44580078125, 5.75860595703125, 6.0714111328125, 6.38421630859375, 6.697021484375, 7.00982666015625, 7.3226318359375, 7.63543701171875, 7.9482421875, 8.26104736328125, 8.5738525390625, 8.88665771484375, 9.199462890625, 9.51226806640625, 9.8250732421875, 10.13787841796875, 10.45068359375, 10.76348876953125, 11.0762939453125, 11.38909912109375, 11.701904296875, 12.01470947265625, 12.3275146484375, 12.64031982421875, 12.953125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 10.0, 11.0, 11.0, 21.0, 11.0, 28.0, 43.0, 50.0, 81.0, 134.0, 193.0, 362.0, 588.0, 1349.0, 4062.0, 19563.0, 185063.0, 2816702.0, 1078819.0, 72457.0, 9911.0, 2530.0, 969.0, 488.0, 275.0, 180.0, 108.0, 59.0, 68.0, 41.0, 31.0, 13.0, 15.0, 15.0, 6.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.875, -14.421630859375, -13.96826171875, -13.514892578125, -13.0615234375, -12.608154296875, -12.15478515625, -11.701416015625, -11.248046875, -10.794677734375, -10.34130859375, -9.887939453125, -9.4345703125, -8.981201171875, -8.52783203125, -8.074462890625, -7.62109375, -7.167724609375, -6.71435546875, -6.260986328125, -5.8076171875, -5.354248046875, -4.90087890625, -4.447509765625, -3.994140625, -3.540771484375, -3.08740234375, -2.634033203125, -2.1806640625, -1.727294921875, -1.27392578125, -0.820556640625, -0.3671875, 0.086181640625, 0.53955078125, 0.992919921875, 1.4462890625, 1.899658203125, 2.35302734375, 2.806396484375, 3.259765625, 3.713134765625, 4.16650390625, 4.619873046875, 5.0732421875, 5.526611328125, 5.97998046875, 6.433349609375, 6.88671875, 7.340087890625, 7.79345703125, 8.246826171875, 8.7001953125, 9.153564453125, 9.60693359375, 10.060302734375, 10.513671875, 10.967041015625, 11.42041015625, 11.873779296875, 12.3271484375, 12.780517578125, 13.23388671875, 13.687255859375, 14.140625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 17.0, 81.0, 200.0, 310.0, 253.0, 111.0, 35.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-97.1061782836914, -94.59596252441406, -92.08575439453125, -89.5755386352539, -87.06532287597656, -84.55510711669922, -82.04489135742188, -79.53468322753906, -77.02446746826172, -74.51425170898438, -72.00404357910156, -69.49382781982422, -66.98361206054688, -64.47339630126953, -61.96318435668945, -59.452972412109375, -56.94275665283203, -54.43254089355469, -51.92232894897461, -49.41211700439453, -46.90190124511719, -44.391685485839844, -41.881473541259766, -39.37126159667969, -36.861045837402344, -34.350830078125, -31.840618133544922, -29.33040428161621, -26.8201904296875, -24.30997657775879, -21.799762725830078, -19.289548873901367, -16.77933120727539, -14.26911735534668, -11.758903503417969, -9.248689651489258, -6.738475799560547, -4.228261947631836, -1.718048095703125, 0.7921657562255859, 3.302379608154297, 5.812593460083008, 8.322807312011719, 10.83302116394043, 13.34323501586914, 15.853448867797852, 18.363662719726562, 20.873876571655273, 23.384090423583984, 25.894304275512695, 28.404518127441406, 30.914731979370117, 33.42494583129883, 35.935157775878906, 38.44537353515625, 40.955589294433594, 43.46580123901367, 45.97601318359375, 48.486228942871094, 50.99644470214844, 53.506656646728516, 56.016868591308594, 58.52708435058594, 61.03730010986328, 63.54751205444336]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 4.0, 9.0, 12.0, 13.0, 13.0, 16.0, 22.0, 28.0, 24.0, 21.0, 28.0, 16.0, 40.0, 33.0, 36.0, 36.0, 31.0, 32.0, 45.0, 25.0, 37.0, 32.0, 51.0, 32.0, 34.0, 23.0, 28.0, 26.0, 27.0, 21.0, 33.0, 16.0, 23.0, 15.0, 20.0, 19.0, 10.0, 15.0, 10.0, 5.0, 6.0, 7.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-18.29857635498047, -17.76156234741211, -17.22454833984375, -16.687536239624023, -16.150522232055664, -15.613508224487305, -15.076494216918945, -14.539480209350586, -14.002467155456543, -13.465453147888184, -12.92844009399414, -12.391426086425781, -11.854412078857422, -11.317399024963379, -10.78038501739502, -10.243371963500977, -9.706357955932617, -9.169343948364258, -8.632330894470215, -8.095316886901855, -7.558303356170654, -7.021289825439453, -6.484275817871094, -5.947262287139893, -5.410248756408691, -4.87323522567749, -4.336221694946289, -3.7992076873779297, -3.2621941566467285, -2.7251806259155273, -2.188166856765747, -1.6511530876159668, -1.1141395568847656, -0.5771259069442749, -0.04011225700378418, 0.49690139293670654, 1.0339150428771973, 1.5709285736083984, 2.1079423427581787, 2.644956111907959, 3.18196964263916, 3.7189831733703613, 4.2559967041015625, 4.793010711669922, 5.330024242401123, 5.867037773132324, 6.404051780700684, 6.941065311431885, 7.478078842163086, 8.015092849731445, 8.552105903625488, 9.089119911193848, 9.62613296508789, 10.16314697265625, 10.70016098022461, 11.237174987792969, 11.774188041687012, 12.311202049255371, 12.848215103149414, 13.385229110717773, 13.922243118286133, 14.459256172180176, 14.996270179748535, 15.533283233642578, 16.070297241210938]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 9.0, 6.0, 15.0, 9.0, 16.0, 10.0, 20.0, 19.0, 33.0, 49.0, 50.0, 35.0, 59.0, 54.0, 62.0, 57.0, 49.0, 60.0, 59.0, 68.0, 55.0, 40.0, 35.0, 29.0, 28.0, 20.0, 11.0, 18.0, 8.0, 10.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.890625, -2.8162078857421875, -2.741790771484375, -2.6673736572265625, -2.59295654296875, -2.5185394287109375, -2.444122314453125, -2.3697052001953125, -2.2952880859375, -2.2208709716796875, -2.146453857421875, -2.0720367431640625, -1.99761962890625, -1.9232025146484375, -1.848785400390625, -1.7743682861328125, -1.699951171875, -1.6255340576171875, -1.551116943359375, -1.4766998291015625, -1.40228271484375, -1.3278656005859375, -1.253448486328125, -1.1790313720703125, -1.1046142578125, -1.0301971435546875, -0.955780029296875, -0.8813629150390625, -0.80694580078125, -0.7325286865234375, -0.658111572265625, -0.5836944580078125, -0.50927734375, -0.4348602294921875, -0.360443115234375, -0.2860260009765625, -0.21160888671875, -0.1371917724609375, -0.062774658203125, 0.0116424560546875, 0.0860595703125, 0.1604766845703125, 0.234893798828125, 0.3093109130859375, 0.38372802734375, 0.4581451416015625, 0.532562255859375, 0.6069793701171875, 0.681396484375, 0.7558135986328125, 0.830230712890625, 0.9046478271484375, 0.97906494140625, 1.0534820556640625, 1.127899169921875, 1.2023162841796875, 1.2767333984375, 1.3511505126953125, 1.425567626953125, 1.4999847412109375, 1.57440185546875, 1.6488189697265625, 1.723236083984375, 1.7976531982421875, 1.8720703125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 5.0, 10.0, 10.0, 17.0, 14.0, 25.0, 53.0, 62.0, 123.0, 166.0, 323.0, 577.0, 1039.0, 2000.0, 3708.0, 7463.0, 14951.0, 32214.0, 74631.0, 207590.0, 455021.0, 143040.0, 56522.0, 24714.0, 11887.0, 5880.0, 2974.0, 1568.0, 863.0, 452.0, 254.0, 154.0, 89.0, 51.0, 41.0, 21.0, 19.0, 7.0, 4.0, 0.0, 8.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0191802978515625, -0.01862168312072754, -0.018063068389892578, -0.017504453659057617, -0.016945838928222656, -0.016387224197387695, -0.015828609466552734, -0.015269994735717773, -0.014711380004882812, -0.014152765274047852, -0.01359415054321289, -0.01303553581237793, -0.012476921081542969, -0.011918306350708008, -0.011359691619873047, -0.010801076889038086, -0.010242462158203125, -0.009683847427368164, -0.009125232696533203, -0.008566617965698242, -0.008008003234863281, -0.00744938850402832, -0.006890773773193359, -0.0063321590423583984, -0.0057735443115234375, -0.0052149295806884766, -0.004656314849853516, -0.004097700119018555, -0.0035390853881835938, -0.002980470657348633, -0.002421855926513672, -0.001863241195678711, -0.00130462646484375, -0.0007460117340087891, -0.00018739700317382812, 0.0003712177276611328, 0.0009298324584960938, 0.0014884471893310547, 0.0020470619201660156, 0.0026056766510009766, 0.0031642913818359375, 0.0037229061126708984, 0.004281520843505859, 0.00484013557434082, 0.005398750305175781, 0.005957365036010742, 0.006515979766845703, 0.007074594497680664, 0.007633209228515625, 0.008191823959350586, 0.008750438690185547, 0.009309053421020508, 0.009867668151855469, 0.01042628288269043, 0.01098489761352539, 0.011543512344360352, 0.012102127075195312, 0.012660741806030273, 0.013219356536865234, 0.013777971267700195, 0.014336585998535156, 0.014895200729370117, 0.015453815460205078, 0.01601243019104004, 0.016571044921875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 5.0, 8.0, 12.0, 8.0, 16.0, 17.0, 17.0, 13.0, 29.0, 31.0, 35.0, 22.0, 36.0, 32.0, 49.0, 35.0, 48.0, 37.0, 1074.0, 40.0, 40.0, 24.0, 29.0, 36.0, 43.0, 35.0, 30.0, 25.0, 32.0, 25.0, 33.0, 15.0, 16.0, 11.0, 16.0, 18.0, 13.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1083984375, -1.0726318359375, -1.036865234375, -1.0010986328125, -0.96533203125, -0.9295654296875, -0.893798828125, -0.8580322265625, -0.822265625, -0.7864990234375, -0.750732421875, -0.7149658203125, -0.67919921875, -0.6434326171875, -0.607666015625, -0.5718994140625, -0.5361328125, -0.5003662109375, -0.464599609375, -0.4288330078125, -0.39306640625, -0.3572998046875, -0.321533203125, -0.2857666015625, -0.25, -0.2142333984375, -0.178466796875, -0.1427001953125, -0.10693359375, -0.0711669921875, -0.035400390625, 0.0003662109375, 0.0361328125, 0.0718994140625, 0.107666015625, 0.1434326171875, 0.17919921875, 0.2149658203125, 0.250732421875, 0.2864990234375, 0.322265625, 0.3580322265625, 0.393798828125, 0.4295654296875, 0.46533203125, 0.5010986328125, 0.536865234375, 0.5726318359375, 0.6083984375, 0.6441650390625, 0.679931640625, 0.7156982421875, 0.75146484375, 0.7872314453125, 0.822998046875, 0.8587646484375, 0.89453125, 0.9302978515625, 0.966064453125, 1.0018310546875, 1.03759765625, 1.0733642578125, 1.109130859375, 1.1448974609375, 1.1806640625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 2.0, 11.0, 6.0, 17.0, 43.0, 56.0, 77.0, 119.0, 161.0, 277.0, 436.0, 619.0, 920.0, 1553.0, 2396.0, 3613.0, 5795.0, 9418.0, 14640.0, 23853.0, 38674.0, 64669.0, 112999.0, 1301692.0, 243799.0, 109072.0, 62191.0, 37528.0, 23214.0, 14306.0, 9020.0, 5639.0, 3678.0, 2279.0, 1493.0, 1033.0, 623.0, 366.0, 260.0, 194.0, 142.0, 70.0, 59.0, 30.0, 29.0, 25.0, 11.0, 14.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.006916046142578125, -0.006706297397613525, -0.006496548652648926, -0.006286799907684326, -0.0060770511627197266, -0.005867302417755127, -0.005657553672790527, -0.005447804927825928, -0.005238056182861328, -0.0050283074378967285, -0.004818558692932129, -0.004608809947967529, -0.00439906120300293, -0.00418931245803833, -0.0039795637130737305, -0.003769814968109131, -0.0035600662231445312, -0.0033503174781799316, -0.003140568733215332, -0.0029308199882507324, -0.002721071243286133, -0.002511322498321533, -0.0023015737533569336, -0.002091825008392334, -0.0018820762634277344, -0.0016723275184631348, -0.0014625787734985352, -0.0012528300285339355, -0.001043081283569336, -0.0008333325386047363, -0.0006235837936401367, -0.0004138350486755371, -0.0002040863037109375, 5.662441253662109e-06, 0.00021541118621826172, 0.00042515993118286133, 0.0006349086761474609, 0.0008446574211120605, 0.0010544061660766602, 0.0012641549110412598, 0.0014739036560058594, 0.001683652400970459, 0.0018934011459350586, 0.002103149890899658, 0.002312898635864258, 0.0025226473808288574, 0.002732396125793457, 0.0029421448707580566, 0.0031518936157226562, 0.003361642360687256, 0.0035713911056518555, 0.003781139850616455, 0.003990888595581055, 0.004200637340545654, 0.004410386085510254, 0.0046201348304748535, 0.004829883575439453, 0.005039632320404053, 0.005249381065368652, 0.005459129810333252, 0.0056688785552978516, 0.005878627300262451, 0.006088376045227051, 0.00629812479019165, 0.00650787353515625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [12.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 998.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [18.0, 0.0, 8.0, 0.0, 0.0, 11.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 52.0, 0.0, 755.0, 0.0, 0.0, 5962.0, 0.0, 0.0, 1034942.0, 0.0, 5984.0, 0.0, 0.0, 715.0, 0.0, 0.0, 59.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 10.0, 0.0, 16.0], "bins": [-7.152557373046875e-07, -6.92903995513916e-07, -6.705522537231445e-07, -6.48200511932373e-07, -6.258487701416016e-07, -6.034970283508301e-07, -5.811452865600586e-07, -5.587935447692871e-07, -5.364418029785156e-07, -5.140900611877441e-07, -4.917383193969727e-07, -4.6938657760620117e-07, -4.470348358154297e-07, -4.246830940246582e-07, -4.023313522338867e-07, -3.7997961044311523e-07, -3.5762786865234375e-07, -3.3527612686157227e-07, -3.129243850708008e-07, -2.905726432800293e-07, -2.682209014892578e-07, -2.4586915969848633e-07, -2.2351741790771484e-07, -2.0116567611694336e-07, -1.7881393432617188e-07, -1.564621925354004e-07, -1.341104507446289e-07, -1.1175870895385742e-07, -8.940696716308594e-08, -6.705522537231445e-08, -4.470348358154297e-08, -2.2351741790771484e-08, 0.0, 2.2351741790771484e-08, 4.470348358154297e-08, 6.705522537231445e-08, 8.940696716308594e-08, 1.1175870895385742e-07, 1.341104507446289e-07, 1.564621925354004e-07, 1.7881393432617188e-07, 2.0116567611694336e-07, 2.2351741790771484e-07, 2.4586915969848633e-07, 2.682209014892578e-07, 2.905726432800293e-07, 3.129243850708008e-07, 3.3527612686157227e-07, 3.5762786865234375e-07, 3.7997961044311523e-07, 4.023313522338867e-07, 4.246830940246582e-07, 4.470348358154297e-07, 4.6938657760620117e-07, 4.917383193969727e-07, 5.140900611877441e-07, 5.364418029785156e-07, 5.587935447692871e-07, 5.811452865600586e-07, 6.034970283508301e-07, 6.258487701416016e-07, 6.48200511932373e-07, 6.705522537231445e-07, 6.92903995513916e-07, 7.152557373046875e-07]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 9.0, 6.0, 15.0, 9.0, 16.0, 10.0, 20.0, 19.0, 33.0, 49.0, 50.0, 35.0, 59.0, 54.0, 62.0, 57.0, 49.0, 60.0, 59.0, 68.0, 55.0, 40.0, 35.0, 29.0, 28.0, 20.0, 11.0, 18.0, 8.0, 10.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.890625, -2.8162078857421875, -2.741790771484375, -2.6673736572265625, -2.59295654296875, -2.5185394287109375, -2.444122314453125, -2.3697052001953125, -2.2952880859375, -2.2208709716796875, -2.146453857421875, -2.0720367431640625, -1.99761962890625, -1.9232025146484375, -1.848785400390625, -1.7743682861328125, -1.699951171875, -1.6255340576171875, -1.551116943359375, -1.4766998291015625, -1.40228271484375, -1.3278656005859375, -1.253448486328125, -1.1790313720703125, -1.1046142578125, -1.0301971435546875, -0.955780029296875, -0.8813629150390625, -0.80694580078125, -0.7325286865234375, -0.658111572265625, -0.5836944580078125, -0.50927734375, -0.4348602294921875, -0.360443115234375, -0.2860260009765625, -0.21160888671875, -0.1371917724609375, -0.062774658203125, 0.0116424560546875, 0.0860595703125, 0.1604766845703125, 0.234893798828125, 0.3093109130859375, 0.38372802734375, 0.4581451416015625, 0.532562255859375, 0.6069793701171875, 0.681396484375, 0.7558135986328125, 0.830230712890625, 0.9046478271484375, 0.97906494140625, 1.0534820556640625, 1.127899169921875, 1.2023162841796875, 1.2767333984375, 1.3511505126953125, 1.425567626953125, 1.4999847412109375, 1.57440185546875, 1.6488189697265625, 1.723236083984375, 1.7976531982421875, 1.8720703125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 7.0, 16.0, 10.0, 28.0, 36.0, 100.0, 177.0, 346.0, 775.0, 1841.0, 4521.0, 11392.0, 30568.0, 105352.0, 713714.0, 124879.0, 33631.0, 12617.0, 4897.0, 1970.0, 868.0, 400.0, 178.0, 88.0, 72.0, 25.0, 11.0, 8.0, 8.0, 2.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.85546875, -2.761993408203125, -2.66851806640625, -2.575042724609375, -2.4815673828125, -2.388092041015625, -2.29461669921875, -2.201141357421875, -2.107666015625, -2.014190673828125, -1.92071533203125, -1.827239990234375, -1.7337646484375, -1.640289306640625, -1.54681396484375, -1.453338623046875, -1.35986328125, -1.266387939453125, -1.17291259765625, -1.079437255859375, -0.9859619140625, -0.892486572265625, -0.79901123046875, -0.705535888671875, -0.612060546875, -0.518585205078125, -0.42510986328125, -0.331634521484375, -0.2381591796875, -0.144683837890625, -0.05120849609375, 0.042266845703125, 0.1357421875, 0.229217529296875, 0.32269287109375, 0.416168212890625, 0.5096435546875, 0.603118896484375, 0.69659423828125, 0.790069580078125, 0.883544921875, 0.977020263671875, 1.07049560546875, 1.163970947265625, 1.2574462890625, 1.350921630859375, 1.44439697265625, 1.537872314453125, 1.63134765625, 1.724822998046875, 1.81829833984375, 1.911773681640625, 2.0052490234375, 2.098724365234375, 2.19219970703125, 2.285675048828125, 2.379150390625, 2.472625732421875, 2.56610107421875, 2.659576416015625, 2.7530517578125, 2.846527099609375, 2.94000244140625, 3.033477783203125, 3.126953125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 2.0, 6.0, 3.0, 4.0, 7.0, 4.0, 9.0, 14.0, 15.0, 17.0, 13.0, 19.0, 21.0, 20.0, 19.0, 27.0, 38.0, 34.0, 33.0, 41.0, 53.0, 74.0, 110.0, 1700.0, 242.0, 102.0, 40.0, 33.0, 32.0, 43.0, 37.0, 38.0, 24.0, 26.0, 22.0, 26.0, 10.0, 15.0, 10.0, 15.0, 7.0, 9.0, 5.0, 5.0, 5.0, 2.0, 7.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.625, -5.44256591796875, -5.2601318359375, -5.07769775390625, -4.895263671875, -4.71282958984375, -4.5303955078125, -4.34796142578125, -4.16552734375, -3.98309326171875, -3.8006591796875, -3.61822509765625, -3.435791015625, -3.25335693359375, -3.0709228515625, -2.88848876953125, -2.7060546875, -2.52362060546875, -2.3411865234375, -2.15875244140625, -1.976318359375, -1.79388427734375, -1.6114501953125, -1.42901611328125, -1.24658203125, -1.06414794921875, -0.8817138671875, -0.69927978515625, -0.516845703125, -0.33441162109375, -0.1519775390625, 0.03045654296875, 0.212890625, 0.39532470703125, 0.5777587890625, 0.76019287109375, 0.942626953125, 1.12506103515625, 1.3074951171875, 1.48992919921875, 1.67236328125, 1.85479736328125, 2.0372314453125, 2.21966552734375, 2.402099609375, 2.58453369140625, 2.7669677734375, 2.94940185546875, 3.1318359375, 3.31427001953125, 3.4967041015625, 3.67913818359375, 3.861572265625, 4.04400634765625, 4.2264404296875, 4.40887451171875, 4.59130859375, 4.77374267578125, 4.9561767578125, 5.13861083984375, 5.321044921875, 5.50347900390625, 5.6859130859375, 5.86834716796875, 6.05078125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 5.0, 3.0, 3.0, 4.0, 9.0, 7.0, 7.0, 12.0, 13.0, 19.0, 14.0, 21.0, 35.0, 29.0, 39.0, 72.0, 96.0, 138.0, 239.0, 466.0, 1604.0, 11384.0, 415481.0, 2689898.0, 22125.0, 2522.0, 599.0, 297.0, 143.0, 103.0, 68.0, 58.0, 29.0, 26.0, 19.0, 24.0, 14.0, 16.0, 15.0, 10.0, 10.0, 6.0, 4.0, 4.0, 6.0, 4.0, 4.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-10.1875, -9.8800048828125, -9.572509765625, -9.2650146484375, -8.95751953125, -8.6500244140625, -8.342529296875, -8.0350341796875, -7.7275390625, -7.4200439453125, -7.112548828125, -6.8050537109375, -6.49755859375, -6.1900634765625, -5.882568359375, -5.5750732421875, -5.267578125, -4.9600830078125, -4.652587890625, -4.3450927734375, -4.03759765625, -3.7301025390625, -3.422607421875, -3.1151123046875, -2.8076171875, -2.5001220703125, -2.192626953125, -1.8851318359375, -1.57763671875, -1.2701416015625, -0.962646484375, -0.6551513671875, -0.34765625, -0.0401611328125, 0.267333984375, 0.5748291015625, 0.88232421875, 1.1898193359375, 1.497314453125, 1.8048095703125, 2.1123046875, 2.4197998046875, 2.727294921875, 3.0347900390625, 3.34228515625, 3.6497802734375, 3.957275390625, 4.2647705078125, 4.572265625, 4.8797607421875, 5.187255859375, 5.4947509765625, 5.80224609375, 6.1097412109375, 6.417236328125, 6.7247314453125, 7.0322265625, 7.3397216796875, 7.647216796875, 7.9547119140625, 8.26220703125, 8.5697021484375, 8.877197265625, 9.1846923828125, 9.4921875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 24.0, 83.0, 151.0, 265.0, 219.0, 160.0, 79.0, 22.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9689764976501465, -4.418506622314453, -3.868037223815918, -3.3175673484802246, -2.7670977115631104, -2.216628074645996, -1.6661581993103027, -1.1156885623931885, -0.5652189254760742, -0.014749228954315186, 0.5357204675674438, 1.0861902236938477, 1.636659860610962, 2.187129497528076, 2.7375993728637695, 3.288069009780884, 3.838538646697998, 4.389008522033691, 4.939477920532227, 5.48994779586792, 6.040417671203613, 6.590887069702148, 7.141356945037842, 7.691826820373535, 8.24229621887207, 8.792765617370605, 9.343235969543457, 9.893705368041992, 10.444174766540527, 10.994644165039062, 11.545114517211914, 12.09558391571045, 12.646055221557617, 13.196524620056152, 13.746994972229004, 14.297464370727539, 14.847933769226074, 15.39840316772461, 15.948873519897461, 16.499343872070312, 17.04981231689453, 17.600282669067383, 18.1507511138916, 18.701221466064453, 19.251691818237305, 19.802160263061523, 20.352630615234375, 20.903100967407227, 21.453571319580078, 22.00404167175293, 22.55451011657715, 23.10498046875, 23.65545082092285, 24.20591926574707, 24.756389617919922, 25.306859970092773, 25.857328414916992, 26.407798767089844, 26.958267211914062, 27.508737564086914, 28.059207916259766, 28.609676361083984, 29.160146713256836, 29.710617065429688, 30.261085510253906]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 3.0, 1.0, 4.0, 5.0, 11.0, 7.0, 14.0, 25.0, 19.0, 16.0, 18.0, 22.0, 28.0, 44.0, 32.0, 36.0, 37.0, 36.0, 51.0, 33.0, 39.0, 43.0, 36.0, 44.0, 36.0, 45.0, 40.0, 26.0, 26.0, 28.0, 33.0, 26.0, 16.0, 19.0, 13.0, 24.0, 15.0, 14.0, 7.0, 8.0, 1.0, 5.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.887758255004883, -18.264698028564453, -17.641637802124023, -17.018577575683594, -16.395517349243164, -15.772457122802734, -15.149397850036621, -14.526337623596191, -13.903277397155762, -13.280217170715332, -12.657156944274902, -12.034096717834473, -11.41103744506836, -10.78797721862793, -10.1649169921875, -9.54185676574707, -8.91879653930664, -8.295736312866211, -7.672676086425781, -7.04961633682251, -6.42655611038208, -5.80349588394165, -5.180436134338379, -4.557375907897949, -3.9343156814575195, -3.31125545501709, -2.6881954669952393, -2.0651354789733887, -1.442075252532959, -0.8190150260925293, -0.1959550380706787, 0.4271049499511719, 1.0501651763916016, 1.6732252836227417, 2.296285390853882, 2.9193453788757324, 3.542405605316162, 4.165465831756592, 4.788525581359863, 5.411585807800293, 6.034646034240723, 6.657706260681152, 7.280766487121582, 7.9038262367248535, 8.526885986328125, 9.149946212768555, 9.773006439208984, 10.396066665649414, 11.019126892089844, 11.642187118530273, 12.265247344970703, 12.888307571411133, 13.511367797851562, 14.134428024291992, 14.757487297058105, 15.380547523498535, 16.00360870361328, 16.62666893005371, 17.24972915649414, 17.87278938293457, 18.495849609375, 19.11890983581543, 19.74197006225586, 20.365028381347656, 20.988088607788086]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 10.0, 13.0, 10.0, 17.0, 10.0, 13.0, 20.0, 31.0, 37.0, 55.0, 37.0, 56.0, 56.0, 51.0, 68.0, 43.0, 49.0, 67.0, 66.0, 52.0, 51.0, 38.0, 33.0, 26.0, 24.0, 16.0, 15.0, 13.0, 6.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.875, -2.7997589111328125, -2.724517822265625, -2.6492767333984375, -2.57403564453125, -2.4987945556640625, -2.423553466796875, -2.3483123779296875, -2.2730712890625, -2.1978302001953125, -2.122589111328125, -2.0473480224609375, -1.97210693359375, -1.8968658447265625, -1.821624755859375, -1.7463836669921875, -1.671142578125, -1.5959014892578125, -1.520660400390625, -1.4454193115234375, -1.37017822265625, -1.2949371337890625, -1.219696044921875, -1.1444549560546875, -1.0692138671875, -0.9939727783203125, -0.918731689453125, -0.8434906005859375, -0.76824951171875, -0.6930084228515625, -0.617767333984375, -0.5425262451171875, -0.46728515625, -0.3920440673828125, -0.316802978515625, -0.2415618896484375, -0.16632080078125, -0.0910797119140625, -0.015838623046875, 0.0594024658203125, 0.1346435546875, 0.2098846435546875, 0.285125732421875, 0.3603668212890625, 0.43560791015625, 0.5108489990234375, 0.586090087890625, 0.6613311767578125, 0.736572265625, 0.8118133544921875, 0.887054443359375, 0.9622955322265625, 1.03753662109375, 1.1127777099609375, 1.188018798828125, 1.2632598876953125, 1.3385009765625, 1.4137420654296875, 1.488983154296875, 1.5642242431640625, 1.63946533203125, 1.7147064208984375, 1.789947509765625, 1.8651885986328125, 1.9404296875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 10.0, 19.0, 16.0, 15.0, 20.0, 20.0, 26.0, 40.0, 46.0, 74.0, 105.0, 252.0, 576.0, 1598.0, 7556.0, 51914.0, 676609.0, 3194326.0, 230616.0, 24316.0, 4151.0, 1070.0, 376.0, 150.0, 93.0, 86.0, 45.0, 32.0, 29.0, 26.0, 10.0, 16.0, 8.0, 9.0, 6.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.0078125, -9.7161865234375, -9.424560546875, -9.1329345703125, -8.84130859375, -8.5496826171875, -8.258056640625, -7.9664306640625, -7.6748046875, -7.3831787109375, -7.091552734375, -6.7999267578125, -6.50830078125, -6.2166748046875, -5.925048828125, -5.6334228515625, -5.341796875, -5.0501708984375, -4.758544921875, -4.4669189453125, -4.17529296875, -3.8836669921875, -3.592041015625, -3.3004150390625, -3.0087890625, -2.7171630859375, -2.425537109375, -2.1339111328125, -1.84228515625, -1.5506591796875, -1.259033203125, -0.9674072265625, -0.67578125, -0.3841552734375, -0.092529296875, 0.1990966796875, 0.49072265625, 0.7823486328125, 1.073974609375, 1.3656005859375, 1.6572265625, 1.9488525390625, 2.240478515625, 2.5321044921875, 2.82373046875, 3.1153564453125, 3.406982421875, 3.6986083984375, 3.990234375, 4.2818603515625, 4.573486328125, 4.8651123046875, 5.15673828125, 5.4483642578125, 5.739990234375, 6.0316162109375, 6.3232421875, 6.6148681640625, 6.906494140625, 7.1981201171875, 7.48974609375, 7.7813720703125, 8.072998046875, 8.3646240234375, 8.65625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 7.0, 5.0, 8.0, 16.0, 32.0, 55.0, 103.0, 163.0, 292.0, 510.0, 844.0, 840.0, 520.0, 317.0, 171.0, 96.0, 49.0, 24.0, 10.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.375, -16.03363037109375, -15.6922607421875, -15.35089111328125, -15.009521484375, -14.66815185546875, -14.3267822265625, -13.98541259765625, -13.64404296875, -13.30267333984375, -12.9613037109375, -12.61993408203125, -12.278564453125, -11.93719482421875, -11.5958251953125, -11.25445556640625, -10.9130859375, -10.57171630859375, -10.2303466796875, -9.88897705078125, -9.547607421875, -9.20623779296875, -8.8648681640625, -8.52349853515625, -8.18212890625, -7.84075927734375, -7.4993896484375, -7.15802001953125, -6.816650390625, -6.47528076171875, -6.1339111328125, -5.79254150390625, -5.451171875, -5.10980224609375, -4.7684326171875, -4.42706298828125, -4.085693359375, -3.74432373046875, -3.4029541015625, -3.06158447265625, -2.72021484375, -2.37884521484375, -2.0374755859375, -1.69610595703125, -1.354736328125, -1.01336669921875, -0.6719970703125, -0.33062744140625, 0.0107421875, 0.35211181640625, 0.6934814453125, 1.03485107421875, 1.376220703125, 1.71759033203125, 2.0589599609375, 2.40032958984375, 2.74169921875, 3.08306884765625, 3.4244384765625, 3.76580810546875, 4.107177734375, 4.44854736328125, 4.7899169921875, 5.13128662109375, 5.47265625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 13.0, 12.0, 11.0, 25.0, 31.0, 58.0, 112.0, 146.0, 365.0, 880.0, 3783.0, 57427.0, 3360730.0, 751169.0, 16427.0, 1913.0, 551.0, 230.0, 141.0, 86.0, 32.0, 38.0, 35.0, 20.0, 13.0, 8.0, 6.0, 1.0, 7.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.359375, -16.563232421875, -15.76708984375, -14.970947265625, -14.1748046875, -13.378662109375, -12.58251953125, -11.786376953125, -10.990234375, -10.194091796875, -9.39794921875, -8.601806640625, -7.8056640625, -7.009521484375, -6.21337890625, -5.417236328125, -4.62109375, -3.824951171875, -3.02880859375, -2.232666015625, -1.4365234375, -0.640380859375, 0.15576171875, 0.951904296875, 1.748046875, 2.544189453125, 3.34033203125, 4.136474609375, 4.9326171875, 5.728759765625, 6.52490234375, 7.321044921875, 8.1171875, 8.913330078125, 9.70947265625, 10.505615234375, 11.3017578125, 12.097900390625, 12.89404296875, 13.690185546875, 14.486328125, 15.282470703125, 16.07861328125, 16.874755859375, 17.6708984375, 18.467041015625, 19.26318359375, 20.059326171875, 20.85546875, 21.651611328125, 22.44775390625, 23.243896484375, 24.0400390625, 24.836181640625, 25.63232421875, 26.428466796875, 27.224609375, 28.020751953125, 28.81689453125, 29.613037109375, 30.4091796875, 31.205322265625, 32.00146484375, 32.797607421875, 33.59375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 17.0, 25.0, 43.0, 61.0, 104.0, 152.0, 153.0, 141.0, 121.0, 83.0, 56.0, 22.0, 12.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-62.122764587402344, -60.66960525512695, -59.21644592285156, -57.763282775878906, -56.310123443603516, -54.856964111328125, -53.403804779052734, -51.950645446777344, -50.49748611450195, -49.04432678222656, -47.59116744995117, -46.13800811767578, -44.684844970703125, -43.231685638427734, -41.778526306152344, -40.32536697387695, -38.87220764160156, -37.41904830932617, -35.96588897705078, -34.512725830078125, -33.059566497802734, -31.606407165527344, -30.153247833251953, -28.700088500976562, -27.246925354003906, -25.793766021728516, -24.340604782104492, -22.8874454498291, -21.43428611755371, -19.981124877929688, -18.527965545654297, -17.074806213378906, -15.621644973754883, -14.168484687805176, -12.715325355529785, -11.262165069580078, -9.809005737304688, -8.35584545135498, -6.902685165405273, -5.449525833129883, -3.996365547180176, -2.543205738067627, -1.090045690536499, 0.3631143569946289, 1.8162741661071777, 3.2694339752197266, 4.722594261169434, 6.175753593444824, 7.628913879394531, 9.082074165344238, 10.535233497619629, 11.988393783569336, 13.441553115844727, 14.894713401794434, 16.34787368774414, 17.80103302001953, 19.254192352294922, 20.707351684570312, 22.160512924194336, 23.613672256469727, 25.066831588745117, 26.51999282836914, 27.97315216064453, 29.426311492919922, 30.879472732543945]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 3.0, 2.0, 4.0, 8.0, 9.0, 13.0, 10.0, 13.0, 11.0, 15.0, 21.0, 23.0, 24.0, 18.0, 44.0, 32.0, 35.0, 42.0, 39.0, 42.0, 43.0, 39.0, 51.0, 41.0, 51.0, 44.0, 44.0, 27.0, 42.0, 37.0, 26.0, 24.0, 30.0, 22.0, 18.0, 15.0, 11.0, 6.0, 5.0, 5.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.445066452026367, -20.74574089050293, -20.046417236328125, -19.347091674804688, -18.64776611328125, -17.948440551757812, -17.249114990234375, -16.54979133605957, -15.850465774536133, -15.151140213012695, -14.451815605163574, -13.752490997314453, -13.053165435791016, -12.353839874267578, -11.654515266418457, -10.955190658569336, -10.255865097045898, -9.556539535522461, -8.85721492767334, -8.157890319824219, -7.458564758300781, -6.759239673614502, -6.059914588928223, -5.360589504241943, -4.661264419555664, -3.9619393348693848, -3.2626142501831055, -2.563289165496826, -1.8639640808105469, -1.1646389961242676, -0.4653139114379883, 0.23401117324829102, 0.9333343505859375, 1.6326594352722168, 2.331984519958496, 3.0313096046447754, 3.7306346893310547, 4.429959774017334, 5.129284858703613, 5.828609943389893, 6.527935028076172, 7.227260112762451, 7.9265851974487305, 8.625909805297852, 9.325235366821289, 10.024560928344727, 10.723885536193848, 11.423210144042969, 12.122535705566406, 12.821861267089844, 13.521185874938965, 14.220510482788086, 14.919836044311523, 15.619161605834961, 16.318485260009766, 17.017810821533203, 17.71713638305664, 18.416461944580078, 19.115787506103516, 19.81511116027832, 20.514436721801758, 21.213762283325195, 21.9130859375, 22.612411499023438, 23.311737060546875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 4.0, 9.0, 9.0, 16.0, 7.0, 14.0, 11.0, 18.0, 16.0, 32.0, 41.0, 38.0, 41.0, 46.0, 45.0, 55.0, 47.0, 56.0, 54.0, 55.0, 52.0, 51.0, 62.0, 31.0, 31.0, 35.0, 26.0, 22.0, 24.0, 12.0, 11.0, 12.0, 4.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.71875, -2.64459228515625, -2.5704345703125, -2.49627685546875, -2.422119140625, -2.34796142578125, -2.2738037109375, -2.19964599609375, -2.12548828125, -2.05133056640625, -1.9771728515625, -1.90301513671875, -1.828857421875, -1.75469970703125, -1.6805419921875, -1.60638427734375, -1.5322265625, -1.45806884765625, -1.3839111328125, -1.30975341796875, -1.235595703125, -1.16143798828125, -1.0872802734375, -1.01312255859375, -0.93896484375, -0.86480712890625, -0.7906494140625, -0.71649169921875, -0.642333984375, -0.56817626953125, -0.4940185546875, -0.41986083984375, -0.345703125, -0.27154541015625, -0.1973876953125, -0.12322998046875, -0.049072265625, 0.02508544921875, 0.0992431640625, 0.17340087890625, 0.24755859375, 0.32171630859375, 0.3958740234375, 0.47003173828125, 0.544189453125, 0.61834716796875, 0.6925048828125, 0.76666259765625, 0.8408203125, 0.91497802734375, 0.9891357421875, 1.06329345703125, 1.137451171875, 1.21160888671875, 1.2857666015625, 1.35992431640625, 1.43408203125, 1.50823974609375, 1.5823974609375, 1.65655517578125, 1.730712890625, 1.80487060546875, 1.8790283203125, 1.95318603515625, 2.02734375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 5.0, 7.0, 7.0, 3.0, 14.0, 18.0, 27.0, 38.0, 53.0, 101.0, 151.0, 239.0, 395.0, 606.0, 997.0, 1559.0, 2846.0, 4639.0, 8287.0, 14334.0, 25620.0, 49873.0, 103556.0, 307771.0, 311669.0, 105086.0, 49890.0, 26517.0, 14373.0, 8109.0, 4662.0, 2787.0, 1647.0, 1029.0, 641.0, 379.0, 240.0, 139.0, 68.0, 57.0, 42.0, 25.0, 15.0, 14.0, 12.0, 2.0, 2.0, 4.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0162353515625, -0.01575791835784912, -0.015280485153198242, -0.014803051948547363, -0.014325618743896484, -0.013848185539245605, -0.013370752334594727, -0.012893319129943848, -0.012415885925292969, -0.01193845272064209, -0.011461019515991211, -0.010983586311340332, -0.010506153106689453, -0.010028719902038574, -0.009551286697387695, -0.009073853492736816, -0.008596420288085938, -0.008118987083435059, -0.00764155387878418, -0.007164120674133301, -0.006686687469482422, -0.006209254264831543, -0.005731821060180664, -0.005254387855529785, -0.004776954650878906, -0.004299521446228027, -0.0038220882415771484, -0.0033446550369262695, -0.0028672218322753906, -0.0023897886276245117, -0.0019123554229736328, -0.001434922218322754, -0.000957489013671875, -0.0004800558090209961, -2.6226043701171875e-06, 0.0004748106002807617, 0.0009522438049316406, 0.0014296770095825195, 0.0019071102142333984, 0.0023845434188842773, 0.0028619766235351562, 0.003339409828186035, 0.003816843032836914, 0.004294276237487793, 0.004771709442138672, 0.005249142646789551, 0.00572657585144043, 0.006204009056091309, 0.0066814422607421875, 0.007158875465393066, 0.007636308670043945, 0.008113741874694824, 0.008591175079345703, 0.009068608283996582, 0.009546041488647461, 0.01002347469329834, 0.010500907897949219, 0.010978341102600098, 0.011455774307250977, 0.011933207511901855, 0.012410640716552734, 0.012888073921203613, 0.013365507125854492, 0.013842940330505371, 0.01432037353515625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 5.0, 6.0, 5.0, 9.0, 13.0, 11.0, 15.0, 12.0, 13.0, 15.0, 17.0, 20.0, 26.0, 31.0, 41.0, 39.0, 46.0, 34.0, 44.0, 49.0, 1063.0, 45.0, 31.0, 34.0, 40.0, 42.0, 39.0, 38.0, 26.0, 33.0, 28.0, 18.0, 22.0, 21.0, 22.0, 11.0, 13.0, 6.0, 6.0, 6.0, 5.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.1953125, -1.1561279296875, -1.116943359375, -1.0777587890625, -1.03857421875, -0.9993896484375, -0.960205078125, -0.9210205078125, -0.8818359375, -0.8426513671875, -0.803466796875, -0.7642822265625, -0.72509765625, -0.6859130859375, -0.646728515625, -0.6075439453125, -0.568359375, -0.5291748046875, -0.489990234375, -0.4508056640625, -0.41162109375, -0.3724365234375, -0.333251953125, -0.2940673828125, -0.2548828125, -0.2156982421875, -0.176513671875, -0.1373291015625, -0.09814453125, -0.0589599609375, -0.019775390625, 0.0194091796875, 0.05859375, 0.0977783203125, 0.136962890625, 0.1761474609375, 0.21533203125, 0.2545166015625, 0.293701171875, 0.3328857421875, 0.3720703125, 0.4112548828125, 0.450439453125, 0.4896240234375, 0.52880859375, 0.5679931640625, 0.607177734375, 0.6463623046875, 0.685546875, 0.7247314453125, 0.763916015625, 0.8031005859375, 0.84228515625, 0.8814697265625, 0.920654296875, 0.9598388671875, 0.9990234375, 1.0382080078125, 1.077392578125, 1.1165771484375, 1.15576171875, 1.1949462890625, 1.234130859375, 1.2733154296875, 1.3125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 10.0, 7.0, 21.0, 17.0, 40.0, 74.0, 76.0, 111.0, 167.0, 271.0, 447.0, 559.0, 810.0, 1207.0, 1854.0, 2759.0, 4100.0, 6238.0, 9679.0, 15103.0, 23859.0, 39471.0, 67743.0, 127778.0, 1339385.0, 214543.0, 97302.0, 54112.0, 32442.0, 19700.0, 12684.0, 8306.0, 5345.0, 3605.0, 2449.0, 1552.0, 1084.0, 757.0, 466.0, 328.0, 231.0, 129.0, 95.0, 68.0, 45.0, 34.0, 25.0, 20.0, 11.0, 6.0, 5.0, 3.0, 1.0, 5.0, 2.0], "bins": [-0.00792694091796875, -0.007692456245422363, -0.0074579715728759766, -0.00722348690032959, -0.006989002227783203, -0.006754517555236816, -0.00652003288269043, -0.006285548210144043, -0.006051063537597656, -0.0058165788650512695, -0.005582094192504883, -0.005347609519958496, -0.005113124847412109, -0.004878640174865723, -0.004644155502319336, -0.004409670829772949, -0.0041751861572265625, -0.003940701484680176, -0.003706216812133789, -0.0034717321395874023, -0.0032372474670410156, -0.003002762794494629, -0.002768278121948242, -0.0025337934494018555, -0.0022993087768554688, -0.002064824104309082, -0.0018303394317626953, -0.0015958547592163086, -0.0013613700866699219, -0.0011268854141235352, -0.0008924007415771484, -0.0006579160690307617, -0.000423431396484375, -0.00018894672393798828, 4.553794860839844e-05, 0.00028002262115478516, 0.0005145072937011719, 0.0007489919662475586, 0.0009834766387939453, 0.001217961311340332, 0.0014524459838867188, 0.0016869306564331055, 0.0019214153289794922, 0.002155900001525879, 0.0023903846740722656, 0.0026248693466186523, 0.002859354019165039, 0.0030938386917114258, 0.0033283233642578125, 0.0035628080368041992, 0.003797292709350586, 0.004031777381896973, 0.004266262054443359, 0.004500746726989746, 0.004735231399536133, 0.0049697160720825195, 0.005204200744628906, 0.005438685417175293, 0.00567317008972168, 0.005907654762268066, 0.006142139434814453, 0.00637662410736084, 0.0066111087799072266, 0.006845593452453613, 0.007080078125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1000.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [9.0, 0.0, 6.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 20.0, 0.0, 0.0, 61.0, 0.0, 960.0, 0.0, 0.0, 5984.0, 0.0, 0.0, 1034427.0, 0.0, 6024.0, 0.0, 0.0, 944.0, 0.0, 0.0, 55.0, 0.0, 17.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 5.0, 0.0, 4.0], "bins": [-7.152557373046875e-07, -6.92903995513916e-07, -6.705522537231445e-07, -6.48200511932373e-07, -6.258487701416016e-07, -6.034970283508301e-07, -5.811452865600586e-07, -5.587935447692871e-07, -5.364418029785156e-07, -5.140900611877441e-07, -4.917383193969727e-07, -4.6938657760620117e-07, -4.470348358154297e-07, -4.246830940246582e-07, -4.023313522338867e-07, -3.7997961044311523e-07, -3.5762786865234375e-07, -3.3527612686157227e-07, -3.129243850708008e-07, -2.905726432800293e-07, -2.682209014892578e-07, -2.4586915969848633e-07, -2.2351741790771484e-07, -2.0116567611694336e-07, -1.7881393432617188e-07, -1.564621925354004e-07, -1.341104507446289e-07, -1.1175870895385742e-07, -8.940696716308594e-08, -6.705522537231445e-08, -4.470348358154297e-08, -2.2351741790771484e-08, 0.0, 2.2351741790771484e-08, 4.470348358154297e-08, 6.705522537231445e-08, 8.940696716308594e-08, 1.1175870895385742e-07, 1.341104507446289e-07, 1.564621925354004e-07, 1.7881393432617188e-07, 2.0116567611694336e-07, 2.2351741790771484e-07, 2.4586915969848633e-07, 2.682209014892578e-07, 2.905726432800293e-07, 3.129243850708008e-07, 3.3527612686157227e-07, 3.5762786865234375e-07, 3.7997961044311523e-07, 4.023313522338867e-07, 4.246830940246582e-07, 4.470348358154297e-07, 4.6938657760620117e-07, 4.917383193969727e-07, 5.140900611877441e-07, 5.364418029785156e-07, 5.587935447692871e-07, 5.811452865600586e-07, 6.034970283508301e-07, 6.258487701416016e-07, 6.48200511932373e-07, 6.705522537231445e-07, 6.92903995513916e-07, 7.152557373046875e-07]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 4.0, 9.0, 9.0, 16.0, 7.0, 14.0, 11.0, 18.0, 16.0, 32.0, 41.0, 38.0, 41.0, 46.0, 45.0, 55.0, 47.0, 56.0, 54.0, 55.0, 52.0, 51.0, 62.0, 31.0, 31.0, 35.0, 26.0, 22.0, 24.0, 12.0, 11.0, 12.0, 4.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.71875, -2.64459228515625, -2.5704345703125, -2.49627685546875, -2.422119140625, -2.34796142578125, -2.2738037109375, -2.19964599609375, -2.12548828125, -2.05133056640625, -1.9771728515625, -1.90301513671875, -1.828857421875, -1.75469970703125, -1.6805419921875, -1.60638427734375, -1.5322265625, -1.45806884765625, -1.3839111328125, -1.30975341796875, -1.235595703125, -1.16143798828125, -1.0872802734375, -1.01312255859375, -0.93896484375, -0.86480712890625, -0.7906494140625, -0.71649169921875, -0.642333984375, -0.56817626953125, -0.4940185546875, -0.41986083984375, -0.345703125, -0.27154541015625, -0.1973876953125, -0.12322998046875, -0.049072265625, 0.02508544921875, 0.0992431640625, 0.17340087890625, 0.24755859375, 0.32171630859375, 0.3958740234375, 0.47003173828125, 0.544189453125, 0.61834716796875, 0.6925048828125, 0.76666259765625, 0.8408203125, 0.91497802734375, 0.9891357421875, 1.06329345703125, 1.137451171875, 1.21160888671875, 1.2857666015625, 1.35992431640625, 1.43408203125, 1.50823974609375, 1.5823974609375, 1.65655517578125, 1.730712890625, 1.80487060546875, 1.8790283203125, 1.95318603515625, 2.02734375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 10.0, 8.0, 23.0, 19.0, 36.0, 60.0, 60.0, 115.0, 161.0, 254.0, 363.0, 587.0, 950.0, 1584.0, 2423.0, 4055.0, 6975.0, 12453.0, 24466.0, 57204.0, 192700.0, 506814.0, 141809.0, 47304.0, 21099.0, 11187.0, 6102.0, 3666.0, 2216.0, 1381.0, 893.0, 550.0, 344.0, 239.0, 156.0, 108.0, 57.0, 41.0, 29.0, 23.0, 12.0, 12.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.568359375, -1.5252685546875, -1.482177734375, -1.4390869140625, -1.39599609375, -1.3529052734375, -1.309814453125, -1.2667236328125, -1.2236328125, -1.1805419921875, -1.137451171875, -1.0943603515625, -1.05126953125, -1.0081787109375, -0.965087890625, -0.9219970703125, -0.87890625, -0.8358154296875, -0.792724609375, -0.7496337890625, -0.70654296875, -0.6634521484375, -0.620361328125, -0.5772705078125, -0.5341796875, -0.4910888671875, -0.447998046875, -0.4049072265625, -0.36181640625, -0.3187255859375, -0.275634765625, -0.2325439453125, -0.189453125, -0.1463623046875, -0.103271484375, -0.0601806640625, -0.01708984375, 0.0260009765625, 0.069091796875, 0.1121826171875, 0.1552734375, 0.1983642578125, 0.241455078125, 0.2845458984375, 0.32763671875, 0.3707275390625, 0.413818359375, 0.4569091796875, 0.5, 0.5430908203125, 0.586181640625, 0.6292724609375, 0.67236328125, 0.7154541015625, 0.758544921875, 0.8016357421875, 0.8447265625, 0.8878173828125, 0.930908203125, 0.9739990234375, 1.01708984375, 1.0601806640625, 1.103271484375, 1.1463623046875, 1.189453125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 6.0, 7.0, 9.0, 10.0, 13.0, 14.0, 19.0, 30.0, 26.0, 40.0, 42.0, 52.0, 44.0, 63.0, 93.0, 317.0, 1706.0, 97.0, 72.0, 65.0, 55.0, 51.0, 39.0, 32.0, 22.0, 20.0, 21.0, 23.0, 9.0, 11.0, 13.0, 9.0, 7.0, 2.0, 1.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.9453125, -7.6815185546875, -7.417724609375, -7.1539306640625, -6.89013671875, -6.6263427734375, -6.362548828125, -6.0987548828125, -5.8349609375, -5.5711669921875, -5.307373046875, -5.0435791015625, -4.77978515625, -4.5159912109375, -4.252197265625, -3.9884033203125, -3.724609375, -3.4608154296875, -3.197021484375, -2.9332275390625, -2.66943359375, -2.4056396484375, -2.141845703125, -1.8780517578125, -1.6142578125, -1.3504638671875, -1.086669921875, -0.8228759765625, -0.55908203125, -0.2952880859375, -0.031494140625, 0.2322998046875, 0.49609375, 0.7598876953125, 1.023681640625, 1.2874755859375, 1.55126953125, 1.8150634765625, 2.078857421875, 2.3426513671875, 2.6064453125, 2.8702392578125, 3.134033203125, 3.3978271484375, 3.66162109375, 3.9254150390625, 4.189208984375, 4.4530029296875, 4.716796875, 4.9805908203125, 5.244384765625, 5.5081787109375, 5.77197265625, 6.0357666015625, 6.299560546875, 6.5633544921875, 6.8271484375, 7.0909423828125, 7.354736328125, 7.6185302734375, 7.88232421875, 8.1461181640625, 8.409912109375, 8.6737060546875, 8.9375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 6.0, 16.0, 9.0, 10.0, 15.0, 19.0, 22.0, 28.0, 47.0, 67.0, 92.0, 147.0, 247.0, 405.0, 981.0, 3352.0, 23011.0, 2669611.0, 429122.0, 14348.0, 2339.0, 807.0, 350.0, 232.0, 119.0, 80.0, 51.0, 42.0, 30.0, 17.0, 17.0, 10.0, 11.0, 8.0, 8.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-11.25, -10.9180908203125, -10.586181640625, -10.2542724609375, -9.92236328125, -9.5904541015625, -9.258544921875, -8.9266357421875, -8.5947265625, -8.2628173828125, -7.930908203125, -7.5989990234375, -7.26708984375, -6.9351806640625, -6.603271484375, -6.2713623046875, -5.939453125, -5.6075439453125, -5.275634765625, -4.9437255859375, -4.61181640625, -4.2799072265625, -3.947998046875, -3.6160888671875, -3.2841796875, -2.9522705078125, -2.620361328125, -2.2884521484375, -1.95654296875, -1.6246337890625, -1.292724609375, -0.9608154296875, -0.62890625, -0.2969970703125, 0.034912109375, 0.3668212890625, 0.69873046875, 1.0306396484375, 1.362548828125, 1.6944580078125, 2.0263671875, 2.3582763671875, 2.690185546875, 3.0220947265625, 3.35400390625, 3.6859130859375, 4.017822265625, 4.3497314453125, 4.681640625, 5.0135498046875, 5.345458984375, 5.6773681640625, 6.00927734375, 6.3411865234375, 6.673095703125, 7.0050048828125, 7.3369140625, 7.6688232421875, 8.000732421875, 8.3326416015625, 8.66455078125, 8.9964599609375, 9.328369140625, 9.6602783203125, 9.9921875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 734.0, 282.0, 1.0], "bins": [-292.466796875, -287.7378845214844, -283.0090026855469, -278.28009033203125, -273.55120849609375, -268.8222961425781, -264.0933837890625, -259.364501953125, -254.63558959960938, -249.9066925048828, -245.17779541015625, -240.44888305664062, -235.71998596191406, -230.9910888671875, -226.26219177246094, -221.53329467773438, -216.8043975830078, -212.07550048828125, -207.3466033935547, -202.61769104003906, -197.8887939453125, -193.15989685058594, -188.43099975585938, -183.7021026611328, -178.97320556640625, -174.2443084716797, -169.51541137695312, -164.7864990234375, -160.05760192871094, -155.32870483398438, -150.5998077392578, -145.87091064453125, -141.14199829101562, -136.41310119628906, -131.6842041015625, -126.9552993774414, -122.22639465332031, -117.49749755859375, -112.76860046386719, -108.03970336914062, -103.31079864501953, -98.58190155029297, -93.85299682617188, -89.12409973144531, -84.39520263671875, -79.66629791259766, -74.9374008178711, -70.20849609375, -65.47959899902344, -60.75069808959961, -56.02179718017578, -51.29290008544922, -46.56399917602539, -41.83509826660156, -37.106201171875, -32.37730026245117, -27.648401260375977, -22.91950225830078, -18.190601348876953, -13.461701393127441, -8.73280143737793, -4.003900527954102, 0.7249984741210938, 5.453897476196289, 10.182798385620117]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 8.0, 1.0, 3.0, 7.0, 8.0, 10.0, 16.0, 14.0, 18.0, 22.0, 18.0, 22.0, 22.0, 21.0, 20.0, 22.0, 38.0, 36.0, 24.0, 42.0, 30.0, 37.0, 29.0, 46.0, 29.0, 32.0, 42.0, 43.0, 38.0, 34.0, 27.0, 27.0, 20.0, 28.0, 24.0, 26.0, 23.0, 14.0, 13.0, 15.0, 10.0, 8.0, 8.0, 5.0, 7.0, 6.0, 6.0, 5.0, 0.0, 3.0, 4.0, 0.0, 1.0], "bins": [-21.769140243530273, -21.129335403442383, -20.489532470703125, -19.849727630615234, -19.209924697875977, -18.570119857788086, -17.930316925048828, -17.290512084960938, -16.650707244873047, -16.010902404785156, -15.371099472045898, -14.731295585632324, -14.09149169921875, -13.45168685913086, -12.811882972717285, -12.172079086303711, -11.532276153564453, -10.892472267150879, -10.252668380737305, -9.61286449432373, -8.973060607910156, -8.333255767822266, -7.693451881408691, -7.053647994995117, -6.413844108581543, -5.774040222167969, -5.1342363357543945, -4.494431972503662, -3.854628086090088, -3.2148241996765137, -2.5750200748443604, -1.935215950012207, -1.2954120635986328, -0.655608057975769, -0.015804052352905273, 0.6239999532699585, 1.2638039588928223, 1.9036078453063965, 2.54341197013855, 3.183216094970703, 3.8230199813842773, 4.462823867797852, 5.102627754211426, 5.742432117462158, 6.382236003875732, 7.022039890289307, 7.661844253540039, 8.301648139953613, 8.941452026367188, 9.581255912780762, 10.221059799194336, 10.86086368560791, 11.500667572021484, 12.140472412109375, 12.78027629852295, 13.420080184936523, 14.059884071350098, 14.699687957763672, 15.339491844177246, 15.97929573059082, 16.61910057067871, 17.25890350341797, 17.89870834350586, 18.53851318359375, 19.178316116333008]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 9.0, 8.0, 10.0, 12.0, 9.0, 8.0, 8.0, 16.0, 24.0, 24.0, 29.0, 39.0, 52.0, 44.0, 42.0, 50.0, 48.0, 46.0, 65.0, 56.0, 54.0, 48.0, 48.0, 49.0, 44.0, 33.0, 20.0, 25.0, 15.0, 22.0, 14.0, 11.0, 5.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.787109375, -2.711669921875, -2.63623046875, -2.560791015625, -2.4853515625, -2.409912109375, -2.33447265625, -2.259033203125, -2.18359375, -2.108154296875, -2.03271484375, -1.957275390625, -1.8818359375, -1.806396484375, -1.73095703125, -1.655517578125, -1.580078125, -1.504638671875, -1.42919921875, -1.353759765625, -1.2783203125, -1.202880859375, -1.12744140625, -1.052001953125, -0.9765625, -0.901123046875, -0.82568359375, -0.750244140625, -0.6748046875, -0.599365234375, -0.52392578125, -0.448486328125, -0.373046875, -0.297607421875, -0.22216796875, -0.146728515625, -0.0712890625, 0.004150390625, 0.07958984375, 0.155029296875, 0.23046875, 0.305908203125, 0.38134765625, 0.456787109375, 0.5322265625, 0.607666015625, 0.68310546875, 0.758544921875, 0.833984375, 0.909423828125, 0.98486328125, 1.060302734375, 1.1357421875, 1.211181640625, 1.28662109375, 1.362060546875, 1.4375, 1.512939453125, 1.58837890625, 1.663818359375, 1.7392578125, 1.814697265625, 1.89013671875, 1.965576171875, 2.041015625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 17.0, 12.0, 13.0, 20.0, 22.0, 35.0, 66.0, 127.0, 210.0, 486.0, 1144.0, 3100.0, 9495.0, 34004.0, 150617.0, 1156212.0, 2426968.0, 324908.0, 62266.0, 16302.0, 4927.0, 1816.0, 709.0, 357.0, 171.0, 99.0, 47.0, 35.0, 26.0, 19.0, 13.0, 10.0, 3.0, 5.0, 6.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.87109375, -6.68646240234375, -6.5018310546875, -6.31719970703125, -6.132568359375, -5.94793701171875, -5.7633056640625, -5.57867431640625, -5.39404296875, -5.20941162109375, -5.0247802734375, -4.84014892578125, -4.655517578125, -4.47088623046875, -4.2862548828125, -4.10162353515625, -3.9169921875, -3.73236083984375, -3.5477294921875, -3.36309814453125, -3.178466796875, -2.99383544921875, -2.8092041015625, -2.62457275390625, -2.43994140625, -2.25531005859375, -2.0706787109375, -1.88604736328125, -1.701416015625, -1.51678466796875, -1.3321533203125, -1.14752197265625, -0.962890625, -0.77825927734375, -0.5936279296875, -0.40899658203125, -0.224365234375, -0.03973388671875, 0.1448974609375, 0.32952880859375, 0.51416015625, 0.69879150390625, 0.8834228515625, 1.06805419921875, 1.252685546875, 1.43731689453125, 1.6219482421875, 1.80657958984375, 1.9912109375, 2.17584228515625, 2.3604736328125, 2.54510498046875, 2.729736328125, 2.91436767578125, 3.0989990234375, 3.28363037109375, 3.46826171875, 3.65289306640625, 3.8375244140625, 4.02215576171875, 4.206787109375, 4.39141845703125, 4.5760498046875, 4.76068115234375, 4.9453125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 11.0, 5.0, 16.0, 21.0, 20.0, 25.0, 44.0, 69.0, 96.0, 132.0, 211.0, 343.0, 473.0, 563.0, 572.0, 432.0, 335.0, 224.0, 148.0, 94.0, 78.0, 54.0, 38.0, 20.0, 19.0, 11.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.1875, -8.9576416015625, -8.727783203125, -8.4979248046875, -8.26806640625, -8.0382080078125, -7.808349609375, -7.5784912109375, -7.3486328125, -7.1187744140625, -6.888916015625, -6.6590576171875, -6.42919921875, -6.1993408203125, -5.969482421875, -5.7396240234375, -5.509765625, -5.2799072265625, -5.050048828125, -4.8201904296875, -4.59033203125, -4.3604736328125, -4.130615234375, -3.9007568359375, -3.6708984375, -3.4410400390625, -3.211181640625, -2.9813232421875, -2.75146484375, -2.5216064453125, -2.291748046875, -2.0618896484375, -1.83203125, -1.6021728515625, -1.372314453125, -1.1424560546875, -0.91259765625, -0.6827392578125, -0.452880859375, -0.2230224609375, 0.0068359375, 0.2366943359375, 0.466552734375, 0.6964111328125, 0.92626953125, 1.1561279296875, 1.385986328125, 1.6158447265625, 1.845703125, 2.0755615234375, 2.305419921875, 2.5352783203125, 2.76513671875, 2.9949951171875, 3.224853515625, 3.4547119140625, 3.6845703125, 3.9144287109375, 4.144287109375, 4.3741455078125, 4.60400390625, 4.8338623046875, 5.063720703125, 5.2935791015625, 5.5234375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 17.0, 30.0, 38.0, 69.0, 113.0, 226.0, 363.0, 844.0, 2212.0, 8960.0, 62659.0, 813458.0, 3031703.0, 241598.0, 24755.0, 4599.0, 1402.0, 592.0, 274.0, 135.0, 92.0, 56.0, 32.0, 24.0, 10.0, 10.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.5859375, -13.1219482421875, -12.657958984375, -12.1939697265625, -11.72998046875, -11.2659912109375, -10.802001953125, -10.3380126953125, -9.8740234375, -9.4100341796875, -8.946044921875, -8.4820556640625, -8.01806640625, -7.5540771484375, -7.090087890625, -6.6260986328125, -6.162109375, -5.6981201171875, -5.234130859375, -4.7701416015625, -4.30615234375, -3.8421630859375, -3.378173828125, -2.9141845703125, -2.4501953125, -1.9862060546875, -1.522216796875, -1.0582275390625, -0.59423828125, -0.1302490234375, 0.333740234375, 0.7977294921875, 1.26171875, 1.7257080078125, 2.189697265625, 2.6536865234375, 3.11767578125, 3.5816650390625, 4.045654296875, 4.5096435546875, 4.9736328125, 5.4376220703125, 5.901611328125, 6.3656005859375, 6.82958984375, 7.2935791015625, 7.757568359375, 8.2215576171875, 8.685546875, 9.1495361328125, 9.613525390625, 10.0775146484375, 10.54150390625, 11.0054931640625, 11.469482421875, 11.9334716796875, 12.3974609375, 12.8614501953125, 13.325439453125, 13.7894287109375, 14.25341796875, 14.7174072265625, 15.181396484375, 15.6453857421875, 16.109375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 8.0, 16.0, 22.0, 51.0, 76.0, 88.0, 120.0, 135.0, 148.0, 122.0, 69.0, 63.0, 38.0, 21.0, 12.0, 8.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.174633026123047, -26.935260772705078, -25.69588851928711, -24.45651626586914, -23.217144012451172, -21.977771759033203, -20.738399505615234, -19.499027252197266, -18.259654998779297, -17.020282745361328, -15.78091049194336, -14.54153823852539, -13.302165985107422, -12.062793731689453, -10.823421478271484, -9.584049224853516, -8.344676971435547, -7.105304718017578, -5.865932464599609, -4.626560211181641, -3.387187957763672, -2.147815704345703, -0.9084434509277344, 0.3309288024902344, 1.5703010559082031, 2.809673309326172, 4.049045562744141, 5.288417816162109, 6.527790069580078, 7.767162322998047, 9.006534576416016, 10.245906829833984, 11.485282897949219, 12.724655151367188, 13.964027404785156, 15.203399658203125, 16.442771911621094, 17.682144165039062, 18.92151641845703, 20.160888671875, 21.40026092529297, 22.639633178710938, 23.879005432128906, 25.118377685546875, 26.357749938964844, 27.597122192382812, 28.83649444580078, 30.07586669921875, 31.31523895263672, 32.55461120605469, 33.793983459472656, 35.033355712890625, 36.272727966308594, 37.51210021972656, 38.75147247314453, 39.9908447265625, 41.23021697998047, 42.46958923339844, 43.708961486816406, 44.948333740234375, 46.187705993652344, 47.42707824707031, 48.66645050048828, 49.90582275390625, 51.14519500732422]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 2.0, 7.0, 6.0, 9.0, 10.0, 16.0, 15.0, 10.0, 18.0, 18.0, 22.0, 32.0, 30.0, 40.0, 29.0, 39.0, 47.0, 41.0, 36.0, 31.0, 52.0, 47.0, 50.0, 51.0, 43.0, 34.0, 40.0, 28.0, 20.0, 27.0, 27.0, 19.0, 18.0, 21.0, 12.0, 13.0, 8.0, 8.0, 11.0, 7.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.300743103027344, -20.645584106445312, -19.99042320251465, -19.335264205932617, -18.680103302001953, -18.024944305419922, -17.36978530883789, -16.71462631225586, -16.059465408325195, -15.404305458068848, -14.7491455078125, -14.093986511230469, -13.438826560974121, -12.783666610717773, -12.128507614135742, -11.473347663879395, -10.818187713623047, -10.1630277633667, -9.507867813110352, -8.85270881652832, -8.197548866271973, -7.542388916015625, -6.8872294425964355, -6.232069969177246, -5.576910018920898, -4.921750068664551, -4.266590595245361, -3.6114308834075928, -2.956271171569824, -2.3011114597320557, -1.645951747894287, -0.9907922744750977, -0.33563232421875, 0.31952738761901855, 0.9746870994567871, 1.6298468112945557, 2.285006523132324, 2.9401662349700928, 3.5953259468078613, 4.250485420227051, 4.905645370483398, 5.560805320739746, 6.2159647941589355, 6.871124267578125, 7.526284217834473, 8.18144416809082, 8.836603164672852, 9.4917631149292, 10.146923065185547, 10.802083015441895, 11.457242965698242, 12.112401962280273, 12.767561912536621, 13.422721862792969, 14.077880859375, 14.733040809631348, 15.388200759887695, 16.043359756469727, 16.69852066040039, 17.353679656982422, 18.008838653564453, 18.663999557495117, 19.31915855407715, 19.974319458007812, 20.629478454589844]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 6.0, 14.0, 11.0, 10.0, 7.0, 17.0, 19.0, 21.0, 22.0, 32.0, 39.0, 42.0, 47.0, 38.0, 43.0, 52.0, 56.0, 54.0, 56.0, 46.0, 38.0, 50.0, 40.0, 45.0, 32.0, 35.0, 22.0, 19.0, 20.0, 16.0, 12.0, 14.0, 8.0, 5.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.630859375, -2.5557861328125, -2.480712890625, -2.4056396484375, -2.33056640625, -2.2554931640625, -2.180419921875, -2.1053466796875, -2.0302734375, -1.9552001953125, -1.880126953125, -1.8050537109375, -1.72998046875, -1.6549072265625, -1.579833984375, -1.5047607421875, -1.4296875, -1.3546142578125, -1.279541015625, -1.2044677734375, -1.12939453125, -1.0543212890625, -0.979248046875, -0.9041748046875, -0.8291015625, -0.7540283203125, -0.678955078125, -0.6038818359375, -0.52880859375, -0.4537353515625, -0.378662109375, -0.3035888671875, -0.228515625, -0.1534423828125, -0.078369140625, -0.0032958984375, 0.07177734375, 0.1468505859375, 0.221923828125, 0.2969970703125, 0.3720703125, 0.4471435546875, 0.522216796875, 0.5972900390625, 0.67236328125, 0.7474365234375, 0.822509765625, 0.8975830078125, 0.97265625, 1.0477294921875, 1.122802734375, 1.1978759765625, 1.27294921875, 1.3480224609375, 1.423095703125, 1.4981689453125, 1.5732421875, 1.6483154296875, 1.723388671875, 1.7984619140625, 1.87353515625, 1.9486083984375, 2.023681640625, 2.0987548828125, 2.173828125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 8.0, 14.0, 18.0, 23.0, 28.0, 65.0, 79.0, 123.0, 213.0, 349.0, 516.0, 825.0, 1340.0, 1955.0, 3110.0, 4808.0, 7814.0, 12557.0, 20268.0, 34231.0, 59463.0, 112473.0, 320617.0, 243186.0, 94681.0, 51462.0, 30040.0, 17862.0, 11138.0, 7071.0, 4385.0, 2882.0, 1790.0, 1129.0, 733.0, 473.0, 304.0, 181.0, 112.0, 77.0, 47.0, 23.0, 29.0, 17.0, 8.0, 6.0, 2.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.01385498046875, -0.013433575630187988, -0.013012170791625977, -0.012590765953063965, -0.012169361114501953, -0.011747956275939941, -0.01132655143737793, -0.010905146598815918, -0.010483741760253906, -0.010062336921691895, -0.009640932083129883, -0.009219527244567871, -0.00879812240600586, -0.008376717567443848, -0.007955312728881836, -0.007533907890319824, -0.0071125030517578125, -0.006691098213195801, -0.006269693374633789, -0.005848288536071777, -0.005426883697509766, -0.005005478858947754, -0.004584074020385742, -0.0041626691818237305, -0.0037412643432617188, -0.003319859504699707, -0.0028984546661376953, -0.0024770498275756836, -0.002055644989013672, -0.0016342401504516602, -0.0012128353118896484, -0.0007914304733276367, -0.000370025634765625, 5.137920379638672e-05, 0.00047278404235839844, 0.0008941888809204102, 0.0013155937194824219, 0.0017369985580444336, 0.0021584033966064453, 0.002579808235168457, 0.0030012130737304688, 0.0034226179122924805, 0.003844022750854492, 0.004265427589416504, 0.004686832427978516, 0.005108237266540527, 0.005529642105102539, 0.005951046943664551, 0.0063724517822265625, 0.006793856620788574, 0.007215261459350586, 0.007636666297912598, 0.00805807113647461, 0.008479475975036621, 0.008900880813598633, 0.009322285652160645, 0.009743690490722656, 0.010165095329284668, 0.01058650016784668, 0.011007905006408691, 0.011429309844970703, 0.011850714683532715, 0.012272119522094727, 0.012693524360656738, 0.01311492919921875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 11.0, 16.0, 12.0, 12.0, 27.0, 21.0, 29.0, 30.0, 34.0, 40.0, 38.0, 36.0, 38.0, 45.0, 42.0, 1078.0, 38.0, 46.0, 50.0, 40.0, 32.0, 50.0, 44.0, 21.0, 26.0, 22.0, 27.0, 24.0, 20.0, 16.0, 8.0, 8.0, 9.0, 9.0, 6.0, 7.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0], "bins": [-1.740234375, -1.6942138671875, -1.648193359375, -1.6021728515625, -1.55615234375, -1.5101318359375, -1.464111328125, -1.4180908203125, -1.3720703125, -1.3260498046875, -1.280029296875, -1.2340087890625, -1.18798828125, -1.1419677734375, -1.095947265625, -1.0499267578125, -1.00390625, -0.9578857421875, -0.911865234375, -0.8658447265625, -0.81982421875, -0.7738037109375, -0.727783203125, -0.6817626953125, -0.6357421875, -0.5897216796875, -0.543701171875, -0.4976806640625, -0.45166015625, -0.4056396484375, -0.359619140625, -0.3135986328125, -0.267578125, -0.2215576171875, -0.175537109375, -0.1295166015625, -0.08349609375, -0.0374755859375, 0.008544921875, 0.0545654296875, 0.1005859375, 0.1466064453125, 0.192626953125, 0.2386474609375, 0.28466796875, 0.3306884765625, 0.376708984375, 0.4227294921875, 0.46875, 0.5147705078125, 0.560791015625, 0.6068115234375, 0.65283203125, 0.6988525390625, 0.744873046875, 0.7908935546875, 0.8369140625, 0.8829345703125, 0.928955078125, 0.9749755859375, 1.02099609375, 1.0670166015625, 1.113037109375, 1.1590576171875, 1.205078125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 13.0, 5.0, 8.0, 21.0, 34.0, 54.0, 69.0, 117.0, 220.0, 349.0, 589.0, 972.0, 1752.0, 2759.0, 5069.0, 8621.0, 15150.0, 27375.0, 50093.0, 95903.0, 227885.0, 1382660.0, 131264.0, 65419.0, 35183.0, 19437.0, 10828.0, 6288.0, 3648.0, 2097.0, 1246.0, 758.0, 471.0, 278.0, 174.0, 128.0, 82.0, 38.0, 22.0, 13.0, 14.0, 15.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00922393798828125, -0.0089186429977417, -0.008613348007202148, -0.008308053016662598, -0.008002758026123047, -0.007697463035583496, -0.007392168045043945, -0.0070868730545043945, -0.006781578063964844, -0.006476283073425293, -0.006170988082885742, -0.005865693092346191, -0.005560398101806641, -0.00525510311126709, -0.004949808120727539, -0.004644513130187988, -0.0043392181396484375, -0.004033923149108887, -0.003728628158569336, -0.003423333168029785, -0.0031180381774902344, -0.0028127431869506836, -0.002507448196411133, -0.002202153205871582, -0.0018968582153320312, -0.0015915632247924805, -0.0012862682342529297, -0.000980973243713379, -0.0006756782531738281, -0.00037038326263427734, -6.508827209472656e-05, 0.00024020671844482422, 0.000545501708984375, 0.0008507966995239258, 0.0011560916900634766, 0.0014613866806030273, 0.0017666816711425781, 0.002071976661682129, 0.0023772716522216797, 0.0026825666427612305, 0.0029878616333007812, 0.003293156623840332, 0.003598451614379883, 0.0039037466049194336, 0.004209041595458984, 0.004514336585998535, 0.004819631576538086, 0.005124926567077637, 0.0054302215576171875, 0.005735516548156738, 0.006040811538696289, 0.00634610652923584, 0.006651401519775391, 0.006956696510314941, 0.007261991500854492, 0.007567286491394043, 0.007872581481933594, 0.008177876472473145, 0.008483171463012695, 0.008788466453552246, 0.009093761444091797, 0.009399056434631348, 0.009704351425170898, 0.01000964641571045, 0.01031494140625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 979.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 7.0, 20.0, 1.0, 0.0, 4.0, 2.0, 5.0, 0.0, 13.0, 40.0, 55.0, 0.0, 313.0, 2397.0, 10804.0, 0.0, 1021150.0, 10988.0, 2288.0, 0.0, 315.0, 72.0, 37.0, 0.0, 24.0, 4.0, 3.0, 0.0, 3.0, 0.0, 11.0, 0.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.430511474609375e-06, -1.385807991027832e-06, -1.341104507446289e-06, -1.296401023864746e-06, -1.2516975402832031e-06, -1.2069940567016602e-06, -1.1622905731201172e-06, -1.1175870895385742e-06, -1.0728836059570312e-06, -1.0281801223754883e-06, -9.834766387939453e-07, -9.387731552124023e-07, -8.940696716308594e-07, -8.493661880493164e-07, -8.046627044677734e-07, -7.599592208862305e-07, -7.152557373046875e-07, -6.705522537231445e-07, -6.258487701416016e-07, -5.811452865600586e-07, -5.364418029785156e-07, -4.917383193969727e-07, -4.470348358154297e-07, -4.023313522338867e-07, -3.5762786865234375e-07, -3.129243850708008e-07, -2.682209014892578e-07, -2.2351741790771484e-07, -1.7881393432617188e-07, -1.341104507446289e-07, -8.940696716308594e-08, -4.470348358154297e-08, 0.0, 4.470348358154297e-08, 8.940696716308594e-08, 1.341104507446289e-07, 1.7881393432617188e-07, 2.2351741790771484e-07, 2.682209014892578e-07, 3.129243850708008e-07, 3.5762786865234375e-07, 4.023313522338867e-07, 4.470348358154297e-07, 4.917383193969727e-07, 5.364418029785156e-07, 5.811452865600586e-07, 6.258487701416016e-07, 6.705522537231445e-07, 7.152557373046875e-07, 7.599592208862305e-07, 8.046627044677734e-07, 8.493661880493164e-07, 8.940696716308594e-07, 9.387731552124023e-07, 9.834766387939453e-07, 1.0281801223754883e-06, 1.0728836059570312e-06, 1.1175870895385742e-06, 1.1622905731201172e-06, 1.2069940567016602e-06, 1.2516975402832031e-06, 1.296401023864746e-06, 1.341104507446289e-06, 1.385807991027832e-06, 1.430511474609375e-06]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 6.0, 14.0, 11.0, 10.0, 7.0, 17.0, 19.0, 21.0, 22.0, 32.0, 39.0, 42.0, 47.0, 38.0, 43.0, 52.0, 56.0, 54.0, 56.0, 46.0, 38.0, 50.0, 40.0, 45.0, 32.0, 35.0, 22.0, 19.0, 20.0, 16.0, 12.0, 14.0, 8.0, 5.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.630859375, -2.5557861328125, -2.480712890625, -2.4056396484375, -2.33056640625, -2.2554931640625, -2.180419921875, -2.1053466796875, -2.0302734375, -1.9552001953125, -1.880126953125, -1.8050537109375, -1.72998046875, -1.6549072265625, -1.579833984375, -1.5047607421875, -1.4296875, -1.3546142578125, -1.279541015625, -1.2044677734375, -1.12939453125, -1.0543212890625, -0.979248046875, -0.9041748046875, -0.8291015625, -0.7540283203125, -0.678955078125, -0.6038818359375, -0.52880859375, -0.4537353515625, -0.378662109375, -0.3035888671875, -0.228515625, -0.1534423828125, -0.078369140625, -0.0032958984375, 0.07177734375, 0.1468505859375, 0.221923828125, 0.2969970703125, 0.3720703125, 0.4471435546875, 0.522216796875, 0.5972900390625, 0.67236328125, 0.7474365234375, 0.822509765625, 0.8975830078125, 0.97265625, 1.0477294921875, 1.122802734375, 1.1978759765625, 1.27294921875, 1.3480224609375, 1.423095703125, 1.4981689453125, 1.5732421875, 1.6483154296875, 1.723388671875, 1.7984619140625, 1.87353515625, 1.9486083984375, 2.023681640625, 2.0987548828125, 2.173828125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 9.0, 7.0, 13.0, 15.0, 22.0, 27.0, 51.0, 77.0, 85.0, 107.0, 181.0, 272.0, 379.0, 552.0, 844.0, 1183.0, 1778.0, 2760.0, 4125.0, 6688.0, 10928.0, 19352.0, 35285.0, 72605.0, 188407.0, 406711.0, 155979.0, 63079.0, 31560.0, 17650.0, 10146.0, 6196.0, 3836.0, 2480.0, 1725.0, 1072.0, 728.0, 461.0, 369.0, 204.0, 176.0, 132.0, 80.0, 54.0, 53.0, 36.0, 17.0, 20.0, 9.0, 12.0, 6.0, 5.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.4365234375, -1.3907928466796875, -1.345062255859375, -1.2993316650390625, -1.25360107421875, -1.2078704833984375, -1.162139892578125, -1.1164093017578125, -1.0706787109375, -1.0249481201171875, -0.979217529296875, -0.9334869384765625, -0.88775634765625, -0.8420257568359375, -0.796295166015625, -0.7505645751953125, -0.704833984375, -0.6591033935546875, -0.613372802734375, -0.5676422119140625, -0.52191162109375, -0.4761810302734375, -0.430450439453125, -0.3847198486328125, -0.3389892578125, -0.2932586669921875, -0.247528076171875, -0.2017974853515625, -0.15606689453125, -0.1103363037109375, -0.064605712890625, -0.0188751220703125, 0.02685546875, 0.0725860595703125, 0.118316650390625, 0.1640472412109375, 0.20977783203125, 0.2555084228515625, 0.301239013671875, 0.3469696044921875, 0.3927001953125, 0.4384307861328125, 0.484161376953125, 0.5298919677734375, 0.57562255859375, 0.6213531494140625, 0.667083740234375, 0.7128143310546875, 0.758544921875, 0.8042755126953125, 0.850006103515625, 0.8957366943359375, 0.94146728515625, 0.9871978759765625, 1.032928466796875, 1.0786590576171875, 1.1243896484375, 1.1701202392578125, 1.215850830078125, 1.2615814208984375, 1.30731201171875, 1.3530426025390625, 1.398773193359375, 1.4445037841796875, 1.490234375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 5.0, 10.0, 10.0, 9.0, 13.0, 9.0, 17.0, 16.0, 25.0, 25.0, 42.0, 25.0, 31.0, 35.0, 46.0, 62.0, 75.0, 75.0, 245.0, 1613.0, 147.0, 90.0, 54.0, 47.0, 39.0, 42.0, 34.0, 25.0, 26.0, 29.0, 17.0, 20.0, 17.0, 17.0, 11.0, 9.0, 9.0, 7.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-7.8671875, -7.6383056640625, -7.409423828125, -7.1805419921875, -6.95166015625, -6.7227783203125, -6.493896484375, -6.2650146484375, -6.0361328125, -5.8072509765625, -5.578369140625, -5.3494873046875, -5.12060546875, -4.8917236328125, -4.662841796875, -4.4339599609375, -4.205078125, -3.9761962890625, -3.747314453125, -3.5184326171875, -3.28955078125, -3.0606689453125, -2.831787109375, -2.6029052734375, -2.3740234375, -2.1451416015625, -1.916259765625, -1.6873779296875, -1.45849609375, -1.2296142578125, -1.000732421875, -0.7718505859375, -0.54296875, -0.3140869140625, -0.085205078125, 0.1436767578125, 0.37255859375, 0.6014404296875, 0.830322265625, 1.0592041015625, 1.2880859375, 1.5169677734375, 1.745849609375, 1.9747314453125, 2.20361328125, 2.4324951171875, 2.661376953125, 2.8902587890625, 3.119140625, 3.3480224609375, 3.576904296875, 3.8057861328125, 4.03466796875, 4.2635498046875, 4.492431640625, 4.7213134765625, 4.9501953125, 5.1790771484375, 5.407958984375, 5.6368408203125, 5.86572265625, 6.0946044921875, 6.323486328125, 6.5523681640625, 6.78125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 11.0, 12.0, 9.0, 19.0, 11.0, 20.0, 22.0, 34.0, 37.0, 54.0, 69.0, 127.0, 167.0, 320.0, 607.0, 1645.0, 8426.0, 102324.0, 2909526.0, 110297.0, 8679.0, 1686.0, 623.0, 361.0, 186.0, 106.0, 68.0, 49.0, 49.0, 31.0, 23.0, 15.0, 15.0, 11.0, 11.0, 9.0, 11.0, 9.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-10.3125, -9.9852294921875, -9.657958984375, -9.3306884765625, -9.00341796875, -8.6761474609375, -8.348876953125, -8.0216064453125, -7.6943359375, -7.3670654296875, -7.039794921875, -6.7125244140625, -6.38525390625, -6.0579833984375, -5.730712890625, -5.4034423828125, -5.076171875, -4.7489013671875, -4.421630859375, -4.0943603515625, -3.76708984375, -3.4398193359375, -3.112548828125, -2.7852783203125, -2.4580078125, -2.1307373046875, -1.803466796875, -1.4761962890625, -1.14892578125, -0.8216552734375, -0.494384765625, -0.1671142578125, 0.16015625, 0.4874267578125, 0.814697265625, 1.1419677734375, 1.46923828125, 1.7965087890625, 2.123779296875, 2.4510498046875, 2.7783203125, 3.1055908203125, 3.432861328125, 3.7601318359375, 4.08740234375, 4.4146728515625, 4.741943359375, 5.0692138671875, 5.396484375, 5.7237548828125, 6.051025390625, 6.3782958984375, 6.70556640625, 7.0328369140625, 7.360107421875, 7.6873779296875, 8.0146484375, 8.3419189453125, 8.669189453125, 8.9964599609375, 9.32373046875, 9.6510009765625, 9.978271484375, 10.3055419921875, 10.6328125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [104.0, 905.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9601569175720215, -1.7863740921020508, 3.38740873336792, 8.56119155883789, 13.734973907470703, 18.908756256103516, 24.08254051208496, 29.256322860717773, 34.43010711669922, 39.60388946533203, 44.777671813964844, 49.951454162597656, 55.12523651123047, 60.29901885986328, 65.47280883789062, 70.64659118652344, 75.82036590576172, 80.99414825439453, 86.16793060302734, 91.34171295166016, 96.51549530029297, 101.68927764892578, 106.86306762695312, 112.03684997558594, 117.21063232421875, 122.38441467285156, 127.55819702148438, 132.7319793701172, 137.90576171875, 143.0795440673828, 148.25332641601562, 153.42710876464844, 158.6009063720703, 163.77468872070312, 168.94847106933594, 174.12225341796875, 179.29603576660156, 184.46981811523438, 189.6436004638672, 194.8173828125, 199.9911651611328, 205.16494750976562, 210.33872985839844, 215.51251220703125, 220.68629455566406, 225.86007690429688, 231.0338592529297, 236.2076416015625, 241.38143920898438, 246.5552215576172, 251.72900390625, 256.9028015136719, 262.0765686035156, 267.2503662109375, 272.42413330078125, 277.5979309082031, 282.7716979980469, 287.94549560546875, 293.1192626953125, 298.2930603027344, 303.4668273925781, 308.640625, 313.81439208984375, 318.9881896972656, 324.1619567871094]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 8.0, 14.0, 11.0, 20.0, 11.0, 23.0, 24.0, 19.0, 30.0, 32.0, 37.0, 37.0, 45.0, 35.0, 45.0, 28.0, 51.0, 45.0, 43.0, 43.0, 37.0, 36.0, 35.0, 48.0, 38.0, 30.0, 26.0, 37.0, 18.0, 16.0, 8.0, 14.0, 11.0, 11.0, 6.0, 5.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-30.54470443725586, -29.739673614501953, -28.934642791748047, -28.12961196899414, -27.324583053588867, -26.51955223083496, -25.714521408081055, -24.90949058532715, -24.104461669921875, -23.29943084716797, -22.494400024414062, -21.689369201660156, -20.884340286254883, -20.079309463500977, -19.27427864074707, -18.469247817993164, -17.664216995239258, -16.85918617248535, -16.054155349731445, -15.249125480651855, -14.444095611572266, -13.63906478881836, -12.834033966064453, -12.029003143310547, -11.223973274230957, -10.41894245147705, -9.613912582397461, -8.808881759643555, -8.003850936889648, -7.198821067810059, -6.393790245056152, -5.588759899139404, -4.783731460571289, -3.978701114654541, -3.173670530319214, -2.3686399459838867, -1.5636096000671387, -0.7585792541503906, 0.046451568603515625, 0.8514819145202637, 1.6565122604370117, 2.4615426063537598, 3.266573190689087, 4.071603775024414, 4.876634120941162, 5.68166446685791, 6.486695289611816, 7.2917256355285645, 8.096755981445312, 8.901786804199219, 9.706816673278809, 10.511847496032715, 11.316877365112305, 12.121908187866211, 12.926939010620117, 13.731969833374023, 14.536999702453613, 15.34203052520752, 16.14706039428711, 16.952091217041016, 17.757122039794922, 18.562152862548828, 19.367183685302734, 20.172212600708008, 20.977243423461914]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 1.0, 10.0, 14.0, 13.0, 12.0, 9.0, 18.0, 26.0, 22.0, 31.0, 26.0, 46.0, 53.0, 47.0, 46.0, 36.0, 56.0, 51.0, 64.0, 36.0, 46.0, 48.0, 39.0, 52.0, 37.0, 32.0, 26.0, 15.0, 13.0, 23.0, 15.0, 9.0, 4.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.646484375, -2.569000244140625, -2.49151611328125, -2.414031982421875, -2.3365478515625, -2.259063720703125, -2.18157958984375, -2.104095458984375, -2.026611328125, -1.949127197265625, -1.87164306640625, -1.794158935546875, -1.7166748046875, -1.639190673828125, -1.56170654296875, -1.484222412109375, -1.40673828125, -1.329254150390625, -1.25177001953125, -1.174285888671875, -1.0968017578125, -1.019317626953125, -0.94183349609375, -0.864349365234375, -0.786865234375, -0.709381103515625, -0.63189697265625, -0.554412841796875, -0.4769287109375, -0.399444580078125, -0.32196044921875, -0.244476318359375, -0.1669921875, -0.089508056640625, -0.01202392578125, 0.065460205078125, 0.1429443359375, 0.220428466796875, 0.29791259765625, 0.375396728515625, 0.452880859375, 0.530364990234375, 0.60784912109375, 0.685333251953125, 0.7628173828125, 0.840301513671875, 0.91778564453125, 0.995269775390625, 1.07275390625, 1.150238037109375, 1.22772216796875, 1.305206298828125, 1.3826904296875, 1.460174560546875, 1.53765869140625, 1.615142822265625, 1.692626953125, 1.770111083984375, 1.84759521484375, 1.925079345703125, 2.0025634765625, 2.080047607421875, 2.15753173828125, 2.235015869140625, 2.3125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 4.0, 5.0, 9.0, 11.0, 9.0, 11.0, 19.0, 16.0, 24.0, 23.0, 37.0, 78.0, 119.0, 228.0, 552.0, 1451.0, 4559.0, 16578.0, 70848.0, 463659.0, 2806713.0, 705475.0, 93968.0, 21088.0, 5619.0, 1841.0, 644.0, 296.0, 121.0, 77.0, 50.0, 41.0, 23.0, 14.0, 20.0, 13.0, 8.0, 12.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.44140625, -7.2322998046875, -7.023193359375, -6.8140869140625, -6.60498046875, -6.3958740234375, -6.186767578125, -5.9776611328125, -5.7685546875, -5.5594482421875, -5.350341796875, -5.1412353515625, -4.93212890625, -4.7230224609375, -4.513916015625, -4.3048095703125, -4.095703125, -3.8865966796875, -3.677490234375, -3.4683837890625, -3.25927734375, -3.0501708984375, -2.841064453125, -2.6319580078125, -2.4228515625, -2.2137451171875, -2.004638671875, -1.7955322265625, -1.58642578125, -1.3773193359375, -1.168212890625, -0.9591064453125, -0.75, -0.5408935546875, -0.331787109375, -0.1226806640625, 0.08642578125, 0.2955322265625, 0.504638671875, 0.7137451171875, 0.9228515625, 1.1319580078125, 1.341064453125, 1.5501708984375, 1.75927734375, 1.9683837890625, 2.177490234375, 2.3865966796875, 2.595703125, 2.8048095703125, 3.013916015625, 3.2230224609375, 3.43212890625, 3.6412353515625, 3.850341796875, 4.0594482421875, 4.2685546875, 4.4776611328125, 4.686767578125, 4.8958740234375, 5.10498046875, 5.3140869140625, 5.523193359375, 5.7322998046875, 5.94140625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 10.0, 7.0, 21.0, 23.0, 64.0, 85.0, 157.0, 323.0, 562.0, 812.0, 760.0, 525.0, 333.0, 175.0, 93.0, 67.0, 28.0, 12.0, 10.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.75, -11.4044189453125, -11.058837890625, -10.7132568359375, -10.36767578125, -10.0220947265625, -9.676513671875, -9.3309326171875, -8.9853515625, -8.6397705078125, -8.294189453125, -7.9486083984375, -7.60302734375, -7.2574462890625, -6.911865234375, -6.5662841796875, -6.220703125, -5.8751220703125, -5.529541015625, -5.1839599609375, -4.83837890625, -4.4927978515625, -4.147216796875, -3.8016357421875, -3.4560546875, -3.1104736328125, -2.764892578125, -2.4193115234375, -2.07373046875, -1.7281494140625, -1.382568359375, -1.0369873046875, -0.69140625, -0.3458251953125, -0.000244140625, 0.3453369140625, 0.69091796875, 1.0364990234375, 1.382080078125, 1.7276611328125, 2.0732421875, 2.4188232421875, 2.764404296875, 3.1099853515625, 3.45556640625, 3.8011474609375, 4.146728515625, 4.4923095703125, 4.837890625, 5.1834716796875, 5.529052734375, 5.8746337890625, 6.22021484375, 6.5657958984375, 6.911376953125, 7.2569580078125, 7.6025390625, 7.9481201171875, 8.293701171875, 8.6392822265625, 8.98486328125, 9.3304443359375, 9.676025390625, 10.0216064453125, 10.3671875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 12.0, 25.0, 27.0, 50.0, 86.0, 129.0, 218.0, 364.0, 592.0, 1297.0, 4021.0, 22211.0, 254842.0, 3208463.0, 647882.0, 44151.0, 6320.0, 1728.0, 792.0, 426.0, 244.0, 138.0, 98.0, 63.0, 34.0, 25.0, 20.0, 8.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.515625, -15.0255126953125, -14.535400390625, -14.0452880859375, -13.55517578125, -13.0650634765625, -12.574951171875, -12.0848388671875, -11.5947265625, -11.1046142578125, -10.614501953125, -10.1243896484375, -9.63427734375, -9.1441650390625, -8.654052734375, -8.1639404296875, -7.673828125, -7.1837158203125, -6.693603515625, -6.2034912109375, -5.71337890625, -5.2232666015625, -4.733154296875, -4.2430419921875, -3.7529296875, -3.2628173828125, -2.772705078125, -2.2825927734375, -1.79248046875, -1.3023681640625, -0.812255859375, -0.3221435546875, 0.16796875, 0.6580810546875, 1.148193359375, 1.6383056640625, 2.12841796875, 2.6185302734375, 3.108642578125, 3.5987548828125, 4.0888671875, 4.5789794921875, 5.069091796875, 5.5592041015625, 6.04931640625, 6.5394287109375, 7.029541015625, 7.5196533203125, 8.009765625, 8.4998779296875, 8.989990234375, 9.4801025390625, 9.97021484375, 10.4603271484375, 10.950439453125, 11.4405517578125, 11.9306640625, 12.4207763671875, 12.910888671875, 13.4010009765625, 13.89111328125, 14.3812255859375, 14.871337890625, 15.3614501953125, 15.8515625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 10.0, 30.0, 60.0, 86.0, 164.0, 177.0, 179.0, 136.0, 92.0, 43.0, 24.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.16366958618164, -41.268028259277344, -39.37238693237305, -37.47674560546875, -35.58110809326172, -33.68546676635742, -31.789825439453125, -29.894184112548828, -27.998544692993164, -26.102903366088867, -24.207263946533203, -22.311622619628906, -20.41598129272461, -18.520341873168945, -16.62470054626465, -14.729060173034668, -12.833419799804688, -10.937779426574707, -9.042139053344727, -7.14649772644043, -5.250857353210449, -3.3552169799804688, -1.4595756530761719, 0.4360647201538086, 2.331705093383789, 4.2273454666137695, 6.122986316680908, 8.018627166748047, 9.914267539978027, 11.809907913208008, 13.705549240112305, 15.601189613342285, 17.496826171875, 19.392467498779297, 21.28810691833496, 23.183748245239258, 25.079387664794922, 26.97502899169922, 28.870670318603516, 30.766311645507812, 32.661949157714844, 34.55759048461914, 36.45323181152344, 38.34886932373047, 40.244510650634766, 42.14015197753906, 44.03579330444336, 45.931434631347656, 47.82707595825195, 49.72271728515625, 51.61835861206055, 53.513999938964844, 55.409637451171875, 57.30527877807617, 59.20092010498047, 61.096561431884766, 62.99220275878906, 64.8878402709961, 66.78348541259766, 68.67912292480469, 70.57476806640625, 72.47040557861328, 74.36604309082031, 76.26168823242188, 78.1573257446289]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 5.0, 8.0, 10.0, 11.0, 8.0, 8.0, 16.0, 15.0, 12.0, 15.0, 26.0, 22.0, 25.0, 35.0, 27.0, 28.0, 37.0, 36.0, 30.0, 37.0, 40.0, 43.0, 33.0, 32.0, 41.0, 37.0, 42.0, 31.0, 33.0, 28.0, 31.0, 33.0, 22.0, 20.0, 15.0, 24.0, 18.0, 6.0, 8.0, 15.0, 9.0, 7.0, 4.0, 3.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-20.6429443359375, -20.021011352539062, -19.399080276489258, -18.77714729309082, -18.155216217041016, -17.533283233642578, -16.91135025024414, -16.289417266845703, -15.667486190795898, -15.045554161071777, -14.423622131347656, -13.801689147949219, -13.179757118225098, -12.557825088500977, -11.935892105102539, -11.313960075378418, -10.692028045654297, -10.070096015930176, -9.448163986206055, -8.826231002807617, -8.204298973083496, -7.582366943359375, -6.960434436798096, -6.338501930236816, -5.716569900512695, -5.094637870788574, -4.472705364227295, -3.8507730960845947, -3.2288408279418945, -2.6069085597991943, -1.9849762916564941, -1.3630437850952148, -0.7411117553710938, -0.11917948722839355, 0.5027527809143066, 1.1246850490570068, 1.746617317199707, 2.3685495853424072, 2.9904818534851074, 3.6124143600463867, 4.234346389770508, 4.856278419494629, 5.478210926055908, 6.1001434326171875, 6.722075462341309, 7.34400749206543, 7.965939998626709, 8.587872505187988, 9.20980453491211, 9.83173656463623, 10.453668594360352, 11.075601577758789, 11.69753360748291, 12.319465637207031, 12.941398620605469, 13.56333065032959, 14.185262680053711, 14.807194709777832, 15.429126739501953, 16.05105972290039, 16.672992706298828, 17.294923782348633, 17.91685676574707, 18.538787841796875, 19.160720825195312]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 3.0, 2.0, 10.0, 8.0, 7.0, 11.0, 12.0, 16.0, 18.0, 19.0, 10.0, 31.0, 30.0, 24.0, 27.0, 44.0, 39.0, 48.0, 38.0, 21.0, 42.0, 42.0, 54.0, 49.0, 44.0, 37.0, 44.0, 35.0, 31.0, 42.0, 30.0, 24.0, 20.0, 15.0, 20.0, 13.0, 10.0, 6.0, 6.0, 7.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.150390625, -2.081634521484375, -2.01287841796875, -1.944122314453125, -1.8753662109375, -1.806610107421875, -1.73785400390625, -1.669097900390625, -1.600341796875, -1.531585693359375, -1.46282958984375, -1.394073486328125, -1.3253173828125, -1.256561279296875, -1.18780517578125, -1.119049072265625, -1.05029296875, -0.981536865234375, -0.91278076171875, -0.844024658203125, -0.7752685546875, -0.706512451171875, -0.63775634765625, -0.569000244140625, -0.500244140625, -0.431488037109375, -0.36273193359375, -0.293975830078125, -0.2252197265625, -0.156463623046875, -0.08770751953125, -0.018951416015625, 0.0498046875, 0.118560791015625, 0.18731689453125, 0.256072998046875, 0.3248291015625, 0.393585205078125, 0.46234130859375, 0.531097412109375, 0.599853515625, 0.668609619140625, 0.73736572265625, 0.806121826171875, 0.8748779296875, 0.943634033203125, 1.01239013671875, 1.081146240234375, 1.14990234375, 1.218658447265625, 1.28741455078125, 1.356170654296875, 1.4249267578125, 1.493682861328125, 1.56243896484375, 1.631195068359375, 1.699951171875, 1.768707275390625, 1.83746337890625, 1.906219482421875, 1.9749755859375, 2.043731689453125, 2.11248779296875, 2.181243896484375, 2.25]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 11.0, 6.0, 17.0, 29.0, 30.0, 53.0, 89.0, 131.0, 176.0, 272.0, 434.0, 639.0, 892.0, 1519.0, 2163.0, 3397.0, 5334.0, 8162.0, 13161.0, 21160.0, 35024.0, 60665.0, 114177.0, 287264.0, 249123.0, 103140.0, 55213.0, 32581.0, 19742.0, 12276.0, 7662.0, 4870.0, 3100.0, 2091.0, 1320.0, 832.0, 609.0, 404.0, 250.0, 184.0, 118.0, 84.0, 47.0, 35.0, 21.0, 20.0, 15.0, 7.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.01360321044921875, -0.013190031051635742, -0.012776851654052734, -0.012363672256469727, -0.011950492858886719, -0.011537313461303711, -0.011124134063720703, -0.010710954666137695, -0.010297775268554688, -0.00988459587097168, -0.009471416473388672, -0.009058237075805664, -0.008645057678222656, -0.008231878280639648, -0.00781869888305664, -0.007405519485473633, -0.006992340087890625, -0.006579160690307617, -0.006165981292724609, -0.0057528018951416016, -0.005339622497558594, -0.004926443099975586, -0.004513263702392578, -0.00410008430480957, -0.0036869049072265625, -0.0032737255096435547, -0.002860546112060547, -0.002447366714477539, -0.0020341873168945312, -0.0016210079193115234, -0.0012078285217285156, -0.0007946491241455078, -0.0003814697265625, 3.170967102050781e-05, 0.0004448890686035156, 0.0008580684661865234, 0.0012712478637695312, 0.001684427261352539, 0.002097606658935547, 0.0025107860565185547, 0.0029239654541015625, 0.0033371448516845703, 0.003750324249267578, 0.004163503646850586, 0.004576683044433594, 0.0049898624420166016, 0.005403041839599609, 0.005816221237182617, 0.006229400634765625, 0.006642580032348633, 0.007055759429931641, 0.0074689388275146484, 0.007882118225097656, 0.008295297622680664, 0.008708477020263672, 0.00912165641784668, 0.009534835815429688, 0.009948015213012695, 0.010361194610595703, 0.010774374008178711, 0.011187553405761719, 0.011600732803344727, 0.012013912200927734, 0.012427091598510742, 0.01284027099609375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 10.0, 12.0, 9.0, 19.0, 13.0, 12.0, 30.0, 31.0, 26.0, 38.0, 44.0, 33.0, 46.0, 52.0, 52.0, 52.0, 1068.0, 46.0, 53.0, 42.0, 43.0, 27.0, 36.0, 35.0, 40.0, 28.0, 21.0, 19.0, 17.0, 19.0, 10.0, 9.0, 11.0, 3.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.77734375, -1.727081298828125, -1.67681884765625, -1.626556396484375, -1.5762939453125, -1.526031494140625, -1.47576904296875, -1.425506591796875, -1.375244140625, -1.324981689453125, -1.27471923828125, -1.224456787109375, -1.1741943359375, -1.123931884765625, -1.07366943359375, -1.023406982421875, -0.97314453125, -0.922882080078125, -0.87261962890625, -0.822357177734375, -0.7720947265625, -0.721832275390625, -0.67156982421875, -0.621307373046875, -0.571044921875, -0.520782470703125, -0.47052001953125, -0.420257568359375, -0.3699951171875, -0.319732666015625, -0.26947021484375, -0.219207763671875, -0.1689453125, -0.118682861328125, -0.06842041015625, -0.018157958984375, 0.0321044921875, 0.082366943359375, 0.13262939453125, 0.182891845703125, 0.233154296875, 0.283416748046875, 0.33367919921875, 0.383941650390625, 0.4342041015625, 0.484466552734375, 0.53472900390625, 0.584991455078125, 0.63525390625, 0.685516357421875, 0.73577880859375, 0.786041259765625, 0.8363037109375, 0.886566162109375, 0.93682861328125, 0.987091064453125, 1.037353515625, 1.087615966796875, 1.13787841796875, 1.188140869140625, 1.2384033203125, 1.288665771484375, 1.33892822265625, 1.389190673828125, 1.439453125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 7.0, 16.0, 12.0, 14.0, 27.0, 53.0, 85.0, 93.0, 164.0, 262.0, 428.0, 677.0, 1084.0, 1773.0, 2976.0, 4931.0, 8603.0, 14747.0, 26485.0, 47523.0, 90889.0, 219700.0, 1392243.0, 136007.0, 65163.0, 35399.0, 19828.0, 11322.0, 6542.0, 3903.0, 2375.0, 1383.0, 881.0, 532.0, 341.0, 220.0, 153.0, 103.0, 62.0, 44.0, 31.0, 16.0, 17.0, 4.0, 3.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00954437255859375, -0.009228944778442383, -0.008913516998291016, -0.008598089218139648, -0.008282661437988281, -0.007967233657836914, -0.007651805877685547, -0.00733637809753418, -0.0070209503173828125, -0.006705522537231445, -0.006390094757080078, -0.006074666976928711, -0.005759239196777344, -0.0054438114166259766, -0.005128383636474609, -0.004812955856323242, -0.004497528076171875, -0.004182100296020508, -0.0038666725158691406, -0.0035512447357177734, -0.0032358169555664062, -0.002920389175415039, -0.002604961395263672, -0.0022895336151123047, -0.0019741058349609375, -0.0016586780548095703, -0.0013432502746582031, -0.001027822494506836, -0.0007123947143554688, -0.00039696693420410156, -8.153915405273438e-05, 0.0002338886260986328, 0.00054931640625, 0.0008647441864013672, 0.0011801719665527344, 0.0014955997467041016, 0.0018110275268554688, 0.002126455307006836, 0.002441883087158203, 0.0027573108673095703, 0.0030727386474609375, 0.0033881664276123047, 0.003703594207763672, 0.004019021987915039, 0.004334449768066406, 0.0046498775482177734, 0.004965305328369141, 0.005280733108520508, 0.005596160888671875, 0.005911588668823242, 0.006227016448974609, 0.0065424442291259766, 0.006857872009277344, 0.007173299789428711, 0.007488727569580078, 0.007804155349731445, 0.008119583129882812, 0.00843501091003418, 0.008750438690185547, 0.009065866470336914, 0.009381294250488281, 0.009696722030639648, 0.010012149810791016, 0.010327577590942383, 0.01064300537109375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 973.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 25.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 19.0, 1.0, 0.0, 10.0, 1.0, 11.0, 0.0, 2.0, 38.0, 55.0, 0.0, 331.0, 2405.0, 11960.0, 0.0, 1018940.0, 11984.0, 2299.0, 0.0, 360.0, 61.0, 38.0, 0.0, 7.0, 4.0, 4.0, 0.0, 5.0, 5.0, 15.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0], "bins": [-1.430511474609375e-06, -1.385807991027832e-06, -1.341104507446289e-06, -1.296401023864746e-06, -1.2516975402832031e-06, -1.2069940567016602e-06, -1.1622905731201172e-06, -1.1175870895385742e-06, -1.0728836059570312e-06, -1.0281801223754883e-06, -9.834766387939453e-07, -9.387731552124023e-07, -8.940696716308594e-07, -8.493661880493164e-07, -8.046627044677734e-07, -7.599592208862305e-07, -7.152557373046875e-07, -6.705522537231445e-07, -6.258487701416016e-07, -5.811452865600586e-07, -5.364418029785156e-07, -4.917383193969727e-07, -4.470348358154297e-07, -4.023313522338867e-07, -3.5762786865234375e-07, -3.129243850708008e-07, -2.682209014892578e-07, -2.2351741790771484e-07, -1.7881393432617188e-07, -1.341104507446289e-07, -8.940696716308594e-08, -4.470348358154297e-08, 0.0, 4.470348358154297e-08, 8.940696716308594e-08, 1.341104507446289e-07, 1.7881393432617188e-07, 2.2351741790771484e-07, 2.682209014892578e-07, 3.129243850708008e-07, 3.5762786865234375e-07, 4.023313522338867e-07, 4.470348358154297e-07, 4.917383193969727e-07, 5.364418029785156e-07, 5.811452865600586e-07, 6.258487701416016e-07, 6.705522537231445e-07, 7.152557373046875e-07, 7.599592208862305e-07, 8.046627044677734e-07, 8.493661880493164e-07, 8.940696716308594e-07, 9.387731552124023e-07, 9.834766387939453e-07, 1.0281801223754883e-06, 1.0728836059570312e-06, 1.1175870895385742e-06, 1.1622905731201172e-06, 1.2069940567016602e-06, 1.2516975402832031e-06, 1.296401023864746e-06, 1.341104507446289e-06, 1.385807991027832e-06, 1.430511474609375e-06]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 3.0, 2.0, 10.0, 8.0, 7.0, 11.0, 12.0, 16.0, 18.0, 19.0, 10.0, 31.0, 30.0, 24.0, 27.0, 44.0, 39.0, 48.0, 38.0, 21.0, 42.0, 42.0, 54.0, 49.0, 44.0, 37.0, 44.0, 35.0, 31.0, 42.0, 30.0, 24.0, 20.0, 15.0, 20.0, 13.0, 10.0, 6.0, 6.0, 7.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.150390625, -2.081634521484375, -2.01287841796875, -1.944122314453125, -1.8753662109375, -1.806610107421875, -1.73785400390625, -1.669097900390625, -1.600341796875, -1.531585693359375, -1.46282958984375, -1.394073486328125, -1.3253173828125, -1.256561279296875, -1.18780517578125, -1.119049072265625, -1.05029296875, -0.981536865234375, -0.91278076171875, -0.844024658203125, -0.7752685546875, -0.706512451171875, -0.63775634765625, -0.569000244140625, -0.500244140625, -0.431488037109375, -0.36273193359375, -0.293975830078125, -0.2252197265625, -0.156463623046875, -0.08770751953125, -0.018951416015625, 0.0498046875, 0.118560791015625, 0.18731689453125, 0.256072998046875, 0.3248291015625, 0.393585205078125, 0.46234130859375, 0.531097412109375, 0.599853515625, 0.668609619140625, 0.73736572265625, 0.806121826171875, 0.8748779296875, 0.943634033203125, 1.01239013671875, 1.081146240234375, 1.14990234375, 1.218658447265625, 1.28741455078125, 1.356170654296875, 1.4249267578125, 1.493682861328125, 1.56243896484375, 1.631195068359375, 1.699951171875, 1.768707275390625, 1.83746337890625, 1.906219482421875, 1.9749755859375, 2.043731689453125, 2.11248779296875, 2.181243896484375, 2.25]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 1.0, 7.0, 5.0, 2.0, 8.0, 11.0, 19.0, 22.0, 28.0, 36.0, 52.0, 77.0, 137.0, 198.0, 309.0, 460.0, 776.0, 1189.0, 1900.0, 2964.0, 4951.0, 8050.0, 13456.0, 22749.0, 40406.0, 93820.0, 431212.0, 270642.0, 70898.0, 34187.0, 19676.0, 11696.0, 7033.0, 4289.0, 2631.0, 1732.0, 1056.0, 627.0, 396.0, 288.0, 173.0, 123.0, 87.0, 52.0, 32.0, 27.0, 21.0, 12.0, 11.0, 8.0, 6.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.068359375, -2.0013427734375, -1.934326171875, -1.8673095703125, -1.80029296875, -1.7332763671875, -1.666259765625, -1.5992431640625, -1.5322265625, -1.4652099609375, -1.398193359375, -1.3311767578125, -1.26416015625, -1.1971435546875, -1.130126953125, -1.0631103515625, -0.99609375, -0.9290771484375, -0.862060546875, -0.7950439453125, -0.72802734375, -0.6610107421875, -0.593994140625, -0.5269775390625, -0.4599609375, -0.3929443359375, -0.325927734375, -0.2589111328125, -0.19189453125, -0.1248779296875, -0.057861328125, 0.0091552734375, 0.076171875, 0.1431884765625, 0.210205078125, 0.2772216796875, 0.34423828125, 0.4112548828125, 0.478271484375, 0.5452880859375, 0.6123046875, 0.6793212890625, 0.746337890625, 0.8133544921875, 0.88037109375, 0.9473876953125, 1.014404296875, 1.0814208984375, 1.1484375, 1.2154541015625, 1.282470703125, 1.3494873046875, 1.41650390625, 1.4835205078125, 1.550537109375, 1.6175537109375, 1.6845703125, 1.7515869140625, 1.818603515625, 1.8856201171875, 1.95263671875, 2.0196533203125, 2.086669921875, 2.1536865234375, 2.220703125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 4.0, 5.0, 6.0, 7.0, 14.0, 13.0, 21.0, 19.0, 22.0, 24.0, 30.0, 32.0, 38.0, 39.0, 61.0, 45.0, 77.0, 116.0, 334.0, 1529.0, 141.0, 80.0, 50.0, 43.0, 41.0, 37.0, 36.0, 26.0, 18.0, 21.0, 25.0, 18.0, 13.0, 12.0, 7.0, 8.0, 8.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.7578125, -7.5159912109375, -7.274169921875, -7.0323486328125, -6.79052734375, -6.5487060546875, -6.306884765625, -6.0650634765625, -5.8232421875, -5.5814208984375, -5.339599609375, -5.0977783203125, -4.85595703125, -4.6141357421875, -4.372314453125, -4.1304931640625, -3.888671875, -3.6468505859375, -3.405029296875, -3.1632080078125, -2.92138671875, -2.6795654296875, -2.437744140625, -2.1959228515625, -1.9541015625, -1.7122802734375, -1.470458984375, -1.2286376953125, -0.98681640625, -0.7449951171875, -0.503173828125, -0.2613525390625, -0.01953125, 0.2222900390625, 0.464111328125, 0.7059326171875, 0.94775390625, 1.1895751953125, 1.431396484375, 1.6732177734375, 1.9150390625, 2.1568603515625, 2.398681640625, 2.6405029296875, 2.88232421875, 3.1241455078125, 3.365966796875, 3.6077880859375, 3.849609375, 4.0914306640625, 4.333251953125, 4.5750732421875, 4.81689453125, 5.0587158203125, 5.300537109375, 5.5423583984375, 5.7841796875, 6.0260009765625, 6.267822265625, 6.5096435546875, 6.75146484375, 6.9932861328125, 7.235107421875, 7.4769287109375, 7.71875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 4.0, 6.0, 8.0, 6.0, 7.0, 5.0, 14.0, 16.0, 19.0, 27.0, 26.0, 38.0, 52.0, 59.0, 91.0, 150.0, 204.0, 321.0, 1000.0, 3881.0, 32593.0, 2440153.0, 641860.0, 20605.0, 2784.0, 776.0, 345.0, 186.0, 124.0, 82.0, 64.0, 53.0, 39.0, 11.0, 27.0, 23.0, 12.0, 11.0, 4.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.96875, -11.60498046875, -11.2412109375, -10.87744140625, -10.513671875, -10.14990234375, -9.7861328125, -9.42236328125, -9.05859375, -8.69482421875, -8.3310546875, -7.96728515625, -7.603515625, -7.23974609375, -6.8759765625, -6.51220703125, -6.1484375, -5.78466796875, -5.4208984375, -5.05712890625, -4.693359375, -4.32958984375, -3.9658203125, -3.60205078125, -3.23828125, -2.87451171875, -2.5107421875, -2.14697265625, -1.783203125, -1.41943359375, -1.0556640625, -0.69189453125, -0.328125, 0.03564453125, 0.3994140625, 0.76318359375, 1.126953125, 1.49072265625, 1.8544921875, 2.21826171875, 2.58203125, 2.94580078125, 3.3095703125, 3.67333984375, 4.037109375, 4.40087890625, 4.7646484375, 5.12841796875, 5.4921875, 5.85595703125, 6.2197265625, 6.58349609375, 6.947265625, 7.31103515625, 7.6748046875, 8.03857421875, 8.40234375, 8.76611328125, 9.1298828125, 9.49365234375, 9.857421875, 10.22119140625, 10.5849609375, 10.94873046875, 11.3125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 248.0, 686.0, 76.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.660686492919922, -23.813861846923828, -20.967037200927734, -18.12021255493164, -15.27338695526123, -12.426562309265137, -9.579736709594727, -6.732912063598633, -3.886087417602539, -1.0392625331878662, 1.8075623512268066, 4.654387474060059, 7.501212120056152, 10.348036766052246, 13.194862365722656, 16.04168701171875, 18.888511657714844, 21.735336303710938, 24.58216094970703, 27.428985595703125, 30.27581024169922, 33.12263488769531, 35.969459533691406, 38.8162841796875, 41.663108825683594, 44.50993347167969, 47.35675811767578, 50.203582763671875, 53.05040740966797, 55.89723205566406, 58.744056701660156, 61.59088134765625, 64.43770599365234, 67.28453063964844, 70.13135528564453, 72.97817993164062, 75.82500457763672, 78.67182922363281, 81.5186538696289, 84.365478515625, 87.2123031616211, 90.05912780761719, 92.90595245361328, 95.75277709960938, 98.59960174560547, 101.44642639160156, 104.29325103759766, 107.14007568359375, 109.98690795898438, 112.83373260498047, 115.68055725097656, 118.52738189697266, 121.37420654296875, 124.22103118896484, 127.06785583496094, 129.91468811035156, 132.76150512695312, 135.60833740234375, 138.4551544189453, 141.30198669433594, 144.1488037109375, 146.99563598632812, 149.8424530029297, 152.6892852783203, 155.53610229492188]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 5.0, 7.0, 11.0, 7.0, 7.0, 22.0, 19.0, 21.0, 23.0, 25.0, 26.0, 22.0, 29.0, 43.0, 40.0, 37.0, 36.0, 39.0, 36.0, 44.0, 48.0, 38.0, 31.0, 43.0, 37.0, 35.0, 39.0, 30.0, 28.0, 20.0, 24.0, 20.0, 20.0, 13.0, 14.0, 12.0, 9.0, 10.0, 11.0, 7.0, 4.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.083560943603516, -23.362991333007812, -22.64242172241211, -21.921852111816406, -21.201282501220703, -20.480712890625, -19.760143280029297, -19.03957176208496, -18.319002151489258, -17.598432540893555, -16.87786293029785, -16.15729331970215, -15.436722755432129, -14.716153144836426, -13.995583534240723, -13.275012969970703, -12.554444313049316, -11.833874702453613, -11.11330509185791, -10.39273452758789, -9.672164916992188, -8.951595306396484, -8.231025695800781, -7.51045560836792, -6.789885997772217, -6.069316387176514, -5.348746299743652, -4.628176689147949, -3.907606840133667, -3.1870369911193848, -2.4664673805236816, -1.7458972930908203, -1.0253276824951172, -0.30475789308547974, 0.4158118963241577, 1.1363816261291504, 1.8569514751434326, 2.577521324157715, 3.298090934753418, 4.018661022186279, 4.739230632781982, 5.4598002433776855, 6.180370330810547, 6.90093994140625, 7.621509552001953, 8.342079162597656, 9.06264877319336, 9.783219337463379, 10.503788948059082, 11.224358558654785, 11.944928169250488, 12.665498733520508, 13.386068344116211, 14.106637954711914, 14.827207565307617, 15.54777717590332, 16.268346786499023, 16.988916397094727, 17.70948600769043, 18.430055618286133, 19.150625228881836, 19.871196746826172, 20.591766357421875, 21.312335968017578, 22.03290557861328]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 3.0, 6.0, 4.0, 13.0, 3.0, 8.0, 12.0, 18.0, 17.0, 17.0, 21.0, 25.0, 33.0, 30.0, 33.0, 35.0, 34.0, 45.0, 42.0, 30.0, 37.0, 42.0, 57.0, 47.0, 45.0, 36.0, 41.0, 43.0, 33.0, 32.0, 30.0, 18.0, 25.0, 19.0, 17.0, 11.0, 10.0, 8.0, 2.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.283203125, -2.212066650390625, -2.14093017578125, -2.069793701171875, -1.9986572265625, -1.927520751953125, -1.85638427734375, -1.785247802734375, -1.714111328125, -1.642974853515625, -1.57183837890625, -1.500701904296875, -1.4295654296875, -1.358428955078125, -1.28729248046875, -1.216156005859375, -1.14501953125, -1.073883056640625, -1.00274658203125, -0.931610107421875, -0.8604736328125, -0.789337158203125, -0.71820068359375, -0.647064208984375, -0.575927734375, -0.504791259765625, -0.43365478515625, -0.362518310546875, -0.2913818359375, -0.220245361328125, -0.14910888671875, -0.077972412109375, -0.0068359375, 0.064300537109375, 0.13543701171875, 0.206573486328125, 0.2777099609375, 0.348846435546875, 0.41998291015625, 0.491119384765625, 0.562255859375, 0.633392333984375, 0.70452880859375, 0.775665283203125, 0.8468017578125, 0.917938232421875, 0.98907470703125, 1.060211181640625, 1.13134765625, 1.202484130859375, 1.27362060546875, 1.344757080078125, 1.4158935546875, 1.487030029296875, 1.55816650390625, 1.629302978515625, 1.700439453125, 1.771575927734375, 1.84271240234375, 1.913848876953125, 1.9849853515625, 2.056121826171875, 2.12725830078125, 2.198394775390625, 2.26953125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 6.0, 9.0, 10.0, 20.0, 25.0, 51.0, 58.0, 95.0, 133.0, 223.0, 349.0, 530.0, 916.0, 1589.0, 2732.0, 5107.0, 9536.0, 18982.0, 39965.0, 90610.0, 237036.0, 766115.0, 1652928.0, 900227.0, 277134.0, 101578.0, 44403.0, 20862.0, 10279.0, 5528.0, 3022.0, 1629.0, 952.0, 582.0, 364.0, 230.0, 167.0, 88.0, 74.0, 44.0, 29.0, 22.0, 13.0, 11.0, 9.0, 7.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.470703125, -3.3673095703125, -3.263916015625, -3.1605224609375, -3.05712890625, -2.9537353515625, -2.850341796875, -2.7469482421875, -2.6435546875, -2.5401611328125, -2.436767578125, -2.3333740234375, -2.22998046875, -2.1265869140625, -2.023193359375, -1.9197998046875, -1.81640625, -1.7130126953125, -1.609619140625, -1.5062255859375, -1.40283203125, -1.2994384765625, -1.196044921875, -1.0926513671875, -0.9892578125, -0.8858642578125, -0.782470703125, -0.6790771484375, -0.57568359375, -0.4722900390625, -0.368896484375, -0.2655029296875, -0.162109375, -0.0587158203125, 0.044677734375, 0.1480712890625, 0.25146484375, 0.3548583984375, 0.458251953125, 0.5616455078125, 0.6650390625, 0.7684326171875, 0.871826171875, 0.9752197265625, 1.07861328125, 1.1820068359375, 1.285400390625, 1.3887939453125, 1.4921875, 1.5955810546875, 1.698974609375, 1.8023681640625, 1.90576171875, 2.0091552734375, 2.112548828125, 2.2159423828125, 2.3193359375, 2.4227294921875, 2.526123046875, 2.6295166015625, 2.73291015625, 2.8363037109375, 2.939697265625, 3.0430908203125, 3.146484375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 6.0, 9.0, 12.0, 13.0, 16.0, 13.0, 19.0, 40.0, 44.0, 72.0, 82.0, 95.0, 141.0, 219.0, 283.0, 327.0, 401.0, 439.0, 431.0, 329.0, 256.0, 216.0, 162.0, 112.0, 103.0, 73.0, 49.0, 30.0, 20.0, 16.0, 13.0, 10.0, 5.0, 5.0, 0.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.12890625, -6.9437255859375, -6.758544921875, -6.5733642578125, -6.38818359375, -6.2030029296875, -6.017822265625, -5.8326416015625, -5.6474609375, -5.4622802734375, -5.277099609375, -5.0919189453125, -4.90673828125, -4.7215576171875, -4.536376953125, -4.3511962890625, -4.166015625, -3.9808349609375, -3.795654296875, -3.6104736328125, -3.42529296875, -3.2401123046875, -3.054931640625, -2.8697509765625, -2.6845703125, -2.4993896484375, -2.314208984375, -2.1290283203125, -1.94384765625, -1.7586669921875, -1.573486328125, -1.3883056640625, -1.203125, -1.0179443359375, -0.832763671875, -0.6475830078125, -0.46240234375, -0.2772216796875, -0.092041015625, 0.0931396484375, 0.2783203125, 0.4635009765625, 0.648681640625, 0.8338623046875, 1.01904296875, 1.2042236328125, 1.389404296875, 1.5745849609375, 1.759765625, 1.9449462890625, 2.130126953125, 2.3153076171875, 2.50048828125, 2.6856689453125, 2.870849609375, 3.0560302734375, 3.2412109375, 3.4263916015625, 3.611572265625, 3.7967529296875, 3.98193359375, 4.1671142578125, 4.352294921875, 4.5374755859375, 4.72265625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 8.0, 20.0, 33.0, 33.0, 50.0, 80.0, 124.0, 234.0, 368.0, 691.0, 1566.0, 4511.0, 16015.0, 76422.0, 503492.0, 2668388.0, 780589.0, 110327.0, 21601.0, 5801.0, 1995.0, 814.0, 428.0, 251.0, 139.0, 92.0, 62.0, 44.0, 26.0, 19.0, 14.0, 7.0, 11.0, 4.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3359375, -8.0103759765625, -7.684814453125, -7.3592529296875, -7.03369140625, -6.7081298828125, -6.382568359375, -6.0570068359375, -5.7314453125, -5.4058837890625, -5.080322265625, -4.7547607421875, -4.42919921875, -4.1036376953125, -3.778076171875, -3.4525146484375, -3.126953125, -2.8013916015625, -2.475830078125, -2.1502685546875, -1.82470703125, -1.4991455078125, -1.173583984375, -0.8480224609375, -0.5224609375, -0.1968994140625, 0.128662109375, 0.4542236328125, 0.77978515625, 1.1053466796875, 1.430908203125, 1.7564697265625, 2.08203125, 2.4075927734375, 2.733154296875, 3.0587158203125, 3.38427734375, 3.7098388671875, 4.035400390625, 4.3609619140625, 4.6865234375, 5.0120849609375, 5.337646484375, 5.6632080078125, 5.98876953125, 6.3143310546875, 6.639892578125, 6.9654541015625, 7.291015625, 7.6165771484375, 7.942138671875, 8.2677001953125, 8.59326171875, 8.9188232421875, 9.244384765625, 9.5699462890625, 9.8955078125, 10.2210693359375, 10.546630859375, 10.8721923828125, 11.19775390625, 11.5233154296875, 11.848876953125, 12.1744384765625, 12.5]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 9.0, 24.0, 37.0, 75.0, 111.0, 144.0, 173.0, 141.0, 122.0, 79.0, 58.0, 24.0, 10.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.887874603271484, -43.20592498779297, -41.52397537231445, -39.84202575683594, -38.16007995605469, -36.478126525878906, -34.796180725097656, -33.11423110961914, -31.432281494140625, -29.75033187866211, -28.068382263183594, -26.38643455505371, -24.704484939575195, -23.02253532409668, -21.340587615966797, -19.65863800048828, -17.976688385009766, -16.29473876953125, -14.61279010772705, -12.930841445922852, -11.248891830444336, -9.56694221496582, -7.884993553161621, -6.203044891357422, -4.521095275878906, -2.839146137237549, -1.1571969985961914, 0.524752140045166, 2.2067012786865234, 3.888650894165039, 5.570599555969238, 7.2525482177734375, 8.934494018554688, 10.616443634033203, 12.298392295837402, 13.980340957641602, 15.662290573120117, 17.344240188598633, 19.026187896728516, 20.70813751220703, 22.390087127685547, 24.072036743164062, 25.753986358642578, 27.43593406677246, 29.117883682250977, 30.799833297729492, 32.481781005859375, 34.16373062133789, 35.845680236816406, 37.52762985229492, 39.20957946777344, 40.89152908325195, 42.57347869873047, 44.25542449951172, 45.937374114990234, 47.61932373046875, 49.301273345947266, 50.98322296142578, 52.6651725769043, 54.34712219238281, 56.02906799316406, 57.711021423339844, 59.392967224121094, 61.07491683959961, 62.756866455078125]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 3.0, 9.0, 4.0, 8.0, 7.0, 9.0, 14.0, 11.0, 16.0, 23.0, 22.0, 27.0, 32.0, 30.0, 24.0, 31.0, 46.0, 36.0, 52.0, 35.0, 54.0, 38.0, 45.0, 41.0, 42.0, 33.0, 33.0, 26.0, 33.0, 29.0, 20.0, 21.0, 23.0, 24.0, 23.0, 17.0, 14.0, 10.0, 7.0, 7.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.47724151611328, -19.817333221435547, -19.15742301940918, -18.497514724731445, -17.837604522705078, -17.177696228027344, -16.517786026000977, -15.857877731323242, -15.197968482971191, -14.53805923461914, -13.87814998626709, -13.218240737915039, -12.558332443237305, -11.898422241210938, -11.238513946533203, -10.578604698181152, -9.918695449829102, -9.25878620147705, -8.598876953125, -7.938968181610107, -7.279058933258057, -6.619149684906006, -5.959240913391113, -5.2993316650390625, -4.639422416687012, -3.979513168334961, -3.3196041584014893, -2.6596951484680176, -1.9997859001159668, -1.339876651763916, -0.6799676418304443, -0.020058631896972656, 0.6398506164550781, 1.2997597455978394, 1.9596688747406006, 2.6195778846740723, 3.279487133026123, 3.939396381378174, 4.599305152893066, 5.259214401245117, 5.919123649597168, 6.579032897949219, 7.2389421463012695, 7.898850917816162, 8.558759689331055, 9.218669891357422, 9.878578186035156, 10.538487434387207, 11.198396682739258, 11.858305931091309, 12.51821517944336, 13.17812442779541, 13.838033676147461, 14.497941970825195, 15.157851219177246, 15.817760467529297, 16.47766876220703, 17.137577056884766, 17.797487258911133, 18.457395553588867, 19.117305755615234, 19.77721405029297, 20.437124252319336, 21.09703254699707, 21.756942749023438]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 6.0, 4.0, 7.0, 3.0, 6.0, 4.0, 11.0, 7.0, 16.0, 17.0, 15.0, 13.0, 16.0, 36.0, 30.0, 39.0, 28.0, 28.0, 34.0, 42.0, 39.0, 55.0, 38.0, 40.0, 50.0, 34.0, 45.0, 33.0, 39.0, 37.0, 19.0, 26.0, 32.0, 23.0, 20.0, 32.0, 18.0, 12.0, 11.0, 12.0, 9.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0078125, -1.939056396484375, -1.87030029296875, -1.801544189453125, -1.7327880859375, -1.664031982421875, -1.59527587890625, -1.526519775390625, -1.457763671875, -1.389007568359375, -1.32025146484375, -1.251495361328125, -1.1827392578125, -1.113983154296875, -1.04522705078125, -0.976470947265625, -0.90771484375, -0.838958740234375, -0.77020263671875, -0.701446533203125, -0.6326904296875, -0.563934326171875, -0.49517822265625, -0.426422119140625, -0.357666015625, -0.288909912109375, -0.22015380859375, -0.151397705078125, -0.0826416015625, -0.013885498046875, 0.05487060546875, 0.123626708984375, 0.1923828125, 0.261138916015625, 0.32989501953125, 0.398651123046875, 0.4674072265625, 0.536163330078125, 0.60491943359375, 0.673675537109375, 0.742431640625, 0.811187744140625, 0.87994384765625, 0.948699951171875, 1.0174560546875, 1.086212158203125, 1.15496826171875, 1.223724365234375, 1.29248046875, 1.361236572265625, 1.42999267578125, 1.498748779296875, 1.5675048828125, 1.636260986328125, 1.70501708984375, 1.773773193359375, 1.842529296875, 1.911285400390625, 1.98004150390625, 2.048797607421875, 2.1175537109375, 2.186309814453125, 2.25506591796875, 2.323822021484375, 2.392578125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 3.0, 14.0, 23.0, 26.0, 35.0, 74.0, 102.0, 169.0, 252.0, 375.0, 540.0, 780.0, 1087.0, 1770.0, 2730.0, 4116.0, 6308.0, 10217.0, 16300.0, 26546.0, 44655.0, 78352.0, 164455.0, 350468.0, 152501.0, 74824.0, 42920.0, 25356.0, 15864.0, 9933.0, 6132.0, 3985.0, 2572.0, 1700.0, 1046.0, 736.0, 492.0, 399.0, 243.0, 166.0, 106.0, 61.0, 31.0, 34.0, 19.0, 15.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.013885498046875, -0.01348257064819336, -0.013079643249511719, -0.012676715850830078, -0.012273788452148438, -0.011870861053466797, -0.011467933654785156, -0.011065006256103516, -0.010662078857421875, -0.010259151458740234, -0.009856224060058594, -0.009453296661376953, -0.009050369262695312, -0.008647441864013672, -0.008244514465332031, -0.00784158706665039, -0.00743865966796875, -0.007035732269287109, -0.006632804870605469, -0.006229877471923828, -0.0058269500732421875, -0.005424022674560547, -0.005021095275878906, -0.004618167877197266, -0.004215240478515625, -0.0038123130798339844, -0.0034093856811523438, -0.003006458282470703, -0.0026035308837890625, -0.002200603485107422, -0.0017976760864257812, -0.0013947486877441406, -0.0009918212890625, -0.0005888938903808594, -0.00018596649169921875, 0.00021696090698242188, 0.0006198883056640625, 0.0010228157043457031, 0.0014257431030273438, 0.0018286705017089844, 0.002231597900390625, 0.0026345252990722656, 0.0030374526977539062, 0.003440380096435547, 0.0038433074951171875, 0.004246234893798828, 0.004649162292480469, 0.005052089691162109, 0.00545501708984375, 0.005857944488525391, 0.006260871887207031, 0.006663799285888672, 0.0070667266845703125, 0.007469654083251953, 0.007872581481933594, 0.008275508880615234, 0.008678436279296875, 0.009081363677978516, 0.009484291076660156, 0.009887218475341797, 0.010290145874023438, 0.010693073272705078, 0.011096000671386719, 0.01149892807006836, 0.01190185546875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 5.0, 4.0, 5.0, 10.0, 11.0, 12.0, 15.0, 12.0, 22.0, 20.0, 22.0, 23.0, 29.0, 24.0, 31.0, 37.0, 35.0, 38.0, 30.0, 35.0, 49.0, 1077.0, 42.0, 39.0, 31.0, 32.0, 39.0, 28.0, 26.0, 19.0, 42.0, 37.0, 26.0, 24.0, 15.0, 11.0, 10.0, 13.0, 13.0, 8.0, 9.0, 8.0, 4.0, 2.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.341796875, -1.29779052734375, -1.2537841796875, -1.20977783203125, -1.165771484375, -1.12176513671875, -1.0777587890625, -1.03375244140625, -0.98974609375, -0.94573974609375, -0.9017333984375, -0.85772705078125, -0.813720703125, -0.76971435546875, -0.7257080078125, -0.68170166015625, -0.6376953125, -0.59368896484375, -0.5496826171875, -0.50567626953125, -0.461669921875, -0.41766357421875, -0.3736572265625, -0.32965087890625, -0.28564453125, -0.24163818359375, -0.1976318359375, -0.15362548828125, -0.109619140625, -0.06561279296875, -0.0216064453125, 0.02239990234375, 0.06640625, 0.11041259765625, 0.1544189453125, 0.19842529296875, 0.242431640625, 0.28643798828125, 0.3304443359375, 0.37445068359375, 0.41845703125, 0.46246337890625, 0.5064697265625, 0.55047607421875, 0.594482421875, 0.63848876953125, 0.6824951171875, 0.72650146484375, 0.7705078125, 0.81451416015625, 0.8585205078125, 0.90252685546875, 0.946533203125, 0.99053955078125, 1.0345458984375, 1.07855224609375, 1.12255859375, 1.16656494140625, 1.2105712890625, 1.25457763671875, 1.298583984375, 1.34259033203125, 1.3865966796875, 1.43060302734375, 1.474609375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 6.0, 3.0, 17.0, 26.0, 28.0, 56.0, 75.0, 107.0, 174.0, 282.0, 409.0, 565.0, 1001.0, 1426.0, 2142.0, 3343.0, 5138.0, 7950.0, 12644.0, 19920.0, 31359.0, 50583.0, 85013.0, 170741.0, 1352403.0, 148008.0, 76716.0, 46739.0, 28977.0, 18179.0, 11692.0, 7619.0, 4697.0, 3112.0, 2041.0, 1295.0, 913.0, 555.0, 401.0, 247.0, 179.0, 118.0, 77.0, 49.0, 25.0, 35.0, 22.0, 5.0, 11.0, 4.0, 5.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.00872802734375, -0.008466839790344238, -0.008205652236938477, -0.007944464683532715, -0.007683277130126953, -0.007422089576721191, -0.00716090202331543, -0.006899714469909668, -0.006638526916503906, -0.0063773393630981445, -0.006116151809692383, -0.005854964256286621, -0.005593776702880859, -0.005332589149475098, -0.005071401596069336, -0.004810214042663574, -0.0045490264892578125, -0.004287838935852051, -0.004026651382446289, -0.0037654638290405273, -0.0035042762756347656, -0.003243088722229004, -0.002981901168823242, -0.0027207136154174805, -0.0024595260620117188, -0.002198338508605957, -0.0019371509552001953, -0.0016759634017944336, -0.0014147758483886719, -0.0011535882949829102, -0.0008924007415771484, -0.0006312131881713867, -0.000370025634765625, -0.00010883808135986328, 0.00015234947204589844, 0.00041353702545166016, 0.0006747245788574219, 0.0009359121322631836, 0.0011970996856689453, 0.001458287239074707, 0.0017194747924804688, 0.0019806623458862305, 0.002241849899291992, 0.002503037452697754, 0.0027642250061035156, 0.0030254125595092773, 0.003286600112915039, 0.0035477876663208008, 0.0038089752197265625, 0.004070162773132324, 0.004331350326538086, 0.004592537879943848, 0.004853725433349609, 0.005114912986755371, 0.005376100540161133, 0.0056372880935668945, 0.005898475646972656, 0.006159663200378418, 0.00642085075378418, 0.006682038307189941, 0.006943225860595703, 0.007204413414001465, 0.0074656009674072266, 0.007726788520812988, 0.00798797607421875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 968.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.0], "bins": [-1.1920928955078125e-07, -1.1641532182693481e-07, -1.1362135410308838e-07, -1.1082738637924194e-07, -1.0803341865539551e-07, -1.0523945093154907e-07, -1.0244548320770264e-07, -9.96515154838562e-08, -9.685754776000977e-08, -9.406358003616333e-08, -9.12696123123169e-08, -8.847564458847046e-08, -8.568167686462402e-08, -8.288770914077759e-08, -8.009374141693115e-08, -7.729977369308472e-08, -7.450580596923828e-08, -7.171183824539185e-08, -6.891787052154541e-08, -6.612390279769897e-08, -6.332993507385254e-08, -6.05359673500061e-08, -5.774199962615967e-08, -5.494803190231323e-08, -5.21540641784668e-08, -4.936009645462036e-08, -4.6566128730773926e-08, -4.377216100692749e-08, -4.0978193283081055e-08, -3.818422555923462e-08, -3.5390257835388184e-08, -3.259629011154175e-08, -2.9802322387695312e-08, -2.7008354663848877e-08, -2.421438694000244e-08, -2.1420419216156006e-08, -1.862645149230957e-08, -1.5832483768463135e-08, -1.30385160446167e-08, -1.0244548320770264e-08, -7.450580596923828e-09, -4.6566128730773926e-09, -1.862645149230957e-09, 9.313225746154785e-10, 3.725290298461914e-09, 6.51925802230835e-09, 9.313225746154785e-09, 1.210719347000122e-08, 1.4901161193847656e-08, 1.7695128917694092e-08, 2.0489096641540527e-08, 2.3283064365386963e-08, 2.60770320892334e-08, 2.8870999813079834e-08, 3.166496753692627e-08, 3.4458935260772705e-08, 3.725290298461914e-08, 4.0046870708465576e-08, 4.284083843231201e-08, 4.563480615615845e-08, 4.842877388000488e-08, 5.122274160385132e-08, 5.4016709327697754e-08, 5.681067705154419e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 17.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 7.0, 0.0, 46.0, 52.0, 0.0, 256.0, 2449.0, 0.0, 13420.0, 0.0, 1015763.0, 13756.0, 0.0, 2366.0, 274.0, 0.0, 63.0, 30.0, 0.0, 13.0, 0.0, 7.0, 2.0, 0.0, 0.0, 5.0, 0.0, 11.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0728836059570312e-06, -1.0346993803977966e-06, -9.96515154838562e-07, -9.583309292793274e-07, -9.201467037200928e-07, -8.819624781608582e-07, -8.437782526016235e-07, -8.055940270423889e-07, -7.674098014831543e-07, -7.292255759239197e-07, -6.910413503646851e-07, -6.528571248054504e-07, -6.146728992462158e-07, -5.764886736869812e-07, -5.383044481277466e-07, -5.00120222568512e-07, -4.6193599700927734e-07, -4.237517714500427e-07, -3.855675458908081e-07, -3.473833203315735e-07, -3.0919909477233887e-07, -2.7101486921310425e-07, -2.3283064365386963e-07, -1.94646418094635e-07, -1.564621925354004e-07, -1.1827796697616577e-07, -8.009374141693115e-08, -4.190951585769653e-08, -3.725290298461914e-09, 3.4458935260772705e-08, 7.264316082000732e-08, 1.1082738637924194e-07, 1.4901161193847656e-07, 1.8719583749771118e-07, 2.253800630569458e-07, 2.635642886161804e-07, 3.0174851417541504e-07, 3.3993273973464966e-07, 3.781169652938843e-07, 4.163011908531189e-07, 4.544854164123535e-07, 4.926696419715881e-07, 5.308538675308228e-07, 5.690380930900574e-07, 6.07222318649292e-07, 6.454065442085266e-07, 6.835907697677612e-07, 7.217749953269958e-07, 7.599592208862305e-07, 7.981434464454651e-07, 8.363276720046997e-07, 8.745118975639343e-07, 9.126961231231689e-07, 9.508803486824036e-07, 9.890645742416382e-07, 1.0272487998008728e-06, 1.0654330253601074e-06, 1.103617250919342e-06, 1.1418014764785767e-06, 1.1799857020378113e-06, 1.218169927597046e-06, 1.2563541531562805e-06, 1.2945383787155151e-06, 1.3327226042747498e-06, 1.3709068298339844e-06]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 6.0, 4.0, 7.0, 3.0, 6.0, 4.0, 11.0, 7.0, 16.0, 17.0, 15.0, 13.0, 16.0, 36.0, 30.0, 39.0, 28.0, 28.0, 34.0, 42.0, 39.0, 55.0, 38.0, 40.0, 50.0, 34.0, 45.0, 33.0, 39.0, 37.0, 19.0, 26.0, 32.0, 23.0, 20.0, 32.0, 18.0, 12.0, 11.0, 12.0, 9.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0078125, -1.939056396484375, -1.87030029296875, -1.801544189453125, -1.7327880859375, -1.664031982421875, -1.59527587890625, -1.526519775390625, -1.457763671875, -1.389007568359375, -1.32025146484375, -1.251495361328125, -1.1827392578125, -1.113983154296875, -1.04522705078125, -0.976470947265625, -0.90771484375, -0.838958740234375, -0.77020263671875, -0.701446533203125, -0.6326904296875, -0.563934326171875, -0.49517822265625, -0.426422119140625, -0.357666015625, -0.288909912109375, -0.22015380859375, -0.151397705078125, -0.0826416015625, -0.013885498046875, 0.05487060546875, 0.123626708984375, 0.1923828125, 0.261138916015625, 0.32989501953125, 0.398651123046875, 0.4674072265625, 0.536163330078125, 0.60491943359375, 0.673675537109375, 0.742431640625, 0.811187744140625, 0.87994384765625, 0.948699951171875, 1.0174560546875, 1.086212158203125, 1.15496826171875, 1.223724365234375, 1.29248046875, 1.361236572265625, 1.42999267578125, 1.498748779296875, 1.5675048828125, 1.636260986328125, 1.70501708984375, 1.773773193359375, 1.842529296875, 1.911285400390625, 1.98004150390625, 2.048797607421875, 2.1175537109375, 2.186309814453125, 2.25506591796875, 2.323822021484375, 2.392578125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 7.0, 1.0, 10.0, 13.0, 16.0, 26.0, 39.0, 45.0, 73.0, 75.0, 132.0, 183.0, 257.0, 334.0, 515.0, 732.0, 974.0, 1458.0, 2066.0, 2930.0, 4293.0, 6124.0, 9236.0, 14218.0, 23583.0, 49575.0, 144409.0, 479019.0, 177936.0, 57383.0, 26492.0, 15290.0, 9802.0, 6509.0, 4459.0, 3121.0, 2158.0, 1416.0, 1018.0, 733.0, 553.0, 396.0, 265.0, 213.0, 137.0, 111.0, 81.0, 51.0, 32.0, 15.0, 22.0, 14.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-2.0078125, -1.9461822509765625, -1.884552001953125, -1.8229217529296875, -1.76129150390625, -1.6996612548828125, -1.638031005859375, -1.5764007568359375, -1.5147705078125, -1.4531402587890625, -1.391510009765625, -1.3298797607421875, -1.26824951171875, -1.2066192626953125, -1.144989013671875, -1.0833587646484375, -1.021728515625, -0.9600982666015625, -0.898468017578125, -0.8368377685546875, -0.77520751953125, -0.7135772705078125, -0.651947021484375, -0.5903167724609375, -0.5286865234375, -0.4670562744140625, -0.405426025390625, -0.3437957763671875, -0.28216552734375, -0.2205352783203125, -0.158905029296875, -0.0972747802734375, -0.03564453125, 0.0259857177734375, 0.087615966796875, 0.1492462158203125, 0.21087646484375, 0.2725067138671875, 0.334136962890625, 0.3957672119140625, 0.4573974609375, 0.5190277099609375, 0.580657958984375, 0.6422882080078125, 0.70391845703125, 0.7655487060546875, 0.827178955078125, 0.8888092041015625, 0.950439453125, 1.0120697021484375, 1.073699951171875, 1.1353302001953125, 1.19696044921875, 1.2585906982421875, 1.320220947265625, 1.3818511962890625, 1.4434814453125, 1.5051116943359375, 1.566741943359375, 1.6283721923828125, 1.69000244140625, 1.7516326904296875, 1.813262939453125, 1.8748931884765625, 1.9365234375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 6.0, 6.0, 8.0, 6.0, 13.0, 16.0, 14.0, 16.0, 31.0, 18.0, 36.0, 31.0, 32.0, 44.0, 48.0, 77.0, 75.0, 142.0, 1680.0, 243.0, 93.0, 60.0, 48.0, 47.0, 38.0, 31.0, 39.0, 29.0, 19.0, 21.0, 16.0, 17.0, 14.0, 4.0, 7.0, 7.0, 8.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25, -7.9720458984375, -7.694091796875, -7.4161376953125, -7.13818359375, -6.8602294921875, -6.582275390625, -6.3043212890625, -6.0263671875, -5.7484130859375, -5.470458984375, -5.1925048828125, -4.91455078125, -4.6365966796875, -4.358642578125, -4.0806884765625, -3.802734375, -3.5247802734375, -3.246826171875, -2.9688720703125, -2.69091796875, -2.4129638671875, -2.135009765625, -1.8570556640625, -1.5791015625, -1.3011474609375, -1.023193359375, -0.7452392578125, -0.46728515625, -0.1893310546875, 0.088623046875, 0.3665771484375, 0.64453125, 0.9224853515625, 1.200439453125, 1.4783935546875, 1.75634765625, 2.0343017578125, 2.312255859375, 2.5902099609375, 2.8681640625, 3.1461181640625, 3.424072265625, 3.7020263671875, 3.97998046875, 4.2579345703125, 4.535888671875, 4.8138427734375, 5.091796875, 5.3697509765625, 5.647705078125, 5.9256591796875, 6.20361328125, 6.4815673828125, 6.759521484375, 7.0374755859375, 7.3154296875, 7.5933837890625, 7.871337890625, 8.1492919921875, 8.42724609375, 8.7052001953125, 8.983154296875, 9.2611083984375, 9.5390625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 9.0, 7.0, 16.0, 21.0, 18.0, 27.0, 21.0, 39.0, 60.0, 67.0, 114.0, 162.0, 222.0, 400.0, 1986.0, 29673.0, 3009534.0, 97732.0, 4067.0, 610.0, 258.0, 181.0, 109.0, 88.0, 72.0, 50.0, 27.0, 29.0, 25.0, 16.0, 19.0, 8.0, 3.0, 8.0, 11.0, 2.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.8125, -17.2984619140625, -16.784423828125, -16.2703857421875, -15.75634765625, -15.2423095703125, -14.728271484375, -14.2142333984375, -13.7001953125, -13.1861572265625, -12.672119140625, -12.1580810546875, -11.64404296875, -11.1300048828125, -10.615966796875, -10.1019287109375, -9.587890625, -9.0738525390625, -8.559814453125, -8.0457763671875, -7.53173828125, -7.0177001953125, -6.503662109375, -5.9896240234375, -5.4755859375, -4.9615478515625, -4.447509765625, -3.9334716796875, -3.41943359375, -2.9053955078125, -2.391357421875, -1.8773193359375, -1.36328125, -0.8492431640625, -0.335205078125, 0.1788330078125, 0.69287109375, 1.2069091796875, 1.720947265625, 2.2349853515625, 2.7490234375, 3.2630615234375, 3.777099609375, 4.2911376953125, 4.80517578125, 5.3192138671875, 5.833251953125, 6.3472900390625, 6.861328125, 7.3753662109375, 7.889404296875, 8.4034423828125, 8.91748046875, 9.4315185546875, 9.945556640625, 10.4595947265625, 10.9736328125, 11.4876708984375, 12.001708984375, 12.5157470703125, 13.02978515625, 13.5438232421875, 14.057861328125, 14.5718994140625, 15.0859375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 169.0, 677.0, 163.0], "bins": [-141.75186157226562, -139.48297119140625, -137.21408081054688, -134.94520568847656, -132.6763153076172, -130.4074249267578, -128.13853454589844, -125.8696517944336, -123.60076141357422, -121.33187103271484, -119.06298828125, -116.79409790039062, -114.52521514892578, -112.2563247680664, -109.98744201660156, -107.71855163574219, -105.44966125488281, -103.18077087402344, -100.9118881225586, -98.64299774169922, -96.37411499023438, -94.105224609375, -91.83633422851562, -89.56745147705078, -87.29856872558594, -85.02967834472656, -82.76079559326172, -80.49190521240234, -78.2230224609375, -75.95413208007812, -73.68524169921875, -71.4163589477539, -69.14747619628906, -66.87858581542969, -64.60970306396484, -62.34081268310547, -60.07192611694336, -57.80303955078125, -55.53415298461914, -53.26526641845703, -50.996376037597656, -48.72748947143555, -46.45860290527344, -44.18971252441406, -41.92082595825195, -39.651939392089844, -37.383052825927734, -35.114166259765625, -32.84527587890625, -30.57638931274414, -28.3075008392334, -26.03861427307129, -23.769725799560547, -21.500839233398438, -19.231952667236328, -16.96306610107422, -14.694177627563477, -12.42529010772705, -10.156402587890625, -7.887516021728516, -5.61862850189209, -3.349740982055664, -1.0808544158935547, 1.188033103942871, 3.4569203853607178]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 5.0, 6.0, 7.0, 12.0, 18.0, 12.0, 20.0, 20.0, 18.0, 24.0, 26.0, 36.0, 30.0, 46.0, 46.0, 37.0, 34.0, 57.0, 59.0, 43.0, 35.0, 35.0, 41.0, 41.0, 31.0, 35.0, 25.0, 32.0, 26.0, 23.0, 20.0, 24.0, 17.0, 10.0, 12.0, 13.0, 6.0, 2.0, 4.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.954151153564453, -18.2750301361084, -17.595909118652344, -16.91678810119629, -16.237667083740234, -15.55854606628418, -14.879426002502441, -14.200304985046387, -13.521183967590332, -12.842062950134277, -12.162941932678223, -11.483821868896484, -10.80470085144043, -10.125579833984375, -9.44645881652832, -8.767337799072266, -8.088216781616211, -7.409095764160156, -6.729974746704102, -6.050854206085205, -5.37173318862915, -4.692612171173096, -4.013491630554199, -3.3343706130981445, -2.65524959564209, -1.9761286973953247, -1.2970077991485596, -0.617887020111084, 0.0612339973449707, 0.7403550148010254, 1.4194755554199219, 2.0985965728759766, 2.777719497680664, 3.4568405151367188, 4.135961532592773, 4.81508207321167, 5.494203090667725, 6.173324108123779, 6.852444648742676, 7.5315656661987305, 8.210686683654785, 8.88980770111084, 9.568928718566895, 10.248048782348633, 10.927169799804688, 11.606290817260742, 12.285411834716797, 12.964532852172852, 13.643653869628906, 14.322774887084961, 15.001895904541016, 15.68101692199707, 16.360137939453125, 17.03925895690918, 17.718379974365234, 18.397499084472656, 19.076622009277344, 19.7557430267334, 20.434864044189453, 21.113985061645508, 21.793106079101562, 22.472227096557617, 23.151348114013672, 23.830467224121094, 24.50958824157715]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 2.0, 4.0, 5.0, 5.0, 4.0, 5.0, 6.0, 12.0, 7.0, 13.0, 20.0, 15.0, 22.0, 17.0, 23.0, 32.0, 34.0, 41.0, 27.0, 38.0, 43.0, 36.0, 34.0, 40.0, 52.0, 47.0, 39.0, 36.0, 43.0, 27.0, 32.0, 29.0, 24.0, 23.0, 38.0, 27.0, 16.0, 14.0, 19.0, 12.0, 17.0, 4.0, 4.0, 1.0, 4.0, 6.0, 1.0, 0.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1015625, -2.031890869140625, -1.96221923828125, -1.892547607421875, -1.8228759765625, -1.753204345703125, -1.68353271484375, -1.613861083984375, -1.544189453125, -1.474517822265625, -1.40484619140625, -1.335174560546875, -1.2655029296875, -1.195831298828125, -1.12615966796875, -1.056488037109375, -0.98681640625, -0.917144775390625, -0.84747314453125, -0.777801513671875, -0.7081298828125, -0.638458251953125, -0.56878662109375, -0.499114990234375, -0.429443359375, -0.359771728515625, -0.29010009765625, -0.220428466796875, -0.1507568359375, -0.081085205078125, -0.01141357421875, 0.058258056640625, 0.1279296875, 0.197601318359375, 0.26727294921875, 0.336944580078125, 0.4066162109375, 0.476287841796875, 0.54595947265625, 0.615631103515625, 0.685302734375, 0.754974365234375, 0.82464599609375, 0.894317626953125, 0.9639892578125, 1.033660888671875, 1.10333251953125, 1.173004150390625, 1.24267578125, 1.312347412109375, 1.38201904296875, 1.451690673828125, 1.5213623046875, 1.591033935546875, 1.66070556640625, 1.730377197265625, 1.800048828125, 1.869720458984375, 1.93939208984375, 2.009063720703125, 2.0787353515625, 2.148406982421875, 2.21807861328125, 2.287750244140625, 2.357421875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 4.0, 6.0, 5.0, 4.0, 6.0, 6.0, 10.0, 12.0, 11.0, 13.0, 18.0, 27.0, 26.0, 47.0, 57.0, 79.0, 125.0, 208.0, 376.0, 916.0, 2376.0, 8033.0, 35723.0, 243525.0, 2494000.0, 1262897.0, 116641.0, 20618.0, 5201.0, 1707.0, 686.0, 331.0, 178.0, 104.0, 80.0, 50.0, 39.0, 27.0, 23.0, 28.0, 16.0, 9.0, 3.0, 4.0, 5.0, 6.0, 4.0, 7.0, 2.0, 2.0, 2.0, 0.0, 4.0, 5.0, 0.0, 1.0, 2.0], "bins": [-7.7734375, -7.5291748046875, -7.284912109375, -7.0406494140625, -6.79638671875, -6.5521240234375, -6.307861328125, -6.0635986328125, -5.8193359375, -5.5750732421875, -5.330810546875, -5.0865478515625, -4.84228515625, -4.5980224609375, -4.353759765625, -4.1094970703125, -3.865234375, -3.6209716796875, -3.376708984375, -3.1324462890625, -2.88818359375, -2.6439208984375, -2.399658203125, -2.1553955078125, -1.9111328125, -1.6668701171875, -1.422607421875, -1.1783447265625, -0.93408203125, -0.6898193359375, -0.445556640625, -0.2012939453125, 0.04296875, 0.2872314453125, 0.531494140625, 0.7757568359375, 1.02001953125, 1.2642822265625, 1.508544921875, 1.7528076171875, 1.9970703125, 2.2413330078125, 2.485595703125, 2.7298583984375, 2.97412109375, 3.2183837890625, 3.462646484375, 3.7069091796875, 3.951171875, 4.1954345703125, 4.439697265625, 4.6839599609375, 4.92822265625, 5.1724853515625, 5.416748046875, 5.6610107421875, 5.9052734375, 6.1495361328125, 6.393798828125, 6.6380615234375, 6.88232421875, 7.1265869140625, 7.370849609375, 7.6151123046875, 7.859375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 4.0, 11.0, 18.0, 22.0, 33.0, 33.0, 50.0, 65.0, 90.0, 129.0, 171.0, 193.0, 264.0, 333.0, 449.0, 440.0, 383.0, 310.0, 261.0, 196.0, 157.0, 129.0, 90.0, 67.0, 47.0, 23.0, 28.0, 14.0, 12.0, 14.0, 6.0, 11.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.64453125, -6.46661376953125, -6.2886962890625, -6.11077880859375, -5.932861328125, -5.75494384765625, -5.5770263671875, -5.39910888671875, -5.22119140625, -5.04327392578125, -4.8653564453125, -4.68743896484375, -4.509521484375, -4.33160400390625, -4.1536865234375, -3.97576904296875, -3.7978515625, -3.61993408203125, -3.4420166015625, -3.26409912109375, -3.086181640625, -2.90826416015625, -2.7303466796875, -2.55242919921875, -2.37451171875, -2.19659423828125, -2.0186767578125, -1.84075927734375, -1.662841796875, -1.48492431640625, -1.3070068359375, -1.12908935546875, -0.951171875, -0.77325439453125, -0.5953369140625, -0.41741943359375, -0.239501953125, -0.06158447265625, 0.1163330078125, 0.29425048828125, 0.47216796875, 0.65008544921875, 0.8280029296875, 1.00592041015625, 1.183837890625, 1.36175537109375, 1.5396728515625, 1.71759033203125, 1.8955078125, 2.07342529296875, 2.2513427734375, 2.42926025390625, 2.607177734375, 2.78509521484375, 2.9630126953125, 3.14093017578125, 3.31884765625, 3.49676513671875, 3.6746826171875, 3.85260009765625, 4.030517578125, 4.20843505859375, 4.3863525390625, 4.56427001953125, 4.7421875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 1.0, 4.0, 6.0, 8.0, 20.0, 23.0, 35.0, 44.0, 57.0, 77.0, 111.0, 193.0, 282.0, 535.0, 1139.0, 4270.0, 31896.0, 426599.0, 3224666.0, 463204.0, 33963.0, 4647.0, 1139.0, 495.0, 267.0, 185.0, 114.0, 88.0, 58.0, 39.0, 35.0, 23.0, 14.0, 7.0, 9.0, 9.0, 4.0, 2.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6328125, -11.1768798828125, -10.720947265625, -10.2650146484375, -9.80908203125, -9.3531494140625, -8.897216796875, -8.4412841796875, -7.9853515625, -7.5294189453125, -7.073486328125, -6.6175537109375, -6.16162109375, -5.7056884765625, -5.249755859375, -4.7938232421875, -4.337890625, -3.8819580078125, -3.426025390625, -2.9700927734375, -2.51416015625, -2.0582275390625, -1.602294921875, -1.1463623046875, -0.6904296875, -0.2344970703125, 0.221435546875, 0.6773681640625, 1.13330078125, 1.5892333984375, 2.045166015625, 2.5010986328125, 2.95703125, 3.4129638671875, 3.868896484375, 4.3248291015625, 4.78076171875, 5.2366943359375, 5.692626953125, 6.1485595703125, 6.6044921875, 7.0604248046875, 7.516357421875, 7.9722900390625, 8.42822265625, 8.8841552734375, 9.340087890625, 9.7960205078125, 10.251953125, 10.7078857421875, 11.163818359375, 11.6197509765625, 12.07568359375, 12.5316162109375, 12.987548828125, 13.4434814453125, 13.8994140625, 14.3553466796875, 14.811279296875, 15.2672119140625, 15.72314453125, 16.1790771484375, 16.635009765625, 17.0909423828125, 17.546875]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [4.0, 4.0, 15.0, 31.0, 57.0, 68.0, 132.0, 166.0, 149.0, 144.0, 112.0, 80.0, 34.0, 15.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.939248085021973, -12.229952812194824, -10.520657539367676, -8.811361312866211, -7.102066516876221, -5.392770767211914, -3.6834754943847656, -1.9741802215576172, -0.26488494873046875, 1.4444104433059692, 3.1537058353424072, 4.863001346588135, 6.572296619415283, 8.28159236907959, 9.990887641906738, 11.700182914733887, 13.409478187561035, 15.118773460388184, 16.82806968688965, 18.537364959716797, 20.246660232543945, 21.955955505371094, 23.665250778198242, 25.37454605102539, 27.08384132385254, 28.793136596679688, 30.502431869506836, 32.211727142333984, 33.921024322509766, 35.63031768798828, 37.33961486816406, 39.04890823364258, 40.75820541381836, 42.46750259399414, 44.176795959472656, 45.88609313964844, 47.59538650512695, 49.304683685302734, 51.01397705078125, 52.72327423095703, 54.43256759643555, 56.14186477661133, 57.851158142089844, 59.560455322265625, 61.26974868774414, 62.97904586791992, 64.68833923339844, 66.39763641357422, 68.10693359375, 69.81623077392578, 71.52552795410156, 73.23481750488281, 74.9441146850586, 76.65341186523438, 78.36270904541016, 80.0719985961914, 81.78129577636719, 83.49059295654297, 85.19989013671875, 86.9091796875, 88.61847686767578, 90.32777404785156, 92.03707122802734, 93.7463607788086, 95.45565795898438]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 4.0, 4.0, 6.0, 3.0, 11.0, 9.0, 9.0, 16.0, 15.0, 20.0, 14.0, 23.0, 22.0, 22.0, 32.0, 25.0, 30.0, 43.0, 35.0, 42.0, 41.0, 52.0, 39.0, 41.0, 35.0, 39.0, 40.0, 43.0, 43.0, 37.0, 33.0, 24.0, 32.0, 18.0, 20.0, 12.0, 12.0, 9.0, 7.0, 13.0, 6.0, 9.0, 5.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.55908966064453, -16.9721622467041, -16.38523292541504, -15.79830551147461, -15.211377143859863, -14.624448776245117, -14.037521362304688, -13.450592994689941, -12.863664627075195, -12.27673625946045, -11.689807891845703, -11.102880477905273, -10.515952110290527, -9.929023742675781, -9.342096328735352, -8.755167961120605, -8.16823959350586, -7.581311225891113, -6.994383335113525, -6.4074554443359375, -5.820527076721191, -5.233598709106445, -4.646670818328857, -4.0597429275512695, -3.4728145599365234, -2.8858864307403564, -2.2989583015441895, -1.7120301723480225, -1.1251020431518555, -0.5381739139556885, 0.048754215240478516, 0.6356821060180664, 1.2226104736328125, 1.8095386028289795, 2.3964667320251465, 2.9833948612213135, 3.5703229904174805, 4.157251358032227, 4.7441792488098145, 5.331107139587402, 5.918035507202148, 6.5049638748168945, 7.091891765594482, 7.67881965637207, 8.265748023986816, 8.852676391601562, 9.439603805541992, 10.026532173156738, 10.613460540771484, 11.20038890838623, 11.787317276000977, 12.374244689941406, 12.961173057556152, 13.548101425170898, 14.135028839111328, 14.721957206726074, 15.30888557434082, 15.895813941955566, 16.482742309570312, 17.069669723510742, 17.656597137451172, 18.243526458740234, 18.830453872680664, 19.417381286621094, 20.004310607910156]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 7.0, 3.0, 6.0, 8.0, 5.0, 13.0, 16.0, 12.0, 13.0, 18.0, 26.0, 17.0, 24.0, 37.0, 36.0, 28.0, 36.0, 42.0, 46.0, 44.0, 33.0, 46.0, 36.0, 30.0, 54.0, 34.0, 26.0, 29.0, 27.0, 27.0, 31.0, 30.0, 31.0, 27.0, 19.0, 17.0, 14.0, 10.0, 5.0, 9.0, 7.0, 2.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.12890625, -2.0594482421875, -1.989990234375, -1.9205322265625, -1.85107421875, -1.7816162109375, -1.712158203125, -1.6427001953125, -1.5732421875, -1.5037841796875, -1.434326171875, -1.3648681640625, -1.29541015625, -1.2259521484375, -1.156494140625, -1.0870361328125, -1.017578125, -0.9481201171875, -0.878662109375, -0.8092041015625, -0.73974609375, -0.6702880859375, -0.600830078125, -0.5313720703125, -0.4619140625, -0.3924560546875, -0.322998046875, -0.2535400390625, -0.18408203125, -0.1146240234375, -0.045166015625, 0.0242919921875, 0.09375, 0.1632080078125, 0.232666015625, 0.3021240234375, 0.37158203125, 0.4410400390625, 0.510498046875, 0.5799560546875, 0.6494140625, 0.7188720703125, 0.788330078125, 0.8577880859375, 0.92724609375, 0.9967041015625, 1.066162109375, 1.1356201171875, 1.205078125, 1.2745361328125, 1.343994140625, 1.4134521484375, 1.48291015625, 1.5523681640625, 1.621826171875, 1.6912841796875, 1.7607421875, 1.8302001953125, 1.899658203125, 1.9691162109375, 2.03857421875, 2.1080322265625, 2.177490234375, 2.2469482421875, 2.31640625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 8.0, 7.0, 10.0, 15.0, 27.0, 42.0, 51.0, 74.0, 124.0, 181.0, 227.0, 331.0, 482.0, 765.0, 1035.0, 1550.0, 2337.0, 3495.0, 5298.0, 8192.0, 12959.0, 20445.0, 33734.0, 55774.0, 98218.0, 214681.0, 287990.0, 124621.0, 67647.0, 39952.0, 24766.0, 15314.0, 9692.0, 6105.0, 4094.0, 2632.0, 1801.0, 1182.0, 813.0, 569.0, 398.0, 306.0, 182.0, 133.0, 100.0, 61.0, 44.0, 32.0, 19.0, 15.0, 8.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0], "bins": [-0.01373291015625, -0.013319015502929688, -0.012905120849609375, -0.012491226196289062, -0.01207733154296875, -0.011663436889648438, -0.011249542236328125, -0.010835647583007812, -0.0104217529296875, -0.010007858276367188, -0.009593963623046875, -0.009180068969726562, -0.00876617431640625, -0.008352279663085938, -0.007938385009765625, -0.0075244903564453125, -0.007110595703125, -0.0066967010498046875, -0.006282806396484375, -0.0058689117431640625, -0.00545501708984375, -0.0050411224365234375, -0.004627227783203125, -0.0042133331298828125, -0.0037994384765625, -0.0033855438232421875, -0.002971649169921875, -0.0025577545166015625, -0.00214385986328125, -0.0017299652099609375, -0.001316070556640625, -0.0009021759033203125, -0.00048828125, -7.43865966796875e-05, 0.000339508056640625, 0.0007534027099609375, 0.00116729736328125, 0.0015811920166015625, 0.001995086669921875, 0.0024089813232421875, 0.0028228759765625, 0.0032367706298828125, 0.003650665283203125, 0.0040645599365234375, 0.00447845458984375, 0.0048923492431640625, 0.005306243896484375, 0.0057201385498046875, 0.006134033203125, 0.0065479278564453125, 0.006961822509765625, 0.0073757171630859375, 0.00778961181640625, 0.008203506469726562, 0.008617401123046875, 0.009031295776367188, 0.0094451904296875, 0.009859085083007812, 0.010272979736328125, 0.010686874389648438, 0.01110076904296875, 0.011514663696289062, 0.011928558349609375, 0.012342453002929688, 0.01275634765625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 8.0, 3.0, 9.0, 11.0, 15.0, 14.0, 17.0, 16.0, 25.0, 15.0, 28.0, 34.0, 29.0, 40.0, 35.0, 32.0, 51.0, 45.0, 32.0, 1084.0, 34.0, 56.0, 39.0, 34.0, 41.0, 41.0, 22.0, 32.0, 29.0, 24.0, 22.0, 20.0, 17.0, 18.0, 9.0, 6.0, 12.0, 10.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.7880859375, -1.734893798828125, -1.68170166015625, -1.628509521484375, -1.5753173828125, -1.522125244140625, -1.46893310546875, -1.415740966796875, -1.362548828125, -1.309356689453125, -1.25616455078125, -1.202972412109375, -1.1497802734375, -1.096588134765625, -1.04339599609375, -0.990203857421875, -0.93701171875, -0.883819580078125, -0.83062744140625, -0.777435302734375, -0.7242431640625, -0.671051025390625, -0.61785888671875, -0.564666748046875, -0.511474609375, -0.458282470703125, -0.40509033203125, -0.351898193359375, -0.2987060546875, -0.245513916015625, -0.19232177734375, -0.139129638671875, -0.0859375, -0.032745361328125, 0.02044677734375, 0.073638916015625, 0.1268310546875, 0.180023193359375, 0.23321533203125, 0.286407470703125, 0.339599609375, 0.392791748046875, 0.44598388671875, 0.499176025390625, 0.5523681640625, 0.605560302734375, 0.65875244140625, 0.711944580078125, 0.76513671875, 0.818328857421875, 0.87152099609375, 0.924713134765625, 0.9779052734375, 1.031097412109375, 1.08428955078125, 1.137481689453125, 1.190673828125, 1.243865966796875, 1.29705810546875, 1.350250244140625, 1.4034423828125, 1.456634521484375, 1.50982666015625, 1.563018798828125, 1.6162109375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 7.0, 4.0, 21.0, 26.0, 28.0, 34.0, 65.0, 113.0, 142.0, 229.0, 376.0, 487.0, 808.0, 1187.0, 1937.0, 2783.0, 4517.0, 7065.0, 11336.0, 18259.0, 30208.0, 50222.0, 89777.0, 196904.0, 1366546.0, 137272.0, 70230.0, 40862.0, 24502.0, 15113.0, 9392.0, 5832.0, 3859.0, 2439.0, 1500.0, 1057.0, 659.0, 408.0, 290.0, 210.0, 129.0, 94.0, 68.0, 45.0, 26.0, 25.0, 17.0, 9.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0096588134765625, -0.009340047836303711, -0.009021282196044922, -0.008702516555786133, -0.008383750915527344, -0.008064985275268555, -0.007746219635009766, -0.0074274539947509766, -0.0071086883544921875, -0.0067899227142333984, -0.006471157073974609, -0.00615239143371582, -0.005833625793457031, -0.005514860153198242, -0.005196094512939453, -0.004877328872680664, -0.004558563232421875, -0.004239797592163086, -0.003921031951904297, -0.003602266311645508, -0.0032835006713867188, -0.0029647350311279297, -0.0026459693908691406, -0.0023272037506103516, -0.0020084381103515625, -0.0016896724700927734, -0.0013709068298339844, -0.0010521411895751953, -0.0007333755493164062, -0.0004146099090576172, -9.584426879882812e-05, 0.00022292137145996094, 0.00054168701171875, 0.0008604526519775391, 0.0011792182922363281, 0.0014979839324951172, 0.0018167495727539062, 0.0021355152130126953, 0.0024542808532714844, 0.0027730464935302734, 0.0030918121337890625, 0.0034105777740478516, 0.0037293434143066406, 0.00404810905456543, 0.004366874694824219, 0.004685640335083008, 0.005004405975341797, 0.005323171615600586, 0.005641937255859375, 0.005960702896118164, 0.006279468536376953, 0.006598234176635742, 0.006916999816894531, 0.00723576545715332, 0.007554531097412109, 0.007873296737670898, 0.008192062377929688, 0.008510828018188477, 0.008829593658447266, 0.009148359298706055, 0.009467124938964844, 0.009785890579223633, 0.010104656219482422, 0.010423421859741211, 0.0107421875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [30.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 956.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 31.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 37.0, 31.0, 0.0, 40.0, 0.0, 267.0, 2896.0, 0.0, 16532.0, 0.0, 1008809.0, 16601.0, 0.0, 2915.0, 0.0, 238.0, 53.0, 0.0, 43.0, 0.0, 26.0, 3.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 20.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.1324882507324219e-06, -1.0961666703224182e-06, -1.0598450899124146e-06, -1.0235235095024109e-06, -9.872019290924072e-07, -9.508803486824036e-07, -9.145587682723999e-07, -8.782371878623962e-07, -8.419156074523926e-07, -8.055940270423889e-07, -7.692724466323853e-07, -7.329508662223816e-07, -6.966292858123779e-07, -6.603077054023743e-07, -6.239861249923706e-07, -5.876645445823669e-07, -5.513429641723633e-07, -5.150213837623596e-07, -4.78699803352356e-07, -4.423782229423523e-07, -4.0605664253234863e-07, -3.6973506212234497e-07, -3.334134817123413e-07, -2.9709190130233765e-07, -2.60770320892334e-07, -2.2444874048233032e-07, -1.8812716007232666e-07, -1.51805579662323e-07, -1.1548399925231934e-07, -7.916241884231567e-08, -4.284083843231201e-08, -6.51925802230835e-09, 2.9802322387695312e-08, 6.612390279769897e-08, 1.0244548320770264e-07, 1.387670636177063e-07, 1.7508864402770996e-07, 2.1141022443771362e-07, 2.477318048477173e-07, 2.8405338525772095e-07, 3.203749656677246e-07, 3.5669654607772827e-07, 3.9301812648773193e-07, 4.293397068977356e-07, 4.6566128730773926e-07, 5.019828677177429e-07, 5.383044481277466e-07, 5.746260285377502e-07, 6.109476089477539e-07, 6.472691893577576e-07, 6.835907697677612e-07, 7.199123501777649e-07, 7.562339305877686e-07, 7.925555109977722e-07, 8.288770914077759e-07, 8.651986718177795e-07, 9.015202522277832e-07, 9.378418326377869e-07, 9.741634130477905e-07, 1.0104849934577942e-06, 1.0468065738677979e-06, 1.0831281542778015e-06, 1.1194497346878052e-06, 1.1557713150978088e-06, 1.1920928955078125e-06]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 7.0, 3.0, 6.0, 8.0, 5.0, 13.0, 16.0, 12.0, 13.0, 18.0, 26.0, 17.0, 24.0, 37.0, 36.0, 28.0, 36.0, 42.0, 46.0, 44.0, 33.0, 46.0, 36.0, 30.0, 54.0, 34.0, 26.0, 29.0, 27.0, 27.0, 31.0, 30.0, 31.0, 27.0, 19.0, 17.0, 14.0, 10.0, 5.0, 9.0, 7.0, 2.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.12890625, -2.0594482421875, -1.989990234375, -1.9205322265625, -1.85107421875, -1.7816162109375, -1.712158203125, -1.6427001953125, -1.5732421875, -1.5037841796875, -1.434326171875, -1.3648681640625, -1.29541015625, -1.2259521484375, -1.156494140625, -1.0870361328125, -1.017578125, -0.9481201171875, -0.878662109375, -0.8092041015625, -0.73974609375, -0.6702880859375, -0.600830078125, -0.5313720703125, -0.4619140625, -0.3924560546875, -0.322998046875, -0.2535400390625, -0.18408203125, -0.1146240234375, -0.045166015625, 0.0242919921875, 0.09375, 0.1632080078125, 0.232666015625, 0.3021240234375, 0.37158203125, 0.4410400390625, 0.510498046875, 0.5799560546875, 0.6494140625, 0.7188720703125, 0.788330078125, 0.8577880859375, 0.92724609375, 0.9967041015625, 1.066162109375, 1.1356201171875, 1.205078125, 1.2745361328125, 1.343994140625, 1.4134521484375, 1.48291015625, 1.5523681640625, 1.621826171875, 1.6912841796875, 1.7607421875, 1.8302001953125, 1.899658203125, 1.9691162109375, 2.03857421875, 2.1080322265625, 2.177490234375, 2.2469482421875, 2.31640625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 18.0, 20.0, 12.0, 27.0, 31.0, 55.0, 87.0, 130.0, 240.0, 303.0, 494.0, 786.0, 1184.0, 1921.0, 2934.0, 4611.0, 7436.0, 11998.0, 18922.0, 30815.0, 52054.0, 143133.0, 483663.0, 150971.0, 53311.0, 30948.0, 19378.0, 12305.0, 7528.0, 4851.0, 3028.0, 1895.0, 1247.0, 817.0, 494.0, 298.0, 200.0, 149.0, 90.0, 54.0, 40.0, 31.0, 12.0, 8.0, 8.0, 5.0, 9.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.28515625, -2.21697998046875, -2.1488037109375, -2.08062744140625, -2.012451171875, -1.94427490234375, -1.8760986328125, -1.80792236328125, -1.73974609375, -1.67156982421875, -1.6033935546875, -1.53521728515625, -1.467041015625, -1.39886474609375, -1.3306884765625, -1.26251220703125, -1.1943359375, -1.12615966796875, -1.0579833984375, -0.98980712890625, -0.921630859375, -0.85345458984375, -0.7852783203125, -0.71710205078125, -0.64892578125, -0.58074951171875, -0.5125732421875, -0.44439697265625, -0.376220703125, -0.30804443359375, -0.2398681640625, -0.17169189453125, -0.103515625, -0.03533935546875, 0.0328369140625, 0.10101318359375, 0.169189453125, 0.23736572265625, 0.3055419921875, 0.37371826171875, 0.44189453125, 0.51007080078125, 0.5782470703125, 0.64642333984375, 0.714599609375, 0.78277587890625, 0.8509521484375, 0.91912841796875, 0.9873046875, 1.05548095703125, 1.1236572265625, 1.19183349609375, 1.260009765625, 1.32818603515625, 1.3963623046875, 1.46453857421875, 1.53271484375, 1.60089111328125, 1.6690673828125, 1.73724365234375, 1.805419921875, 1.87359619140625, 1.9417724609375, 2.00994873046875, 2.078125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 9.0, 6.0, 8.0, 8.0, 10.0, 10.0, 12.0, 20.0, 10.0, 15.0, 21.0, 35.0, 25.0, 39.0, 37.0, 32.0, 49.0, 77.0, 136.0, 1590.0, 310.0, 105.0, 58.0, 51.0, 42.0, 46.0, 32.0, 31.0, 32.0, 33.0, 20.0, 22.0, 27.0, 19.0, 8.0, 12.0, 11.0, 11.0, 8.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0], "bins": [-8.265625, -8.0140380859375, -7.762451171875, -7.5108642578125, -7.25927734375, -7.0076904296875, -6.756103515625, -6.5045166015625, -6.2529296875, -6.0013427734375, -5.749755859375, -5.4981689453125, -5.24658203125, -4.9949951171875, -4.743408203125, -4.4918212890625, -4.240234375, -3.9886474609375, -3.737060546875, -3.4854736328125, -3.23388671875, -2.9822998046875, -2.730712890625, -2.4791259765625, -2.2275390625, -1.9759521484375, -1.724365234375, -1.4727783203125, -1.22119140625, -0.9696044921875, -0.718017578125, -0.4664306640625, -0.21484375, 0.0367431640625, 0.288330078125, 0.5399169921875, 0.79150390625, 1.0430908203125, 1.294677734375, 1.5462646484375, 1.7978515625, 2.0494384765625, 2.301025390625, 2.5526123046875, 2.80419921875, 3.0557861328125, 3.307373046875, 3.5589599609375, 3.810546875, 4.0621337890625, 4.313720703125, 4.5653076171875, 4.81689453125, 5.0684814453125, 5.320068359375, 5.5716552734375, 5.8232421875, 6.0748291015625, 6.326416015625, 6.5780029296875, 6.82958984375, 7.0811767578125, 7.332763671875, 7.5843505859375, 7.8359375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 5.0, 7.0, 15.0, 14.0, 12.0, 20.0, 20.0, 24.0, 31.0, 46.0, 52.0, 90.0, 84.0, 118.0, 149.0, 212.0, 375.0, 1123.0, 7061.0, 98740.0, 2927814.0, 100267.0, 7219.0, 1049.0, 367.0, 197.0, 144.0, 110.0, 78.0, 66.0, 35.0, 28.0, 20.0, 22.0, 11.0, 18.0, 14.0, 8.0, 6.0, 7.0, 8.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.3359375, -12.91259765625, -12.4892578125, -12.06591796875, -11.642578125, -11.21923828125, -10.7958984375, -10.37255859375, -9.94921875, -9.52587890625, -9.1025390625, -8.67919921875, -8.255859375, -7.83251953125, -7.4091796875, -6.98583984375, -6.5625, -6.13916015625, -5.7158203125, -5.29248046875, -4.869140625, -4.44580078125, -4.0224609375, -3.59912109375, -3.17578125, -2.75244140625, -2.3291015625, -1.90576171875, -1.482421875, -1.05908203125, -0.6357421875, -0.21240234375, 0.2109375, 0.63427734375, 1.0576171875, 1.48095703125, 1.904296875, 2.32763671875, 2.7509765625, 3.17431640625, 3.59765625, 4.02099609375, 4.4443359375, 4.86767578125, 5.291015625, 5.71435546875, 6.1376953125, 6.56103515625, 6.984375, 7.40771484375, 7.8310546875, 8.25439453125, 8.677734375, 9.10107421875, 9.5244140625, 9.94775390625, 10.37109375, 10.79443359375, 11.2177734375, 11.64111328125, 12.064453125, 12.48779296875, 12.9111328125, 13.33447265625, 13.7578125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 9.0, 298.0, 656.0, 53.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.055992126464844, -13.795495986938477, -10.53499984741211, -7.274503707885742, -4.014007568359375, -0.7535114288330078, 2.5069847106933594, 5.767480850219727, 9.027976989746094, 12.288473129272461, 15.548969268798828, 18.809465408325195, 22.069961547851562, 25.33045768737793, 28.590953826904297, 31.851449966430664, 35.11194610595703, 38.37244415283203, 41.632938385009766, 44.8934326171875, 48.1539306640625, 51.4144287109375, 54.674922943115234, 57.93541717529297, 61.19591522216797, 64.45641326904297, 67.71690368652344, 70.97740173339844, 74.23789978027344, 77.49839782714844, 80.75889587402344, 84.0193862915039, 87.27987670898438, 90.54037475585938, 93.80087280273438, 97.06136322021484, 100.32186126708984, 103.58235931396484, 106.84284973144531, 110.10334777832031, 113.36384582519531, 116.62434387207031, 119.88484191894531, 123.14533233642578, 126.40583038330078, 129.66632080078125, 132.92681884765625, 136.18731689453125, 139.44781494140625, 142.70831298828125, 145.96881103515625, 149.22930908203125, 152.48980712890625, 155.7502899169922, 159.0107879638672, 162.2712860107422, 165.5317840576172, 168.7922821044922, 172.0527801513672, 175.3132781982422, 178.57376098632812, 181.83425903320312, 185.09475708007812, 188.35525512695312, 191.61575317382812]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 3.0, 7.0, 10.0, 5.0, 14.0, 13.0, 12.0, 6.0, 20.0, 16.0, 18.0, 22.0, 25.0, 31.0, 32.0, 38.0, 26.0, 36.0, 39.0, 34.0, 36.0, 37.0, 33.0, 43.0, 27.0, 54.0, 46.0, 26.0, 29.0, 32.0, 23.0, 29.0, 25.0, 24.0, 18.0, 13.0, 17.0, 14.0, 9.0, 10.0, 8.0, 12.0, 9.0, 2.0, 8.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-20.439821243286133, -19.773361206054688, -19.106901168823242, -18.440441131591797, -17.77398109436035, -17.107521057128906, -16.441062927246094, -15.774602890014648, -15.108142852783203, -14.441682815551758, -13.775222778320312, -13.108762741088867, -12.442303657531738, -11.775843620300293, -11.109383583068848, -10.442924499511719, -9.776463508605957, -9.110003471374512, -8.443543434143066, -7.777083873748779, -7.110624313354492, -6.444164276123047, -5.777704238891602, -5.1112446784973145, -4.444784641265869, -3.778324842453003, -3.1118650436401367, -2.4454050064086914, -1.7789452075958252, -1.112485408782959, -0.44602537155151367, 0.22043418884277344, 0.8868942260742188, 1.553354024887085, 2.219813823699951, 2.8862738609313965, 3.5527336597442627, 4.219193458557129, 4.885653495788574, 5.552113056182861, 6.218573093414307, 6.885033130645752, 7.551492691040039, 8.217952728271484, 8.88441276550293, 9.550872802734375, 10.21733283996582, 10.88379192352295, 11.550251960754395, 12.21671199798584, 12.883172035217285, 13.549631118774414, 14.21609115600586, 14.882551193237305, 15.54901123046875, 16.215471267700195, 16.88193130493164, 17.548391342163086, 18.21485137939453, 18.881311416625977, 19.547771453857422, 20.214229583740234, 20.880691528320312, 21.547149658203125, 22.21360969543457]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 9.0, 1.0, 2.0, 8.0, 7.0, 12.0, 12.0, 9.0, 14.0, 14.0, 20.0, 14.0, 21.0, 31.0, 40.0, 25.0, 44.0, 46.0, 35.0, 38.0, 45.0, 35.0, 39.0, 52.0, 46.0, 34.0, 29.0, 30.0, 27.0, 40.0, 22.0, 24.0, 35.0, 31.0, 25.0, 20.0, 11.0, 10.0, 8.0, 7.0, 5.0, 7.0, 2.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2421875, -2.168426513671875, -2.09466552734375, -2.020904541015625, -1.9471435546875, -1.873382568359375, -1.79962158203125, -1.725860595703125, -1.652099609375, -1.578338623046875, -1.50457763671875, -1.430816650390625, -1.3570556640625, -1.283294677734375, -1.20953369140625, -1.135772705078125, -1.06201171875, -0.988250732421875, -0.91448974609375, -0.840728759765625, -0.7669677734375, -0.693206787109375, -0.61944580078125, -0.545684814453125, -0.471923828125, -0.398162841796875, -0.32440185546875, -0.250640869140625, -0.1768798828125, -0.103118896484375, -0.02935791015625, 0.044403076171875, 0.1181640625, 0.191925048828125, 0.26568603515625, 0.339447021484375, 0.4132080078125, 0.486968994140625, 0.56072998046875, 0.634490966796875, 0.708251953125, 0.782012939453125, 0.85577392578125, 0.929534912109375, 1.0032958984375, 1.077056884765625, 1.15081787109375, 1.224578857421875, 1.29833984375, 1.372100830078125, 1.44586181640625, 1.519622802734375, 1.5933837890625, 1.667144775390625, 1.74090576171875, 1.814666748046875, 1.888427734375, 1.962188720703125, 2.03594970703125, 2.109710693359375, 2.1834716796875, 2.257232666015625, 2.33099365234375, 2.404754638671875, 2.478515625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 13.0, 7.0, 10.0, 14.0, 27.0, 27.0, 28.0, 48.0, 76.0, 102.0, 145.0, 170.0, 293.0, 436.0, 640.0, 1041.0, 1895.0, 3543.0, 7088.0, 14999.0, 35893.0, 95645.0, 300903.0, 1018189.0, 1662454.0, 719415.0, 207287.0, 69938.0, 28182.0, 12243.0, 5864.0, 3076.0, 1707.0, 936.0, 622.0, 391.0, 246.0, 162.0, 136.0, 105.0, 79.0, 61.0, 33.0, 23.0, 29.0, 15.0, 15.0, 12.0, 6.0, 4.0, 2.0, 3.0, 5.0, 2.0, 0.0, 3.0], "bins": [-3.689453125, -3.575408935546875, -3.46136474609375, -3.347320556640625, -3.2332763671875, -3.119232177734375, -3.00518798828125, -2.891143798828125, -2.777099609375, -2.663055419921875, -2.54901123046875, -2.434967041015625, -2.3209228515625, -2.206878662109375, -2.09283447265625, -1.978790283203125, -1.86474609375, -1.750701904296875, -1.63665771484375, -1.522613525390625, -1.4085693359375, -1.294525146484375, -1.18048095703125, -1.066436767578125, -0.952392578125, -0.838348388671875, -0.72430419921875, -0.610260009765625, -0.4962158203125, -0.382171630859375, -0.26812744140625, -0.154083251953125, -0.0400390625, 0.074005126953125, 0.18804931640625, 0.302093505859375, 0.4161376953125, 0.530181884765625, 0.64422607421875, 0.758270263671875, 0.872314453125, 0.986358642578125, 1.10040283203125, 1.214447021484375, 1.3284912109375, 1.442535400390625, 1.55657958984375, 1.670623779296875, 1.78466796875, 1.898712158203125, 2.01275634765625, 2.126800537109375, 2.2408447265625, 2.354888916015625, 2.46893310546875, 2.582977294921875, 2.697021484375, 2.811065673828125, 2.92510986328125, 3.039154052734375, 3.1531982421875, 3.267242431640625, 3.38128662109375, 3.495330810546875, 3.609375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 4.0, 4.0, 10.0, 11.0, 16.0, 29.0, 34.0, 55.0, 68.0, 117.0, 138.0, 211.0, 245.0, 329.0, 402.0, 484.0, 454.0, 390.0, 278.0, 191.0, 159.0, 122.0, 93.0, 66.0, 48.0, 38.0, 19.0, 16.0, 14.0, 17.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.85546875, -7.66253662109375, -7.4696044921875, -7.27667236328125, -7.083740234375, -6.89080810546875, -6.6978759765625, -6.50494384765625, -6.31201171875, -6.11907958984375, -5.9261474609375, -5.73321533203125, -5.540283203125, -5.34735107421875, -5.1544189453125, -4.96148681640625, -4.7685546875, -4.57562255859375, -4.3826904296875, -4.18975830078125, -3.996826171875, -3.80389404296875, -3.6109619140625, -3.41802978515625, -3.22509765625, -3.03216552734375, -2.8392333984375, -2.64630126953125, -2.453369140625, -2.26043701171875, -2.0675048828125, -1.87457275390625, -1.681640625, -1.48870849609375, -1.2957763671875, -1.10284423828125, -0.909912109375, -0.71697998046875, -0.5240478515625, -0.33111572265625, -0.13818359375, 0.05474853515625, 0.2476806640625, 0.44061279296875, 0.633544921875, 0.82647705078125, 1.0194091796875, 1.21234130859375, 1.4052734375, 1.59820556640625, 1.7911376953125, 1.98406982421875, 2.177001953125, 2.36993408203125, 2.5628662109375, 2.75579833984375, 2.94873046875, 3.14166259765625, 3.3345947265625, 3.52752685546875, 3.720458984375, 3.91339111328125, 4.1063232421875, 4.29925537109375, 4.4921875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 5.0, 7.0, 16.0, 21.0, 24.0, 41.0, 48.0, 69.0, 101.0, 137.0, 205.0, 307.0, 596.0, 1388.0, 4978.0, 27048.0, 217859.0, 2204622.0, 1561977.0, 149146.0, 19373.0, 3782.0, 1142.0, 491.0, 282.0, 162.0, 133.0, 76.0, 53.0, 49.0, 46.0, 22.0, 20.0, 19.0, 17.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.4453125, -8.0921630859375, -7.739013671875, -7.3858642578125, -7.03271484375, -6.6795654296875, -6.326416015625, -5.9732666015625, -5.6201171875, -5.2669677734375, -4.913818359375, -4.5606689453125, -4.20751953125, -3.8543701171875, -3.501220703125, -3.1480712890625, -2.794921875, -2.4417724609375, -2.088623046875, -1.7354736328125, -1.38232421875, -1.0291748046875, -0.676025390625, -0.3228759765625, 0.0302734375, 0.3834228515625, 0.736572265625, 1.0897216796875, 1.44287109375, 1.7960205078125, 2.149169921875, 2.5023193359375, 2.85546875, 3.2086181640625, 3.561767578125, 3.9149169921875, 4.26806640625, 4.6212158203125, 4.974365234375, 5.3275146484375, 5.6806640625, 6.0338134765625, 6.386962890625, 6.7401123046875, 7.09326171875, 7.4464111328125, 7.799560546875, 8.1527099609375, 8.505859375, 8.8590087890625, 9.212158203125, 9.5653076171875, 9.91845703125, 10.2716064453125, 10.624755859375, 10.9779052734375, 11.3310546875, 11.6842041015625, 12.037353515625, 12.3905029296875, 12.74365234375, 13.0968017578125, 13.449951171875, 13.8031005859375, 14.15625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 8.0, 15.0, 22.0, 29.0, 45.0, 65.0, 91.0, 116.0, 115.0, 117.0, 110.0, 84.0, 59.0, 47.0, 23.0, 23.0, 14.0, 12.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.782926559448242, -17.738866806030273, -16.694808959960938, -15.650749206542969, -14.606689453125, -13.562630653381348, -12.518571853637695, -11.474512100219727, -10.430453300476074, -9.386394500732422, -8.342334747314453, -7.298275947570801, -6.25421667098999, -5.21015739440918, -4.166098594665527, -3.122039318084717, -2.0779800415039062, -1.0339208841323853, 0.010138273239135742, 1.0541973114013672, 2.0982565879821777, 3.1423158645629883, 4.186374664306641, 5.230433940887451, 6.274493217468262, 7.318552494049072, 8.362611770629883, 9.406670570373535, 10.450729370117188, 11.494789123535156, 12.538847923278809, 13.582906723022461, 14.626968383789062, 15.671027183532715, 16.715085983276367, 17.759145736694336, 18.803205490112305, 19.84726333618164, 20.89132308959961, 21.935382843017578, 22.979442596435547, 24.023502349853516, 25.06756019592285, 26.11161994934082, 27.15567970275879, 28.199737548828125, 29.243797302246094, 30.287857055664062, 31.3319149017334, 32.375972747802734, 33.4200325012207, 34.46409225463867, 35.50815200805664, 36.55221176147461, 37.59626770019531, 38.64032745361328, 39.68438720703125, 40.72844696044922, 41.77250671386719, 42.816566467285156, 43.86062240600586, 44.90468215942383, 45.9487419128418, 46.992801666259766, 48.036861419677734]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 2.0, 5.0, 13.0, 9.0, 12.0, 11.0, 18.0, 24.0, 16.0, 27.0, 36.0, 31.0, 24.0, 31.0, 39.0, 46.0, 30.0, 38.0, 43.0, 33.0, 45.0, 37.0, 44.0, 46.0, 48.0, 32.0, 26.0, 21.0, 32.0, 36.0, 25.0, 22.0, 16.0, 15.0, 21.0, 6.0, 12.0, 9.0, 2.0, 7.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.000259399414062, -17.39913558959961, -16.798011779785156, -16.196887969970703, -15.595763206481934, -14.99463939666748, -14.393514633178711, -13.792390823364258, -13.191267013549805, -12.590143203735352, -11.989019393920898, -11.387894630432129, -10.786770820617676, -10.185647010803223, -9.584522247314453, -8.9833984375, -8.382274627685547, -7.781150817871094, -7.180026531219482, -6.578902244567871, -5.977778434753418, -5.376654624938965, -4.7755303382873535, -4.174406051635742, -3.573282241821289, -2.972158193588257, -2.3710341453552246, -1.7699100971221924, -1.1687860488891602, -0.5676620006561279, 0.0334620475769043, 0.6345863342285156, 1.2357101440429688, 1.836834192276001, 2.437958240509033, 3.0390822887420654, 3.6402063369750977, 4.241330146789551, 4.842454433441162, 5.443578720092773, 6.044702529907227, 6.64582633972168, 7.246950626373291, 7.848074913024902, 8.449198722839355, 9.050322532653809, 9.651447296142578, 10.252571105957031, 10.853694915771484, 11.454818725585938, 12.05594253540039, 12.65706729888916, 13.258191108703613, 13.859314918518066, 14.460439682006836, 15.061563491821289, 15.662687301635742, 16.263811111450195, 16.86493492126465, 17.4660587310791, 18.067184448242188, 18.66830825805664, 19.269432067871094, 19.870555877685547, 20.4716796875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 8.0, 5.0, 4.0, 7.0, 10.0, 13.0, 13.0, 18.0, 15.0, 17.0, 25.0, 22.0, 34.0, 30.0, 31.0, 32.0, 41.0, 35.0, 41.0, 56.0, 40.0, 34.0, 33.0, 41.0, 32.0, 32.0, 40.0, 54.0, 34.0, 22.0, 30.0, 25.0, 21.0, 16.0, 14.0, 10.0, 12.0, 14.0, 7.0, 3.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.203125, -2.129730224609375, -2.05633544921875, -1.982940673828125, -1.9095458984375, -1.836151123046875, -1.76275634765625, -1.689361572265625, -1.615966796875, -1.542572021484375, -1.46917724609375, -1.395782470703125, -1.3223876953125, -1.248992919921875, -1.17559814453125, -1.102203369140625, -1.02880859375, -0.955413818359375, -0.88201904296875, -0.808624267578125, -0.7352294921875, -0.661834716796875, -0.58843994140625, -0.515045166015625, -0.441650390625, -0.368255615234375, -0.29486083984375, -0.221466064453125, -0.1480712890625, -0.074676513671875, -0.00128173828125, 0.072113037109375, 0.1455078125, 0.218902587890625, 0.29229736328125, 0.365692138671875, 0.4390869140625, 0.512481689453125, 0.58587646484375, 0.659271240234375, 0.732666015625, 0.806060791015625, 0.87945556640625, 0.952850341796875, 1.0262451171875, 1.099639892578125, 1.17303466796875, 1.246429443359375, 1.31982421875, 1.393218994140625, 1.46661376953125, 1.540008544921875, 1.6134033203125, 1.686798095703125, 1.76019287109375, 1.833587646484375, 1.906982421875, 1.980377197265625, 2.05377197265625, 2.127166748046875, 2.2005615234375, 2.273956298828125, 2.34735107421875, 2.420745849609375, 2.494140625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 7.0, 8.0, 10.0, 21.0, 29.0, 32.0, 47.0, 72.0, 99.0, 145.0, 201.0, 292.0, 449.0, 642.0, 864.0, 1263.0, 1921.0, 2811.0, 4269.0, 6446.0, 9772.0, 15363.0, 25099.0, 41179.0, 71033.0, 133263.0, 299428.0, 200992.0, 93079.0, 52826.0, 31603.0, 19371.0, 12199.0, 7903.0, 5144.0, 3338.0, 2278.0, 1577.0, 1050.0, 748.0, 517.0, 351.0, 245.0, 158.0, 132.0, 86.0, 59.0, 35.0, 34.0, 33.0, 17.0, 6.0, 7.0, 5.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.01372528076171875, -0.013306021690368652, -0.012886762619018555, -0.012467503547668457, -0.01204824447631836, -0.011628985404968262, -0.011209726333618164, -0.010790467262268066, -0.010371208190917969, -0.009951949119567871, -0.009532690048217773, -0.009113430976867676, -0.008694171905517578, -0.00827491283416748, -0.007855653762817383, -0.007436394691467285, -0.0070171356201171875, -0.00659787654876709, -0.006178617477416992, -0.0057593584060668945, -0.005340099334716797, -0.004920840263366699, -0.0045015811920166016, -0.004082322120666504, -0.0036630630493164062, -0.0032438039779663086, -0.002824544906616211, -0.0024052858352661133, -0.0019860267639160156, -0.001566767692565918, -0.0011475086212158203, -0.0007282495498657227, -0.000308990478515625, 0.00011026859283447266, 0.0005295276641845703, 0.000948786735534668, 0.0013680458068847656, 0.0017873048782348633, 0.002206563949584961, 0.0026258230209350586, 0.0030450820922851562, 0.003464341163635254, 0.0038836002349853516, 0.004302859306335449, 0.004722118377685547, 0.0051413774490356445, 0.005560636520385742, 0.00597989559173584, 0.0063991546630859375, 0.006818413734436035, 0.007237672805786133, 0.0076569318771362305, 0.008076190948486328, 0.008495450019836426, 0.008914709091186523, 0.009333968162536621, 0.009753227233886719, 0.010172486305236816, 0.010591745376586914, 0.011011004447937012, 0.01143026351928711, 0.011849522590637207, 0.012268781661987305, 0.012688040733337402, 0.0131072998046875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 7.0, 7.0, 8.0, 14.0, 6.0, 13.0, 24.0, 19.0, 28.0, 26.0, 37.0, 46.0, 29.0, 52.0, 43.0, 48.0, 43.0, 40.0, 1067.0, 57.0, 62.0, 49.0, 29.0, 48.0, 36.0, 42.0, 25.0, 24.0, 26.0, 23.0, 9.0, 9.0, 5.0, 7.0, 6.0, 5.0, 2.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.349609375, -2.2863922119140625, -2.223175048828125, -2.1599578857421875, -2.09674072265625, -2.0335235595703125, -1.970306396484375, -1.9070892333984375, -1.8438720703125, -1.7806549072265625, -1.717437744140625, -1.6542205810546875, -1.59100341796875, -1.5277862548828125, -1.464569091796875, -1.4013519287109375, -1.338134765625, -1.2749176025390625, -1.211700439453125, -1.1484832763671875, -1.08526611328125, -1.0220489501953125, -0.958831787109375, -0.8956146240234375, -0.8323974609375, -0.7691802978515625, -0.705963134765625, -0.6427459716796875, -0.57952880859375, -0.5163116455078125, -0.453094482421875, -0.3898773193359375, -0.32666015625, -0.2634429931640625, -0.200225830078125, -0.1370086669921875, -0.07379150390625, -0.0105743408203125, 0.052642822265625, 0.1158599853515625, 0.1790771484375, 0.2422943115234375, 0.305511474609375, 0.3687286376953125, 0.43194580078125, 0.4951629638671875, 0.558380126953125, 0.6215972900390625, 0.684814453125, 0.7480316162109375, 0.811248779296875, 0.8744659423828125, 0.93768310546875, 1.0009002685546875, 1.064117431640625, 1.1273345947265625, 1.1905517578125, 1.2537689208984375, 1.316986083984375, 1.3802032470703125, 1.44342041015625, 1.5066375732421875, 1.569854736328125, 1.6330718994140625, 1.6962890625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 12.0, 5.0, 8.0, 21.0, 31.0, 48.0, 78.0, 114.0, 190.0, 288.0, 501.0, 925.0, 1386.0, 2288.0, 4101.0, 7141.0, 13017.0, 24359.0, 46570.0, 94666.0, 236920.0, 1399201.0, 132488.0, 62600.0, 31684.0, 16980.0, 8980.0, 5310.0, 2879.0, 1698.0, 1015.0, 603.0, 398.0, 227.0, 121.0, 106.0, 75.0, 31.0, 18.0, 15.0, 10.0, 10.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01261138916015625, -0.012193918228149414, -0.011776447296142578, -0.011358976364135742, -0.010941505432128906, -0.01052403450012207, -0.010106563568115234, -0.009689092636108398, -0.009271621704101562, -0.008854150772094727, -0.00843667984008789, -0.008019208908081055, -0.007601737976074219, -0.007184267044067383, -0.006766796112060547, -0.006349325180053711, -0.005931854248046875, -0.005514383316040039, -0.005096912384033203, -0.004679441452026367, -0.004261970520019531, -0.0038444995880126953, -0.0034270286560058594, -0.0030095577239990234, -0.0025920867919921875, -0.0021746158599853516, -0.0017571449279785156, -0.0013396739959716797, -0.0009222030639648438, -0.0005047321319580078, -8.726119995117188e-05, 0.00033020973205566406, 0.0007476806640625, 0.001165151596069336, 0.0015826225280761719, 0.002000093460083008, 0.0024175643920898438, 0.0028350353240966797, 0.0032525062561035156, 0.0036699771881103516, 0.0040874481201171875, 0.0045049190521240234, 0.004922389984130859, 0.005339860916137695, 0.005757331848144531, 0.006174802780151367, 0.006592273712158203, 0.007009744644165039, 0.007427215576171875, 0.007844686508178711, 0.008262157440185547, 0.008679628372192383, 0.009097099304199219, 0.009514570236206055, 0.00993204116821289, 0.010349512100219727, 0.010766983032226562, 0.011184453964233398, 0.011601924896240234, 0.01201939582824707, 0.012436866760253906, 0.012854337692260742, 0.013271808624267578, 0.013689279556274414, 0.01410675048828125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 966.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 20.0, 37.0, 41.0, 216.0, 2361.0, 14002.0, 1015336.0, 13776.0, 2358.0, 244.0, 49.0, 25.0, 31.0, 4.0, 6.0, 0.0, 0.0, 0.0, 6.0, 19.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9073486328125e-06, -1.8477439880371094e-06, -1.7881393432617188e-06, -1.7285346984863281e-06, -1.6689300537109375e-06, -1.6093254089355469e-06, -1.5497207641601562e-06, -1.4901161193847656e-06, -1.430511474609375e-06, -1.3709068298339844e-06, -1.3113021850585938e-06, -1.2516975402832031e-06, -1.1920928955078125e-06, -1.1324882507324219e-06, -1.0728836059570312e-06, -1.0132789611816406e-06, -9.5367431640625e-07, -8.940696716308594e-07, -8.344650268554688e-07, -7.748603820800781e-07, -7.152557373046875e-07, -6.556510925292969e-07, -5.960464477539062e-07, -5.364418029785156e-07, -4.76837158203125e-07, -4.172325134277344e-07, -3.5762786865234375e-07, -2.980232238769531e-07, -2.384185791015625e-07, -1.7881393432617188e-07, -1.1920928955078125e-07, -5.960464477539063e-08, 0.0, 5.960464477539063e-08, 1.1920928955078125e-07, 1.7881393432617188e-07, 2.384185791015625e-07, 2.980232238769531e-07, 3.5762786865234375e-07, 4.172325134277344e-07, 4.76837158203125e-07, 5.364418029785156e-07, 5.960464477539062e-07, 6.556510925292969e-07, 7.152557373046875e-07, 7.748603820800781e-07, 8.344650268554688e-07, 8.940696716308594e-07, 9.5367431640625e-07, 1.0132789611816406e-06, 1.0728836059570312e-06, 1.1324882507324219e-06, 1.1920928955078125e-06, 1.2516975402832031e-06, 1.3113021850585938e-06, 1.3709068298339844e-06, 1.430511474609375e-06, 1.4901161193847656e-06, 1.5497207641601562e-06, 1.6093254089355469e-06, 1.6689300537109375e-06, 1.7285346984863281e-06, 1.7881393432617188e-06, 1.8477439880371094e-06, 1.9073486328125e-06]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 8.0, 5.0, 4.0, 7.0, 10.0, 13.0, 13.0, 18.0, 15.0, 17.0, 25.0, 22.0, 34.0, 30.0, 31.0, 32.0, 41.0, 35.0, 41.0, 56.0, 40.0, 34.0, 33.0, 41.0, 32.0, 32.0, 40.0, 54.0, 34.0, 22.0, 30.0, 25.0, 21.0, 16.0, 14.0, 10.0, 12.0, 14.0, 7.0, 3.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.203125, -2.129730224609375, -2.05633544921875, -1.982940673828125, -1.9095458984375, -1.836151123046875, -1.76275634765625, -1.689361572265625, -1.615966796875, -1.542572021484375, -1.46917724609375, -1.395782470703125, -1.3223876953125, -1.248992919921875, -1.17559814453125, -1.102203369140625, -1.02880859375, -0.955413818359375, -0.88201904296875, -0.808624267578125, -0.7352294921875, -0.661834716796875, -0.58843994140625, -0.515045166015625, -0.441650390625, -0.368255615234375, -0.29486083984375, -0.221466064453125, -0.1480712890625, -0.074676513671875, -0.00128173828125, 0.072113037109375, 0.1455078125, 0.218902587890625, 0.29229736328125, 0.365692138671875, 0.4390869140625, 0.512481689453125, 0.58587646484375, 0.659271240234375, 0.732666015625, 0.806060791015625, 0.87945556640625, 0.952850341796875, 1.0262451171875, 1.099639892578125, 1.17303466796875, 1.246429443359375, 1.31982421875, 1.393218994140625, 1.46661376953125, 1.540008544921875, 1.6134033203125, 1.686798095703125, 1.76019287109375, 1.833587646484375, 1.906982421875, 1.980377197265625, 2.05377197265625, 2.127166748046875, 2.2005615234375, 2.273956298828125, 2.34735107421875, 2.420745849609375, 2.494140625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 0.0, 6.0, 3.0, 4.0, 3.0, 6.0, 15.0, 15.0, 18.0, 25.0, 46.0, 74.0, 84.0, 139.0, 240.0, 352.0, 538.0, 914.0, 1537.0, 2352.0, 3868.0, 6669.0, 11958.0, 22260.0, 41288.0, 84156.0, 216426.0, 375748.0, 143304.0, 63424.0, 32331.0, 17277.0, 9651.0, 5430.0, 3156.0, 1956.0, 1185.0, 696.0, 476.0, 317.0, 206.0, 140.0, 86.0, 53.0, 40.0, 35.0, 14.0, 15.0, 8.0, 9.0, 2.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0625, -1.99444580078125, -1.9263916015625, -1.85833740234375, -1.790283203125, -1.72222900390625, -1.6541748046875, -1.58612060546875, -1.51806640625, -1.45001220703125, -1.3819580078125, -1.31390380859375, -1.245849609375, -1.17779541015625, -1.1097412109375, -1.04168701171875, -0.9736328125, -0.90557861328125, -0.8375244140625, -0.76947021484375, -0.701416015625, -0.63336181640625, -0.5653076171875, -0.49725341796875, -0.42919921875, -0.36114501953125, -0.2930908203125, -0.22503662109375, -0.156982421875, -0.08892822265625, -0.0208740234375, 0.04718017578125, 0.115234375, 0.18328857421875, 0.2513427734375, 0.31939697265625, 0.387451171875, 0.45550537109375, 0.5235595703125, 0.59161376953125, 0.65966796875, 0.72772216796875, 0.7957763671875, 0.86383056640625, 0.931884765625, 0.99993896484375, 1.0679931640625, 1.13604736328125, 1.2041015625, 1.27215576171875, 1.3402099609375, 1.40826416015625, 1.476318359375, 1.54437255859375, 1.6124267578125, 1.68048095703125, 1.74853515625, 1.81658935546875, 1.8846435546875, 1.95269775390625, 2.020751953125, 2.08880615234375, 2.1568603515625, 2.22491455078125, 2.29296875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 5.0, 10.0, 7.0, 8.0, 8.0, 12.0, 13.0, 16.0, 25.0, 29.0, 29.0, 34.0, 41.0, 57.0, 66.0, 66.0, 140.0, 345.0, 1529.0, 159.0, 89.0, 71.0, 37.0, 29.0, 44.0, 36.0, 22.0, 24.0, 17.0, 23.0, 15.0, 11.0, 13.0, 8.0, 1.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2421875, -9.902587890625, -9.56298828125, -9.223388671875, -8.8837890625, -8.544189453125, -8.20458984375, -7.864990234375, -7.525390625, -7.185791015625, -6.84619140625, -6.506591796875, -6.1669921875, -5.827392578125, -5.48779296875, -5.148193359375, -4.80859375, -4.468994140625, -4.12939453125, -3.789794921875, -3.4501953125, -3.110595703125, -2.77099609375, -2.431396484375, -2.091796875, -1.752197265625, -1.41259765625, -1.072998046875, -0.7333984375, -0.393798828125, -0.05419921875, 0.285400390625, 0.625, 0.964599609375, 1.30419921875, 1.643798828125, 1.9833984375, 2.322998046875, 2.66259765625, 3.002197265625, 3.341796875, 3.681396484375, 4.02099609375, 4.360595703125, 4.7001953125, 5.039794921875, 5.37939453125, 5.718994140625, 6.05859375, 6.398193359375, 6.73779296875, 7.077392578125, 7.4169921875, 7.756591796875, 8.09619140625, 8.435791015625, 8.775390625, 9.114990234375, 9.45458984375, 9.794189453125, 10.1337890625, 10.473388671875, 10.81298828125, 11.152587890625, 11.4921875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 0.0, 8.0, 8.0, 20.0, 13.0, 24.0, 31.0, 36.0, 48.0, 64.0, 90.0, 124.0, 160.0, 306.0, 732.0, 2912.0, 34336.0, 2993491.0, 106564.0, 4624.0, 1028.0, 382.0, 216.0, 133.0, 81.0, 63.0, 55.0, 38.0, 31.0, 21.0, 14.0, 9.0, 16.0, 12.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.78125, -22.141845703125, -21.50244140625, -20.863037109375, -20.2236328125, -19.584228515625, -18.94482421875, -18.305419921875, -17.666015625, -17.026611328125, -16.38720703125, -15.747802734375, -15.1083984375, -14.468994140625, -13.82958984375, -13.190185546875, -12.55078125, -11.911376953125, -11.27197265625, -10.632568359375, -9.9931640625, -9.353759765625, -8.71435546875, -8.074951171875, -7.435546875, -6.796142578125, -6.15673828125, -5.517333984375, -4.8779296875, -4.238525390625, -3.59912109375, -2.959716796875, -2.3203125, -1.680908203125, -1.04150390625, -0.402099609375, 0.2373046875, 0.876708984375, 1.51611328125, 2.155517578125, 2.794921875, 3.434326171875, 4.07373046875, 4.713134765625, 5.3525390625, 5.991943359375, 6.63134765625, 7.270751953125, 7.91015625, 8.549560546875, 9.18896484375, 9.828369140625, 10.4677734375, 11.107177734375, 11.74658203125, 12.385986328125, 13.025390625, 13.664794921875, 14.30419921875, 14.943603515625, 15.5830078125, 16.222412109375, 16.86181640625, 17.501220703125, 18.140625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 10.0, 627.0, 377.0, 4.0, 0.0, 2.0], "bins": [-321.0364990234375, -315.677001953125, -310.3175048828125, -304.9580383300781, -299.5985412597656, -294.2390441894531, -288.87957763671875, -283.52008056640625, -278.16058349609375, -272.80108642578125, -267.44158935546875, -262.0821228027344, -256.7226257324219, -251.36312866210938, -246.00364685058594, -240.6441650390625, -235.28466796875, -229.9251708984375, -224.56568908691406, -219.20620727539062, -213.84671020507812, -208.48721313476562, -203.1277313232422, -197.76824951171875, -192.40875244140625, -187.04925537109375, -181.6897735595703, -176.33029174804688, -170.97079467773438, -165.61129760742188, -160.25181579589844, -154.892333984375, -149.53282165527344, -144.17333984375, -138.8138427734375, -133.454345703125, -128.09486389160156, -122.7353744506836, -117.37588500976562, -112.01639556884766, -106.65690612792969, -101.29741668701172, -95.93792724609375, -90.57843780517578, -85.21894836425781, -79.85945892333984, -74.49996948242188, -69.1404800415039, -63.78099060058594, -58.42150115966797, -53.06201171875, -47.70252227783203, -42.34303283691406, -36.983543395996094, -31.624053955078125, -26.264564514160156, -20.905075073242188, -15.545585632324219, -10.18609619140625, -4.826606750488281, 0.5328826904296875, 5.892372131347656, 11.251861572265625, 16.611351013183594, 21.970840454101562]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 9.0, 5.0, 3.0, 4.0, 11.0, 11.0, 11.0, 15.0, 17.0, 20.0, 17.0, 32.0, 24.0, 23.0, 17.0, 30.0, 31.0, 35.0, 44.0, 48.0, 29.0, 52.0, 37.0, 30.0, 34.0, 27.0, 38.0, 29.0, 27.0, 20.0, 35.0, 32.0, 31.0, 21.0, 25.0, 23.0, 16.0, 9.0, 11.0, 17.0, 16.0, 4.0, 9.0, 6.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.73444366455078, -17.103490829467773, -16.4725399017334, -15.84158706665039, -15.210634231567383, -14.579682350158691, -13.94873046875, -13.317777633666992, -12.6868257522583, -12.05587387084961, -11.424921035766602, -10.79396915435791, -10.163017272949219, -9.532064437866211, -8.90111255645752, -8.270160675048828, -7.63920783996582, -7.008255481719971, -6.377303123474121, -5.74635124206543, -5.11539888381958, -4.4844465255737305, -3.85349440574646, -3.2225422859191895, -2.59158992767334, -1.9606376886367798, -1.3296854496002197, -0.6987332105636597, -0.06778097152709961, 0.56317138671875, 1.1941235065460205, 1.825075626373291, 2.4560279846191406, 3.0869803428649902, 3.7179324626922607, 4.348884582519531, 4.979836940765381, 5.6107892990112305, 6.241741180419922, 6.8726935386657715, 7.503645896911621, 8.134597778320312, 8.76555061340332, 9.396502494812012, 10.027454376220703, 10.658407211303711, 11.289359092712402, 11.920310974121094, 12.551263809204102, 13.182215690612793, 13.8131685256958, 14.444120407104492, 15.0750732421875, 15.706025123596191, 16.336977005004883, 16.96792984008789, 17.598880767822266, 18.229833602905273, 18.86078453063965, 19.491737365722656, 20.122690200805664, 20.753643035888672, 21.384593963623047, 22.015546798706055, 22.646499633789062]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 5.0, 8.0, 11.0, 11.0, 15.0, 14.0, 13.0, 24.0, 22.0, 24.0, 33.0, 24.0, 22.0, 40.0, 41.0, 38.0, 41.0, 40.0, 47.0, 45.0, 28.0, 40.0, 27.0, 33.0, 43.0, 37.0, 40.0, 28.0, 34.0, 25.0, 25.0, 14.0, 10.0, 14.0, 13.0, 6.0, 10.0, 7.0, 10.0, 3.0, 5.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-2.326171875, -2.251739501953125, -2.17730712890625, -2.102874755859375, -2.0284423828125, -1.954010009765625, -1.87957763671875, -1.805145263671875, -1.730712890625, -1.656280517578125, -1.58184814453125, -1.507415771484375, -1.4329833984375, -1.358551025390625, -1.28411865234375, -1.209686279296875, -1.13525390625, -1.060821533203125, -0.98638916015625, -0.911956787109375, -0.8375244140625, -0.763092041015625, -0.68865966796875, -0.614227294921875, -0.539794921875, -0.465362548828125, -0.39093017578125, -0.316497802734375, -0.2420654296875, -0.167633056640625, -0.09320068359375, -0.018768310546875, 0.0556640625, 0.130096435546875, 0.20452880859375, 0.278961181640625, 0.3533935546875, 0.427825927734375, 0.50225830078125, 0.576690673828125, 0.651123046875, 0.725555419921875, 0.79998779296875, 0.874420166015625, 0.9488525390625, 1.023284912109375, 1.09771728515625, 1.172149658203125, 1.24658203125, 1.321014404296875, 1.39544677734375, 1.469879150390625, 1.5443115234375, 1.618743896484375, 1.69317626953125, 1.767608642578125, 1.842041015625, 1.916473388671875, 1.99090576171875, 2.065338134765625, 2.1397705078125, 2.214202880859375, 2.28863525390625, 2.363067626953125, 2.4375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 2.0, 7.0, 2.0, 7.0, 4.0, 6.0, 8.0, 11.0, 18.0, 14.0, 15.0, 18.0, 17.0, 29.0, 29.0, 40.0, 72.0, 169.0, 398.0, 1247.0, 4859.0, 27133.0, 239721.0, 2587714.0, 1220465.0, 94314.0, 13456.0, 2941.0, 843.0, 301.0, 121.0, 73.0, 49.0, 28.0, 31.0, 23.0, 11.0, 14.0, 12.0, 9.0, 7.0, 5.0, 8.0, 7.0, 1.0, 9.0, 7.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.34375, -8.0728759765625, -7.802001953125, -7.5311279296875, -7.26025390625, -6.9893798828125, -6.718505859375, -6.4476318359375, -6.1767578125, -5.9058837890625, -5.635009765625, -5.3641357421875, -5.09326171875, -4.8223876953125, -4.551513671875, -4.2806396484375, -4.009765625, -3.7388916015625, -3.468017578125, -3.1971435546875, -2.92626953125, -2.6553955078125, -2.384521484375, -2.1136474609375, -1.8427734375, -1.5718994140625, -1.301025390625, -1.0301513671875, -0.75927734375, -0.4884033203125, -0.217529296875, 0.0533447265625, 0.32421875, 0.5950927734375, 0.865966796875, 1.1368408203125, 1.40771484375, 1.6785888671875, 1.949462890625, 2.2203369140625, 2.4912109375, 2.7620849609375, 3.032958984375, 3.3038330078125, 3.57470703125, 3.8455810546875, 4.116455078125, 4.3873291015625, 4.658203125, 4.9290771484375, 5.199951171875, 5.4708251953125, 5.74169921875, 6.0125732421875, 6.283447265625, 6.5543212890625, 6.8251953125, 7.0960693359375, 7.366943359375, 7.6378173828125, 7.90869140625, 8.1795654296875, 8.450439453125, 8.7213134765625, 8.9921875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 5.0, 9.0, 7.0, 9.0, 14.0, 20.0, 29.0, 34.0, 48.0, 54.0, 76.0, 87.0, 123.0, 140.0, 222.0, 227.0, 297.0, 357.0, 385.0, 388.0, 353.0, 282.0, 198.0, 156.0, 142.0, 96.0, 65.0, 67.0, 44.0, 36.0, 27.0, 23.0, 19.0, 7.0, 9.0, 6.0, 5.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.43359375, -4.27349853515625, -4.1134033203125, -3.95330810546875, -3.793212890625, -3.63311767578125, -3.4730224609375, -3.31292724609375, -3.15283203125, -2.99273681640625, -2.8326416015625, -2.67254638671875, -2.512451171875, -2.35235595703125, -2.1922607421875, -2.03216552734375, -1.8720703125, -1.71197509765625, -1.5518798828125, -1.39178466796875, -1.231689453125, -1.07159423828125, -0.9114990234375, -0.75140380859375, -0.59130859375, -0.43121337890625, -0.2711181640625, -0.11102294921875, 0.049072265625, 0.20916748046875, 0.3692626953125, 0.52935791015625, 0.689453125, 0.84954833984375, 1.0096435546875, 1.16973876953125, 1.329833984375, 1.48992919921875, 1.6500244140625, 1.81011962890625, 1.97021484375, 2.13031005859375, 2.2904052734375, 2.45050048828125, 2.610595703125, 2.77069091796875, 2.9307861328125, 3.09088134765625, 3.2509765625, 3.41107177734375, 3.5711669921875, 3.73126220703125, 3.891357421875, 4.05145263671875, 4.2115478515625, 4.37164306640625, 4.53173828125, 4.69183349609375, 4.8519287109375, 5.01202392578125, 5.172119140625, 5.33221435546875, 5.4923095703125, 5.65240478515625, 5.8125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 11.0, 13.0, 10.0, 14.0, 28.0, 31.0, 43.0, 50.0, 66.0, 79.0, 104.0, 134.0, 186.0, 339.0, 688.0, 2233.0, 12044.0, 92964.0, 964973.0, 2733939.0, 341190.0, 36965.0, 5396.0, 1285.0, 492.0, 283.0, 165.0, 131.0, 85.0, 81.0, 57.0, 55.0, 36.0, 29.0, 20.0, 17.0, 11.0, 12.0, 4.0, 2.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-12.421875, -12.06982421875, -11.7177734375, -11.36572265625, -11.013671875, -10.66162109375, -10.3095703125, -9.95751953125, -9.60546875, -9.25341796875, -8.9013671875, -8.54931640625, -8.197265625, -7.84521484375, -7.4931640625, -7.14111328125, -6.7890625, -6.43701171875, -6.0849609375, -5.73291015625, -5.380859375, -5.02880859375, -4.6767578125, -4.32470703125, -3.97265625, -3.62060546875, -3.2685546875, -2.91650390625, -2.564453125, -2.21240234375, -1.8603515625, -1.50830078125, -1.15625, -0.80419921875, -0.4521484375, -0.10009765625, 0.251953125, 0.60400390625, 0.9560546875, 1.30810546875, 1.66015625, 2.01220703125, 2.3642578125, 2.71630859375, 3.068359375, 3.42041015625, 3.7724609375, 4.12451171875, 4.4765625, 4.82861328125, 5.1806640625, 5.53271484375, 5.884765625, 6.23681640625, 6.5888671875, 6.94091796875, 7.29296875, 7.64501953125, 7.9970703125, 8.34912109375, 8.701171875, 9.05322265625, 9.4052734375, 9.75732421875, 10.109375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 15.0, 23.0, 26.0, 58.0, 74.0, 127.0, 104.0, 130.0, 133.0, 99.0, 79.0, 51.0, 43.0, 15.0, 11.0, 10.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.18479537963867, -31.056053161621094, -29.927310943603516, -28.798568725585938, -27.66982650756836, -26.54108428955078, -25.41234016418457, -24.283597946166992, -23.154855728149414, -22.026113510131836, -20.897371292114258, -19.76862907409668, -18.63988494873047, -17.51114273071289, -16.382400512695312, -15.253658294677734, -14.124916076660156, -12.996173858642578, -11.867431640625, -10.738688468933105, -9.609946250915527, -8.48120403289795, -7.352461338043213, -6.223718643188477, -5.094976425170898, -3.966233968734741, -2.837491512298584, -1.7087490558624268, -0.5800065994262695, 0.5487356185913086, 1.677478313446045, 2.8062210083007812, 3.9349594116210938, 5.063701629638672, 6.192444324493408, 7.3211870193481445, 8.449929237365723, 9.5786714553833, 10.707414627075195, 11.836156845092773, 12.964899063110352, 14.09364128112793, 15.222383499145508, 16.351125717163086, 17.479869842529297, 18.608612060546875, 19.737354278564453, 20.86609649658203, 21.99483871459961, 23.123580932617188, 24.252323150634766, 25.381065368652344, 26.509807586669922, 27.6385498046875, 28.76729393005371, 29.89603614807129, 31.024778366088867, 32.15352249145508, 33.282264709472656, 34.411006927490234, 35.53974914550781, 36.66849136352539, 37.79723358154297, 38.92597579956055, 40.054718017578125]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 1.0, 3.0, 5.0, 3.0, 13.0, 12.0, 14.0, 10.0, 11.0, 19.0, 24.0, 27.0, 25.0, 36.0, 27.0, 40.0, 34.0, 33.0, 41.0, 39.0, 37.0, 30.0, 43.0, 38.0, 38.0, 35.0, 40.0, 43.0, 36.0, 30.0, 27.0, 26.0, 30.0, 16.0, 16.0, 17.0, 16.0, 13.0, 8.0, 14.0, 6.0, 3.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-18.091873168945312, -17.55296516418457, -17.01405906677246, -16.47515106201172, -15.93624496459961, -15.397336959838867, -14.858429908752441, -14.319522857666016, -13.78061580657959, -13.241708755493164, -12.702801704406738, -12.163894653320312, -11.62498664855957, -11.086080551147461, -10.547172546386719, -10.008265495300293, -9.469358444213867, -8.930451393127441, -8.391544342041016, -7.852636814117432, -7.313729763031006, -6.77482271194458, -6.235915184020996, -5.69700813293457, -5.1581010818481445, -4.619194030761719, -4.080286979675293, -3.541379451751709, -3.002472400665283, -2.4635653495788574, -1.9246580600738525, -1.3857507705688477, -0.8468437194824219, -0.30793654918670654, 0.2309706211090088, 0.7698777914047241, 1.3087849617004395, 1.8476920127868652, 2.38659930229187, 2.925506591796875, 3.464413642883301, 4.003320693969727, 4.542227745056152, 5.081135272979736, 5.620042324066162, 6.158949375152588, 6.697856903076172, 7.236763954162598, 7.775671005249023, 8.31457805633545, 8.853485107421875, 9.3923921585083, 9.931299209594727, 10.470207214355469, 11.009114265441895, 11.54802131652832, 12.086928367614746, 12.625835418701172, 13.164742469787598, 13.703649520874023, 14.242557525634766, 14.781463623046875, 15.320371627807617, 15.859278678894043, 16.39818572998047]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 9.0, 3.0, 8.0, 6.0, 7.0, 20.0, 9.0, 13.0, 11.0, 14.0, 22.0, 32.0, 25.0, 29.0, 37.0, 32.0, 44.0, 39.0, 36.0, 35.0, 42.0, 44.0, 47.0, 23.0, 37.0, 51.0, 36.0, 34.0, 32.0, 34.0, 29.0, 27.0, 29.0, 14.0, 17.0, 9.0, 8.0, 11.0, 11.0, 3.0, 7.0, 7.0, 1.0, 6.0, 6.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.259765625, -2.1829833984375, -2.106201171875, -2.0294189453125, -1.95263671875, -1.8758544921875, -1.799072265625, -1.7222900390625, -1.6455078125, -1.5687255859375, -1.491943359375, -1.4151611328125, -1.33837890625, -1.2615966796875, -1.184814453125, -1.1080322265625, -1.03125, -0.9544677734375, -0.877685546875, -0.8009033203125, -0.72412109375, -0.6473388671875, -0.570556640625, -0.4937744140625, -0.4169921875, -0.3402099609375, -0.263427734375, -0.1866455078125, -0.10986328125, -0.0330810546875, 0.043701171875, 0.1204833984375, 0.197265625, 0.2740478515625, 0.350830078125, 0.4276123046875, 0.50439453125, 0.5811767578125, 0.657958984375, 0.7347412109375, 0.8115234375, 0.8883056640625, 0.965087890625, 1.0418701171875, 1.11865234375, 1.1954345703125, 1.272216796875, 1.3489990234375, 1.42578125, 1.5025634765625, 1.579345703125, 1.6561279296875, 1.73291015625, 1.8096923828125, 1.886474609375, 1.9632568359375, 2.0400390625, 2.1168212890625, 2.193603515625, 2.2703857421875, 2.34716796875, 2.4239501953125, 2.500732421875, 2.5775146484375, 2.654296875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 10.0, 17.0, 28.0, 44.0, 70.0, 118.0, 109.0, 249.0, 318.0, 496.0, 622.0, 987.0, 1427.0, 2087.0, 2895.0, 4329.0, 6298.0, 9639.0, 14505.0, 22587.0, 35080.0, 58273.0, 102190.0, 238475.0, 267166.0, 111061.0, 61827.0, 37558.0, 23536.0, 15233.0, 10006.0, 6838.0, 4536.0, 3048.0, 2172.0, 1522.0, 977.0, 735.0, 467.0, 365.0, 209.0, 148.0, 107.0, 75.0, 40.0, 24.0, 20.0, 18.0, 2.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0133819580078125, -0.012951135635375977, -0.012520313262939453, -0.01208949089050293, -0.011658668518066406, -0.011227846145629883, -0.01079702377319336, -0.010366201400756836, -0.009935379028320312, -0.009504556655883789, -0.009073734283447266, -0.008642911911010742, -0.008212089538574219, -0.007781267166137695, -0.007350444793701172, -0.0069196224212646484, -0.006488800048828125, -0.0060579776763916016, -0.005627155303955078, -0.005196332931518555, -0.004765510559082031, -0.004334688186645508, -0.0039038658142089844, -0.003473043441772461, -0.0030422210693359375, -0.002611398696899414, -0.0021805763244628906, -0.0017497539520263672, -0.0013189315795898438, -0.0008881092071533203, -0.0004572868347167969, -2.6464462280273438e-05, 0.00040435791015625, 0.0008351802825927734, 0.0012660026550292969, 0.0016968250274658203, 0.0021276473999023438, 0.002558469772338867, 0.0029892921447753906, 0.003420114517211914, 0.0038509368896484375, 0.004281759262084961, 0.004712581634521484, 0.005143404006958008, 0.005574226379394531, 0.006005048751831055, 0.006435871124267578, 0.0068666934967041016, 0.007297515869140625, 0.0077283382415771484, 0.008159160614013672, 0.008589982986450195, 0.009020805358886719, 0.009451627731323242, 0.009882450103759766, 0.010313272476196289, 0.010744094848632812, 0.011174917221069336, 0.01160573959350586, 0.012036561965942383, 0.012467384338378906, 0.01289820671081543, 0.013329029083251953, 0.013759851455688477, 0.014190673828125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 5.0, 3.0, 1.0, 6.0, 10.0, 19.0, 11.0, 15.0, 22.0, 21.0, 29.0, 23.0, 21.0, 20.0, 43.0, 42.0, 39.0, 30.0, 51.0, 37.0, 1074.0, 48.0, 40.0, 40.0, 32.0, 35.0, 42.0, 33.0, 27.0, 22.0, 33.0, 25.0, 12.0, 18.0, 14.0, 16.0, 8.0, 10.0, 10.0, 7.0, 8.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.6298828125, -1.5752716064453125, -1.520660400390625, -1.4660491943359375, -1.41143798828125, -1.3568267822265625, -1.302215576171875, -1.2476043701171875, -1.1929931640625, -1.1383819580078125, -1.083770751953125, -1.0291595458984375, -0.97454833984375, -0.9199371337890625, -0.865325927734375, -0.8107147216796875, -0.756103515625, -0.7014923095703125, -0.646881103515625, -0.5922698974609375, -0.53765869140625, -0.4830474853515625, -0.428436279296875, -0.3738250732421875, -0.3192138671875, -0.2646026611328125, -0.209991455078125, -0.1553802490234375, -0.10076904296875, -0.0461578369140625, 0.008453369140625, 0.0630645751953125, 0.11767578125, 0.1722869873046875, 0.226898193359375, 0.2815093994140625, 0.33612060546875, 0.3907318115234375, 0.445343017578125, 0.4999542236328125, 0.5545654296875, 0.6091766357421875, 0.663787841796875, 0.7183990478515625, 0.77301025390625, 0.8276214599609375, 0.882232666015625, 0.9368438720703125, 0.991455078125, 1.0460662841796875, 1.100677490234375, 1.1552886962890625, 1.20989990234375, 1.2645111083984375, 1.319122314453125, 1.3737335205078125, 1.4283447265625, 1.4829559326171875, 1.537567138671875, 1.5921783447265625, 1.64678955078125, 1.7014007568359375, 1.756011962890625, 1.8106231689453125, 1.865234375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 6.0, 19.0, 11.0, 23.0, 37.0, 58.0, 95.0, 107.0, 170.0, 234.0, 411.0, 540.0, 815.0, 1137.0, 1874.0, 2752.0, 4167.0, 6462.0, 9792.0, 15690.0, 25251.0, 41462.0, 70228.0, 136787.0, 1358509.0, 196746.0, 89160.0, 51036.0, 30451.0, 18864.0, 11964.0, 7690.0, 4768.0, 3256.0, 2150.0, 1410.0, 951.0, 644.0, 436.0, 315.0, 217.0, 143.0, 90.0, 62.0, 37.0, 40.0, 20.0, 13.0, 13.0, 6.0, 5.0, 1.0, 3.0, 5.0, 3.0], "bins": [-0.01119232177734375, -0.010860204696655273, -0.010528087615966797, -0.01019597053527832, -0.009863853454589844, -0.009531736373901367, -0.00919961929321289, -0.008867502212524414, -0.008535385131835938, -0.008203268051147461, -0.007871150970458984, -0.007539033889770508, -0.007206916809082031, -0.006874799728393555, -0.006542682647705078, -0.0062105655670166016, -0.005878448486328125, -0.0055463314056396484, -0.005214214324951172, -0.004882097244262695, -0.004549980163574219, -0.004217863082885742, -0.0038857460021972656, -0.003553628921508789, -0.0032215118408203125, -0.002889394760131836, -0.0025572776794433594, -0.002225160598754883, -0.0018930435180664062, -0.0015609264373779297, -0.0012288093566894531, -0.0008966922760009766, -0.0005645751953125, -0.00023245811462402344, 9.965896606445312e-05, 0.0004317760467529297, 0.0007638931274414062, 0.0010960102081298828, 0.0014281272888183594, 0.001760244369506836, 0.0020923614501953125, 0.002424478530883789, 0.0027565956115722656, 0.003088712692260742, 0.0034208297729492188, 0.0037529468536376953, 0.004085063934326172, 0.0044171810150146484, 0.004749298095703125, 0.0050814151763916016, 0.005413532257080078, 0.005745649337768555, 0.006077766418457031, 0.006409883499145508, 0.006742000579833984, 0.007074117660522461, 0.0074062347412109375, 0.007738351821899414, 0.00807046890258789, 0.008402585983276367, 0.008734703063964844, 0.00906682014465332, 0.009398937225341797, 0.009731054306030273, 0.01006317138671875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 916.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.0], "bins": [-1.1920928955078125e-07, -1.1641532182693481e-07, -1.1362135410308838e-07, -1.1082738637924194e-07, -1.0803341865539551e-07, -1.0523945093154907e-07, -1.0244548320770264e-07, -9.96515154838562e-08, -9.685754776000977e-08, -9.406358003616333e-08, -9.12696123123169e-08, -8.847564458847046e-08, -8.568167686462402e-08, -8.288770914077759e-08, -8.009374141693115e-08, -7.729977369308472e-08, -7.450580596923828e-08, -7.171183824539185e-08, -6.891787052154541e-08, -6.612390279769897e-08, -6.332993507385254e-08, -6.05359673500061e-08, -5.774199962615967e-08, -5.494803190231323e-08, -5.21540641784668e-08, -4.936009645462036e-08, -4.6566128730773926e-08, -4.377216100692749e-08, -4.0978193283081055e-08, -3.818422555923462e-08, -3.5390257835388184e-08, -3.259629011154175e-08, -2.9802322387695312e-08, -2.7008354663848877e-08, -2.421438694000244e-08, -2.1420419216156006e-08, -1.862645149230957e-08, -1.5832483768463135e-08, -1.30385160446167e-08, -1.0244548320770264e-08, -7.450580596923828e-09, -4.6566128730773926e-09, -1.862645149230957e-09, 9.313225746154785e-10, 3.725290298461914e-09, 6.51925802230835e-09, 9.313225746154785e-09, 1.210719347000122e-08, 1.4901161193847656e-08, 1.7695128917694092e-08, 2.0489096641540527e-08, 2.3283064365386963e-08, 2.60770320892334e-08, 2.8870999813079834e-08, 3.166496753692627e-08, 3.4458935260772705e-08, 3.725290298461914e-08, 4.0046870708465576e-08, 4.284083843231201e-08, 4.563480615615845e-08, 4.842877388000488e-08, 5.122274160385132e-08, 5.4016709327697754e-08, 5.681067705154419e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [19.0, 1.0, 0.0, 6.0, 0.0, 1.0, 0.0, 29.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 28.0, 38.0, 63.0, 76.0, 0.0, 357.0, 3578.0, 25980.0, 988220.0, 26051.0, 3515.0, 342.0, 86.0, 0.0, 54.0, 41.0, 35.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.0, 0.0, 3.0, 0.0, 6.0, 0.0, 1.0, 13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-06, -1.1390075087547302e-06, -1.085922122001648e-06, -1.0328367352485657e-06, -9.797513484954834e-07, -9.266659617424011e-07, -8.735805749893188e-07, -8.204951882362366e-07, -7.674098014831543e-07, -7.14324414730072e-07, -6.612390279769897e-07, -6.081536412239075e-07, -5.550682544708252e-07, -5.019828677177429e-07, -4.4889748096466064e-07, -3.9581209421157837e-07, -3.427267074584961e-07, -2.896413207054138e-07, -2.3655593395233154e-07, -1.8347054719924927e-07, -1.30385160446167e-07, -7.729977369308472e-08, -2.421438694000244e-08, 2.8870999813079834e-08, 8.195638656616211e-08, 1.3504177331924438e-07, 1.8812716007232666e-07, 2.4121254682540894e-07, 2.942979335784912e-07, 3.473833203315735e-07, 4.0046870708465576e-07, 4.5355409383773804e-07, 5.066394805908203e-07, 5.597248673439026e-07, 6.128102540969849e-07, 6.658956408500671e-07, 7.189810276031494e-07, 7.720664143562317e-07, 8.25151801109314e-07, 8.782371878623962e-07, 9.313225746154785e-07, 9.844079613685608e-07, 1.037493348121643e-06, 1.0905787348747253e-06, 1.1436641216278076e-06, 1.1967495083808899e-06, 1.2498348951339722e-06, 1.3029202818870544e-06, 1.3560056686401367e-06, 1.409091055393219e-06, 1.4621764421463013e-06, 1.5152618288993835e-06, 1.5683472156524658e-06, 1.621432602405548e-06, 1.6745179891586304e-06, 1.7276033759117126e-06, 1.780688762664795e-06, 1.8337741494178772e-06, 1.8868595361709595e-06, 1.9399449229240417e-06, 1.993030309677124e-06, 2.0461156964302063e-06, 2.0992010831832886e-06, 2.152286469936371e-06, 2.205371856689453e-06]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1023.0], "bins": [-2.4395898634566038e-08, -2.4014711996755977e-08, -2.3633527135302757e-08, -2.3252340497492696e-08, -2.2871155636039475e-08, -2.2489968998229415e-08, -2.2108782360419355e-08, -2.1727597498966134e-08, -2.1346410861156073e-08, -2.0965224223346013e-08, -2.0584039361892792e-08, -2.020285272408273e-08, -1.982166786262951e-08, -1.944048122481945e-08, -1.905929636336623e-08, -1.867810972555617e-08, -1.829692308774611e-08, -1.7915736449936048e-08, -1.7534551588482827e-08, -1.7153364950672767e-08, -1.6772180089219546e-08, -1.6390993451409486e-08, -1.6009806813599425e-08, -1.5628621952146204e-08, -1.5247437090692983e-08, -1.4866251341061343e-08, -1.4485065591429702e-08, -1.4103878953619642e-08, -1.3722693203988001e-08, -1.334150745435636e-08, -1.296032170472472e-08, -1.257913595509308e-08, -1.2197949317283019e-08, -1.1816763567651378e-08, -1.1435577818019738e-08, -1.1054391180209677e-08, -1.0673205430578037e-08, -1.0292019680946396e-08, -9.910833931314755e-09, -9.529648181683115e-09, -9.148461543873054e-09, -8.767275794241414e-09, -8.386090044609773e-09, -8.004903406799713e-09, -7.623717657168072e-09, -7.242531907536431e-09, -6.861346157904791e-09, -6.48016040827315e-09, -6.0989746586415094e-09, -5.717788909009869e-09, -5.336602715289018e-09, -4.955416965657378e-09, -4.574230771936527e-09, -4.1930450223048865e-09, -3.811859272673246e-09, -3.4306733009970003e-09, -3.0494873293207547e-09, -2.668301357644509e-09, -2.2871153859682636e-09, -1.905929636336623e-09, -1.5247436646603774e-09, -1.1435576929841318e-09, -7.623719433524911e-10, -3.8118597167624557e-10, 0.0]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1023.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 9.313225746154785e-10, 1.862645149230957e-09, 2.7939677238464355e-09, 3.725290298461914e-09, 4.6566128730773926e-09, 5.587935447692871e-09, 6.51925802230835e-09, 7.450580596923828e-09, 8.381903171539307e-09, 9.313225746154785e-09, 1.0244548320770264e-08, 1.1175870895385742e-08, 1.210719347000122e-08, 1.30385160446167e-08, 1.3969838619232178e-08, 1.4901161193847656e-08, 1.5832483768463135e-08, 1.6763806343078613e-08, 1.7695128917694092e-08, 1.862645149230957e-08, 1.955777406692505e-08, 2.0489096641540527e-08, 2.1420419216156006e-08, 2.2351741790771484e-08, 2.3283064365386963e-08, 2.421438694000244e-08, 2.514570951461792e-08, 2.60770320892334e-08, 2.7008354663848877e-08, 2.7939677238464355e-08, 2.8870999813079834e-08, 2.9802322387695312e-08, 3.073364496231079e-08, 3.166496753692627e-08, 3.259629011154175e-08, 3.3527612686157227e-08, 3.4458935260772705e-08, 3.5390257835388184e-08, 3.632158041000366e-08, 3.725290298461914e-08, 3.818422555923462e-08, 3.91155481338501e-08, 4.0046870708465576e-08, 4.0978193283081055e-08, 4.190951585769653e-08, 4.284083843231201e-08, 4.377216100692749e-08, 4.470348358154297e-08, 4.563480615615845e-08, 4.6566128730773926e-08, 4.7497451305389404e-08, 4.842877388000488e-08, 4.936009645462036e-08, 5.029141902923584e-08, 5.122274160385132e-08, 5.21540641784668e-08, 5.3085386753082275e-08, 5.4016709327697754e-08, 5.494803190231323e-08, 5.587935447692871e-08, 5.681067705154419e-08, 5.774199962615967e-08, 5.8673322200775146e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 9.0, 3.0, 8.0, 6.0, 7.0, 20.0, 9.0, 13.0, 11.0, 14.0, 22.0, 32.0, 25.0, 29.0, 37.0, 32.0, 44.0, 39.0, 36.0, 35.0, 42.0, 44.0, 47.0, 23.0, 37.0, 51.0, 36.0, 34.0, 32.0, 34.0, 29.0, 27.0, 29.0, 14.0, 17.0, 9.0, 8.0, 11.0, 11.0, 3.0, 7.0, 7.0, 1.0, 6.0, 6.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.259765625, -2.1829833984375, -2.106201171875, -2.0294189453125, -1.95263671875, -1.8758544921875, -1.799072265625, -1.7222900390625, -1.6455078125, -1.5687255859375, -1.491943359375, -1.4151611328125, -1.33837890625, -1.2615966796875, -1.184814453125, -1.1080322265625, -1.03125, -0.9544677734375, -0.877685546875, -0.8009033203125, -0.72412109375, -0.6473388671875, -0.570556640625, -0.4937744140625, -0.4169921875, -0.3402099609375, -0.263427734375, -0.1866455078125, -0.10986328125, -0.0330810546875, 0.043701171875, 0.1204833984375, 0.197265625, 0.2740478515625, 0.350830078125, 0.4276123046875, 0.50439453125, 0.5811767578125, 0.657958984375, 0.7347412109375, 0.8115234375, 0.8883056640625, 0.965087890625, 1.0418701171875, 1.11865234375, 1.1954345703125, 1.272216796875, 1.3489990234375, 1.42578125, 1.5025634765625, 1.579345703125, 1.6561279296875, 1.73291015625, 1.8096923828125, 1.886474609375, 1.9632568359375, 2.0400390625, 2.1168212890625, 2.193603515625, 2.2703857421875, 2.34716796875, 2.4239501953125, 2.500732421875, 2.5775146484375, 2.654296875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 5.0, 8.0, 14.0, 25.0, 49.0, 63.0, 97.0, 187.0, 361.0, 562.0, 1029.0, 1795.0, 3323.0, 6017.0, 11507.0, 21801.0, 41989.0, 81398.0, 197352.0, 430352.0, 123197.0, 60115.0, 31633.0, 16352.0, 8778.0, 4704.0, 2636.0, 1363.0, 772.0, 457.0, 252.0, 166.0, 83.0, 48.0, 24.0, 21.0, 9.0, 10.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.55078125, -2.457275390625, -2.36376953125, -2.270263671875, -2.1767578125, -2.083251953125, -1.98974609375, -1.896240234375, -1.802734375, -1.709228515625, -1.61572265625, -1.522216796875, -1.4287109375, -1.335205078125, -1.24169921875, -1.148193359375, -1.0546875, -0.961181640625, -0.86767578125, -0.774169921875, -0.6806640625, -0.587158203125, -0.49365234375, -0.400146484375, -0.306640625, -0.213134765625, -0.11962890625, -0.026123046875, 0.0673828125, 0.160888671875, 0.25439453125, 0.347900390625, 0.44140625, 0.534912109375, 0.62841796875, 0.721923828125, 0.8154296875, 0.908935546875, 1.00244140625, 1.095947265625, 1.189453125, 1.282958984375, 1.37646484375, 1.469970703125, 1.5634765625, 1.656982421875, 1.75048828125, 1.843994140625, 1.9375, 2.031005859375, 2.12451171875, 2.218017578125, 2.3115234375, 2.405029296875, 2.49853515625, 2.592041015625, 2.685546875, 2.779052734375, 2.87255859375, 2.966064453125, 3.0595703125, 3.153076171875, 3.24658203125, 3.340087890625, 3.43359375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 4.0, 2.0, 3.0, 4.0, 10.0, 9.0, 8.0, 3.0, 4.0, 8.0, 16.0, 22.0, 17.0, 21.0, 26.0, 32.0, 25.0, 47.0, 45.0, 53.0, 56.0, 74.0, 141.0, 1461.0, 372.0, 123.0, 79.0, 56.0, 46.0, 42.0, 33.0, 29.0, 31.0, 32.0, 32.0, 24.0, 11.0, 12.0, 9.0, 7.0, 4.0, 3.0, 5.0, 2.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.921875, -9.64581298828125, -9.3697509765625, -9.09368896484375, -8.817626953125, -8.54156494140625, -8.2655029296875, -7.98944091796875, -7.71337890625, -7.43731689453125, -7.1612548828125, -6.88519287109375, -6.609130859375, -6.33306884765625, -6.0570068359375, -5.78094482421875, -5.5048828125, -5.22882080078125, -4.9527587890625, -4.67669677734375, -4.400634765625, -4.12457275390625, -3.8485107421875, -3.57244873046875, -3.29638671875, -3.02032470703125, -2.7442626953125, -2.46820068359375, -2.192138671875, -1.91607666015625, -1.6400146484375, -1.36395263671875, -1.087890625, -0.81182861328125, -0.5357666015625, -0.25970458984375, 0.016357421875, 0.29241943359375, 0.5684814453125, 0.84454345703125, 1.12060546875, 1.39666748046875, 1.6727294921875, 1.94879150390625, 2.224853515625, 2.50091552734375, 2.7769775390625, 3.05303955078125, 3.3291015625, 3.60516357421875, 3.8812255859375, 4.15728759765625, 4.433349609375, 4.70941162109375, 4.9854736328125, 5.26153564453125, 5.53759765625, 5.81365966796875, 6.0897216796875, 6.36578369140625, 6.641845703125, 6.91790771484375, 7.1939697265625, 7.47003173828125, 7.74609375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 7.0, 1.0, 4.0, 3.0, 1.0, 4.0, 8.0, 7.0, 6.0, 14.0, 22.0, 21.0, 46.0, 51.0, 61.0, 83.0, 104.0, 139.0, 214.0, 349.0, 1063.0, 11363.0, 735154.0, 2375581.0, 18699.0, 1408.0, 395.0, 228.0, 178.0, 112.0, 86.0, 62.0, 53.0, 38.0, 34.0, 27.0, 18.0, 13.0, 13.0, 5.0, 6.0, 12.0, 5.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.3125, -14.7470703125, -14.181640625, -13.6162109375, -13.05078125, -12.4853515625, -11.919921875, -11.3544921875, -10.7890625, -10.2236328125, -9.658203125, -9.0927734375, -8.52734375, -7.9619140625, -7.396484375, -6.8310546875, -6.265625, -5.7001953125, -5.134765625, -4.5693359375, -4.00390625, -3.4384765625, -2.873046875, -2.3076171875, -1.7421875, -1.1767578125, -0.611328125, -0.0458984375, 0.51953125, 1.0849609375, 1.650390625, 2.2158203125, 2.78125, 3.3466796875, 3.912109375, 4.4775390625, 5.04296875, 5.6083984375, 6.173828125, 6.7392578125, 7.3046875, 7.8701171875, 8.435546875, 9.0009765625, 9.56640625, 10.1318359375, 10.697265625, 11.2626953125, 11.828125, 12.3935546875, 12.958984375, 13.5244140625, 14.08984375, 14.6552734375, 15.220703125, 15.7861328125, 16.3515625, 16.9169921875, 17.482421875, 18.0478515625, 18.61328125, 19.1787109375, 19.744140625, 20.3095703125, 20.875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 113.0, 800.0, 101.0, 4.0], "bins": [-266.6261291503906, -262.2872619628906, -257.9483947753906, -253.60952758789062, -249.27066040039062, -244.93177795410156, -240.59291076660156, -236.25404357910156, -231.91517639160156, -227.57630920410156, -223.23744201660156, -218.89857482910156, -214.5596923828125, -210.2208251953125, -205.8819580078125, -201.5430908203125, -197.2042236328125, -192.8653564453125, -188.5264892578125, -184.1876220703125, -179.8487548828125, -175.50987243652344, -171.17100524902344, -166.83213806152344, -162.49327087402344, -158.15440368652344, -153.81553649902344, -149.47666931152344, -145.13778686523438, -140.79891967773438, -136.46005249023438, -132.12118530273438, -127.78233337402344, -123.44346618652344, -119.10459899902344, -114.7657241821289, -110.4268569946289, -106.0879898071289, -101.74911499023438, -97.41024780273438, -93.07138061523438, -88.73251342773438, -84.39364624023438, -80.05477142333984, -75.71590423583984, -71.37703704833984, -67.03816223144531, -62.69929504394531, -58.36042785644531, -54.02156066894531, -49.68268966674805, -45.34381866455078, -41.00495147705078, -36.66608428955078, -32.327213287353516, -27.988344192504883, -23.64947509765625, -19.310606002807617, -14.971736907958984, -10.632867813110352, -6.293998718261719, -1.955129623413086, 2.383739471435547, 6.72260856628418, 11.061477661132812]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 7.0, 8.0, 7.0, 13.0, 12.0, 10.0, 14.0, 16.0, 18.0, 20.0, 32.0, 22.0, 31.0, 36.0, 32.0, 38.0, 36.0, 43.0, 39.0, 33.0, 32.0, 36.0, 35.0, 34.0, 46.0, 35.0, 37.0, 26.0, 33.0, 25.0, 26.0, 18.0, 19.0, 22.0, 14.0, 18.0, 10.0, 8.0, 13.0, 7.0, 10.0, 2.0, 9.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.844926834106445, -24.092288970947266, -23.339649200439453, -22.58700942993164, -21.83437156677246, -21.08173370361328, -20.32909393310547, -19.576454162597656, -18.823816299438477, -18.071178436279297, -17.318538665771484, -16.565898895263672, -15.813261032104492, -15.060622215270996, -14.3079833984375, -13.555344581604004, -12.802705764770508, -12.050066947937012, -11.297428131103516, -10.54478931427002, -9.792150497436523, -9.039511680603027, -8.286872863769531, -7.534234046936035, -6.781595230102539, -6.028956413269043, -5.276317596435547, -4.523678779602051, -3.7710399627685547, -3.0184011459350586, -2.2657623291015625, -1.5131235122680664, -0.7604827880859375, -0.007843971252441406, 0.7447948455810547, 1.4974336624145508, 2.250072479248047, 3.002711296081543, 3.755350112915039, 4.507988929748535, 5.260627746582031, 6.013266563415527, 6.765905380249023, 7.5185441970825195, 8.271183013916016, 9.023821830749512, 9.776460647583008, 10.529099464416504, 11.28173828125, 12.034377098083496, 12.787015914916992, 13.539654731750488, 14.292293548583984, 15.04493236541748, 15.797571182250977, 16.550209045410156, 17.30284881591797, 18.05548858642578, 18.80812644958496, 19.56076431274414, 20.313404083251953, 21.066043853759766, 21.818681716918945, 22.571319580078125, 23.323959350585938]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 9.0, 4.0, 8.0, 13.0, 11.0, 6.0, 7.0, 14.0, 18.0, 15.0, 17.0, 23.0, 39.0, 30.0, 37.0, 34.0, 31.0, 36.0, 39.0, 39.0, 30.0, 38.0, 45.0, 46.0, 34.0, 40.0, 35.0, 31.0, 30.0, 18.0, 40.0, 27.0, 25.0, 23.0, 24.0, 17.0, 12.0, 6.0, 9.0, 10.0, 7.0, 3.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.361328125, -2.2818603515625, -2.202392578125, -2.1229248046875, -2.04345703125, -1.9639892578125, -1.884521484375, -1.8050537109375, -1.7255859375, -1.6461181640625, -1.566650390625, -1.4871826171875, -1.40771484375, -1.3282470703125, -1.248779296875, -1.1693115234375, -1.08984375, -1.0103759765625, -0.930908203125, -0.8514404296875, -0.77197265625, -0.6925048828125, -0.613037109375, -0.5335693359375, -0.4541015625, -0.3746337890625, -0.295166015625, -0.2156982421875, -0.13623046875, -0.0567626953125, 0.022705078125, 0.1021728515625, 0.181640625, 0.2611083984375, 0.340576171875, 0.4200439453125, 0.49951171875, 0.5789794921875, 0.658447265625, 0.7379150390625, 0.8173828125, 0.8968505859375, 0.976318359375, 1.0557861328125, 1.13525390625, 1.2147216796875, 1.294189453125, 1.3736572265625, 1.453125, 1.5325927734375, 1.612060546875, 1.6915283203125, 1.77099609375, 1.8504638671875, 1.929931640625, 2.0093994140625, 2.0888671875, 2.1683349609375, 2.247802734375, 2.3272705078125, 2.40673828125, 2.4862060546875, 2.565673828125, 2.6451416015625, 2.724609375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 13.0, 7.0, 11.0, 9.0, 12.0, 15.0, 9.0, 25.0, 30.0, 42.0, 46.0, 64.0, 126.0, 222.0, 447.0, 1253.0, 3876.0, 15484.0, 85891.0, 790957.0, 2676925.0, 536980.0, 63938.0, 12416.0, 3241.0, 1099.0, 496.0, 221.0, 129.0, 77.0, 61.0, 29.0, 23.0, 18.0, 16.0, 14.0, 10.0, 5.0, 10.0, 6.0, 2.0, 4.0, 6.0, 2.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.140625, -6.9058837890625, -6.671142578125, -6.4364013671875, -6.20166015625, -5.9669189453125, -5.732177734375, -5.4974365234375, -5.2626953125, -5.0279541015625, -4.793212890625, -4.5584716796875, -4.32373046875, -4.0889892578125, -3.854248046875, -3.6195068359375, -3.384765625, -3.1500244140625, -2.915283203125, -2.6805419921875, -2.44580078125, -2.2110595703125, -1.976318359375, -1.7415771484375, -1.5068359375, -1.2720947265625, -1.037353515625, -0.8026123046875, -0.56787109375, -0.3331298828125, -0.098388671875, 0.1363525390625, 0.37109375, 0.6058349609375, 0.840576171875, 1.0753173828125, 1.31005859375, 1.5447998046875, 1.779541015625, 2.0142822265625, 2.2490234375, 2.4837646484375, 2.718505859375, 2.9532470703125, 3.18798828125, 3.4227294921875, 3.657470703125, 3.8922119140625, 4.126953125, 4.3616943359375, 4.596435546875, 4.8311767578125, 5.06591796875, 5.3006591796875, 5.535400390625, 5.7701416015625, 6.0048828125, 6.2396240234375, 6.474365234375, 6.7091064453125, 6.94384765625, 7.1785888671875, 7.413330078125, 7.6480712890625, 7.8828125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 5.0, 10.0, 13.0, 24.0, 30.0, 28.0, 41.0, 53.0, 67.0, 102.0, 139.0, 192.0, 246.0, 319.0, 372.0, 444.0, 455.0, 360.0, 272.0, 254.0, 172.0, 133.0, 93.0, 78.0, 40.0, 36.0, 24.0, 21.0, 18.0, 11.0, 10.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.67578125, -5.49169921875, -5.3076171875, -5.12353515625, -4.939453125, -4.75537109375, -4.5712890625, -4.38720703125, -4.203125, -4.01904296875, -3.8349609375, -3.65087890625, -3.466796875, -3.28271484375, -3.0986328125, -2.91455078125, -2.73046875, -2.54638671875, -2.3623046875, -2.17822265625, -1.994140625, -1.81005859375, -1.6259765625, -1.44189453125, -1.2578125, -1.07373046875, -0.8896484375, -0.70556640625, -0.521484375, -0.33740234375, -0.1533203125, 0.03076171875, 0.21484375, 0.39892578125, 0.5830078125, 0.76708984375, 0.951171875, 1.13525390625, 1.3193359375, 1.50341796875, 1.6875, 1.87158203125, 2.0556640625, 2.23974609375, 2.423828125, 2.60791015625, 2.7919921875, 2.97607421875, 3.16015625, 3.34423828125, 3.5283203125, 3.71240234375, 3.896484375, 4.08056640625, 4.2646484375, 4.44873046875, 4.6328125, 4.81689453125, 5.0009765625, 5.18505859375, 5.369140625, 5.55322265625, 5.7373046875, 5.92138671875, 6.10546875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 4.0, 14.0, 21.0, 16.0, 31.0, 31.0, 46.0, 83.0, 123.0, 146.0, 230.0, 333.0, 625.0, 3511.0, 106962.0, 3537351.0, 531688.0, 10913.0, 923.0, 375.0, 248.0, 158.0, 126.0, 83.0, 55.0, 45.0, 45.0, 30.0, 26.0, 11.0, 12.0, 8.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.765625, -21.13818359375, -20.5107421875, -19.88330078125, -19.255859375, -18.62841796875, -18.0009765625, -17.37353515625, -16.74609375, -16.11865234375, -15.4912109375, -14.86376953125, -14.236328125, -13.60888671875, -12.9814453125, -12.35400390625, -11.7265625, -11.09912109375, -10.4716796875, -9.84423828125, -9.216796875, -8.58935546875, -7.9619140625, -7.33447265625, -6.70703125, -6.07958984375, -5.4521484375, -4.82470703125, -4.197265625, -3.56982421875, -2.9423828125, -2.31494140625, -1.6875, -1.06005859375, -0.4326171875, 0.19482421875, 0.822265625, 1.44970703125, 2.0771484375, 2.70458984375, 3.33203125, 3.95947265625, 4.5869140625, 5.21435546875, 5.841796875, 6.46923828125, 7.0966796875, 7.72412109375, 8.3515625, 8.97900390625, 9.6064453125, 10.23388671875, 10.861328125, 11.48876953125, 12.1162109375, 12.74365234375, 13.37109375, 13.99853515625, 14.6259765625, 15.25341796875, 15.880859375, 16.50830078125, 17.1357421875, 17.76318359375, 18.390625]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 12.0, 73.0, 234.0, 379.0, 233.0, 75.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.6937713623047, -125.3545913696289, -122.01541137695312, -118.67623138427734, -115.33705139160156, -111.99787139892578, -108.65869140625, -105.31951904296875, -101.98033142089844, -98.64115142822266, -95.30197143554688, -91.9627914428711, -88.62361145019531, -85.28443145751953, -81.94525146484375, -78.6060791015625, -75.26689910888672, -71.92771911621094, -68.58853912353516, -65.24935913085938, -61.910179138183594, -58.57099914550781, -55.2318229675293, -51.892642974853516, -48.553462982177734, -45.21428298950195, -41.87510299682617, -38.535926818847656, -35.196746826171875, -31.85756492614746, -28.518386840820312, -25.17920684814453, -21.84003448486328, -18.5008544921875, -15.161675453186035, -11.82249641418457, -8.483316421508789, -5.144136428833008, -1.8049583435058594, 1.5342216491699219, 4.873401641845703, 8.212581634521484, 11.55176067352295, 14.890939712524414, 18.230119705200195, 21.569299697875977, 24.908477783203125, 28.247657775878906, 31.586837768554688, 34.92601776123047, 38.26519775390625, 41.60437774658203, 44.94355773925781, 48.282737731933594, 51.62191390991211, 54.96109390258789, 58.30027389526367, 61.63945388793945, 64.97863006591797, 68.31781005859375, 71.65699005126953, 74.99617004394531, 78.3353500366211, 81.67453002929688, 85.01371002197266]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 5.0, 8.0, 7.0, 6.0, 8.0, 8.0, 10.0, 19.0, 13.0, 9.0, 12.0, 26.0, 22.0, 29.0, 21.0, 29.0, 23.0, 29.0, 21.0, 30.0, 35.0, 34.0, 45.0, 42.0, 38.0, 33.0, 39.0, 41.0, 47.0, 21.0, 33.0, 30.0, 28.0, 32.0, 21.0, 20.0, 19.0, 12.0, 15.0, 13.0, 9.0, 11.0, 5.0, 7.0, 7.0, 12.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-15.971534729003906, -15.46187686920166, -14.952219009399414, -14.442560195922852, -13.932902336120605, -13.42324447631836, -12.913585662841797, -12.40392780303955, -11.894269943237305, -11.384612083435059, -10.874954223632812, -10.36529541015625, -9.855637550354004, -9.345979690551758, -8.836320877075195, -8.32666301727295, -7.817005157470703, -7.307347297668457, -6.797688961029053, -6.288030624389648, -5.778372764587402, -5.268714904785156, -4.759056568145752, -4.249398231506348, -3.7397403717041016, -3.2300822734832764, -2.720424175262451, -2.210766077041626, -1.7011079788208008, -1.1914498805999756, -0.6817917823791504, -0.1721336841583252, 0.3375244140625, 0.8471825122833252, 1.3568406105041504, 1.8664987087249756, 2.376156806945801, 2.885814905166626, 3.395473003387451, 3.9051311016082764, 4.414789199829102, 4.924447059631348, 5.434105396270752, 5.943763732910156, 6.453421592712402, 6.963079452514648, 7.472737789154053, 7.982396125793457, 8.492053985595703, 9.00171184539795, 9.511369705200195, 10.021028518676758, 10.530686378479004, 11.04034423828125, 11.550003051757812, 12.059660911560059, 12.569318771362305, 13.07897663116455, 13.588634490966797, 14.09829330444336, 14.607951164245605, 15.117609024047852, 15.627267837524414, 16.136924743652344, 16.646583557128906]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 4.0, 8.0, 8.0, 4.0, 12.0, 9.0, 15.0, 13.0, 16.0, 19.0, 24.0, 19.0, 32.0, 30.0, 34.0, 36.0, 45.0, 38.0, 33.0, 43.0, 50.0, 41.0, 43.0, 42.0, 37.0, 36.0, 39.0, 36.0, 30.0, 36.0, 30.0, 26.0, 18.0, 21.0, 15.0, 10.0, 7.0, 10.0, 7.0, 5.0, 4.0, 5.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.51953125, -2.436309814453125, -2.35308837890625, -2.269866943359375, -2.1866455078125, -2.103424072265625, -2.02020263671875, -1.936981201171875, -1.853759765625, -1.770538330078125, -1.68731689453125, -1.604095458984375, -1.5208740234375, -1.437652587890625, -1.35443115234375, -1.271209716796875, -1.18798828125, -1.104766845703125, -1.02154541015625, -0.938323974609375, -0.8551025390625, -0.771881103515625, -0.68865966796875, -0.605438232421875, -0.522216796875, -0.438995361328125, -0.35577392578125, -0.272552490234375, -0.1893310546875, -0.106109619140625, -0.02288818359375, 0.060333251953125, 0.1435546875, 0.226776123046875, 0.30999755859375, 0.393218994140625, 0.4764404296875, 0.559661865234375, 0.64288330078125, 0.726104736328125, 0.809326171875, 0.892547607421875, 0.97576904296875, 1.058990478515625, 1.1422119140625, 1.225433349609375, 1.30865478515625, 1.391876220703125, 1.47509765625, 1.558319091796875, 1.64154052734375, 1.724761962890625, 1.8079833984375, 1.891204833984375, 1.97442626953125, 2.057647705078125, 2.140869140625, 2.224090576171875, 2.30731201171875, 2.390533447265625, 2.4737548828125, 2.556976318359375, 2.64019775390625, 2.723419189453125, 2.806640625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 7.0, 5.0, 9.0, 19.0, 35.0, 29.0, 49.0, 83.0, 106.0, 143.0, 230.0, 335.0, 465.0, 750.0, 1063.0, 1589.0, 2379.0, 3690.0, 5789.0, 9255.0, 14929.0, 24838.0, 42883.0, 79056.0, 168009.0, 350266.0, 159941.0, 76681.0, 41970.0, 24190.0, 14406.0, 8832.0, 5615.0, 3643.0, 2362.0, 1638.0, 1047.0, 711.0, 480.0, 327.0, 243.0, 140.0, 108.0, 75.0, 41.0, 28.0, 25.0, 15.0, 10.0, 6.0, 7.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01617431640625, -0.015676259994506836, -0.015178203582763672, -0.014680147171020508, -0.014182090759277344, -0.01368403434753418, -0.013185977935791016, -0.012687921524047852, -0.012189865112304688, -0.011691808700561523, -0.01119375228881836, -0.010695695877075195, -0.010197639465332031, -0.009699583053588867, -0.009201526641845703, -0.008703470230102539, -0.008205413818359375, -0.007707357406616211, -0.007209300994873047, -0.006711244583129883, -0.006213188171386719, -0.005715131759643555, -0.005217075347900391, -0.0047190189361572266, -0.0042209625244140625, -0.0037229061126708984, -0.0032248497009277344, -0.0027267932891845703, -0.0022287368774414062, -0.0017306804656982422, -0.0012326240539550781, -0.0007345676422119141, -0.00023651123046875, 0.00026154518127441406, 0.0007596015930175781, 0.0012576580047607422, 0.0017557144165039062, 0.0022537708282470703, 0.0027518272399902344, 0.0032498836517333984, 0.0037479400634765625, 0.0042459964752197266, 0.004744052886962891, 0.005242109298706055, 0.005740165710449219, 0.006238222122192383, 0.006736278533935547, 0.007234334945678711, 0.007732391357421875, 0.008230447769165039, 0.008728504180908203, 0.009226560592651367, 0.009724617004394531, 0.010222673416137695, 0.01072072982788086, 0.011218786239624023, 0.011716842651367188, 0.012214899063110352, 0.012712955474853516, 0.01321101188659668, 0.013709068298339844, 0.014207124710083008, 0.014705181121826172, 0.015203237533569336, 0.0157012939453125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 10.0, 11.0, 12.0, 17.0, 9.0, 20.0, 13.0, 34.0, 21.0, 31.0, 20.0, 39.0, 35.0, 28.0, 39.0, 35.0, 38.0, 35.0, 1062.0, 37.0, 48.0, 44.0, 42.0, 33.0, 26.0, 31.0, 42.0, 40.0, 28.0, 26.0, 19.0, 24.0, 12.0, 19.0, 6.0, 9.0, 11.0, 7.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.806640625, -1.7514190673828125, -1.696197509765625, -1.6409759521484375, -1.58575439453125, -1.5305328369140625, -1.475311279296875, -1.4200897216796875, -1.3648681640625, -1.3096466064453125, -1.254425048828125, -1.1992034912109375, -1.14398193359375, -1.0887603759765625, -1.033538818359375, -0.9783172607421875, -0.923095703125, -0.8678741455078125, -0.812652587890625, -0.7574310302734375, -0.70220947265625, -0.6469879150390625, -0.591766357421875, -0.5365447998046875, -0.4813232421875, -0.4261016845703125, -0.370880126953125, -0.3156585693359375, -0.26043701171875, -0.2052154541015625, -0.149993896484375, -0.0947723388671875, -0.03955078125, 0.0156707763671875, 0.070892333984375, 0.1261138916015625, 0.18133544921875, 0.2365570068359375, 0.291778564453125, 0.3470001220703125, 0.4022216796875, 0.4574432373046875, 0.512664794921875, 0.5678863525390625, 0.62310791015625, 0.6783294677734375, 0.733551025390625, 0.7887725830078125, 0.843994140625, 0.8992156982421875, 0.954437255859375, 1.0096588134765625, 1.06488037109375, 1.1201019287109375, 1.175323486328125, 1.2305450439453125, 1.2857666015625, 1.3409881591796875, 1.396209716796875, 1.4514312744140625, 1.50665283203125, 1.5618743896484375, 1.617095947265625, 1.6723175048828125, 1.7275390625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 14.0, 11.0, 24.0, 33.0, 50.0, 71.0, 122.0, 187.0, 265.0, 399.0, 563.0, 982.0, 1543.0, 2188.0, 3621.0, 5786.0, 9224.0, 15008.0, 24491.0, 40315.0, 67074.0, 123018.0, 1316240.0, 227594.0, 104741.0, 59905.0, 35452.0, 22248.0, 13300.0, 8323.0, 5233.0, 3255.0, 2016.0, 1365.0, 868.0, 543.0, 353.0, 229.0, 166.0, 110.0, 62.0, 46.0, 31.0, 18.0, 18.0, 10.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0105743408203125, -0.010242700576782227, -0.009911060333251953, -0.00957942008972168, -0.009247779846191406, -0.008916139602661133, -0.00858449935913086, -0.008252859115600586, -0.007921218872070312, -0.007589578628540039, -0.007257938385009766, -0.006926298141479492, -0.006594657897949219, -0.006263017654418945, -0.005931377410888672, -0.0055997371673583984, -0.005268096923828125, -0.0049364566802978516, -0.004604816436767578, -0.004273176193237305, -0.003941535949707031, -0.003609895706176758, -0.0032782554626464844, -0.002946615219116211, -0.0026149749755859375, -0.002283334732055664, -0.0019516944885253906, -0.0016200542449951172, -0.0012884140014648438, -0.0009567737579345703, -0.0006251335144042969, -0.00029349327087402344, 3.814697265625e-05, 0.00036978721618652344, 0.0007014274597167969, 0.0010330677032470703, 0.0013647079467773438, 0.0016963481903076172, 0.0020279884338378906, 0.002359628677368164, 0.0026912689208984375, 0.003022909164428711, 0.0033545494079589844, 0.003686189651489258, 0.004017829895019531, 0.004349470138549805, 0.004681110382080078, 0.0050127506256103516, 0.005344390869140625, 0.0056760311126708984, 0.006007671356201172, 0.006339311599731445, 0.006670951843261719, 0.007002592086791992, 0.007334232330322266, 0.007665872573852539, 0.007997512817382812, 0.008329153060913086, 0.00866079330444336, 0.008992433547973633, 0.009324073791503906, 0.00965571403503418, 0.009987354278564453, 0.010318994522094727, 0.010650634765625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 920.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-07, -1.1455267667770386e-07, -1.0989606380462646e-07, -1.0523945093154907e-07, -1.0058283805847168e-07, -9.592622518539429e-08, -9.12696123123169e-08, -8.66129994392395e-08, -8.195638656616211e-08, -7.729977369308472e-08, -7.264316082000732e-08, -6.798654794692993e-08, -6.332993507385254e-08, -5.8673322200775146e-08, -5.4016709327697754e-08, -4.936009645462036e-08, -4.470348358154297e-08, -4.0046870708465576e-08, -3.5390257835388184e-08, -3.073364496231079e-08, -2.60770320892334e-08, -2.1420419216156006e-08, -1.6763806343078613e-08, -1.210719347000122e-08, -7.450580596923828e-09, -2.7939677238464355e-09, 1.862645149230957e-09, 6.51925802230835e-09, 1.1175870895385742e-08, 1.5832483768463135e-08, 2.0489096641540527e-08, 2.514570951461792e-08, 2.9802322387695312e-08, 3.4458935260772705e-08, 3.91155481338501e-08, 4.377216100692749e-08, 4.842877388000488e-08, 5.3085386753082275e-08, 5.774199962615967e-08, 6.239861249923706e-08, 6.705522537231445e-08, 7.171183824539185e-08, 7.636845111846924e-08, 8.102506399154663e-08, 8.568167686462402e-08, 9.033828973770142e-08, 9.499490261077881e-08, 9.96515154838562e-08, 1.043081283569336e-07, 1.0896474123001099e-07, 1.1362135410308838e-07, 1.1827796697616577e-07, 1.2293457984924316e-07, 1.2759119272232056e-07, 1.3224780559539795e-07, 1.3690441846847534e-07, 1.4156103134155273e-07, 1.4621764421463013e-07, 1.5087425708770752e-07, 1.555308699607849e-07, 1.601874828338623e-07, 1.648440957069397e-07, 1.695007085800171e-07, 1.7415732145309448e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0, 4.0, 5.0, 8.0, 0.0, 28.0, 0.0, 2.0, 6.0, 45.0, 56.0, 468.0, 3761.0, 1013982.0, 25755.0, 4200.0, 114.0, 29.0, 41.0, 4.0, 0.0, 14.0, 17.0, 5.0, 3.0, 0.0, 11.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7550926208496094e-06, -3.6582350730895996e-06, -3.56137752532959e-06, -3.46451997756958e-06, -3.3676624298095703e-06, -3.2708048820495605e-06, -3.1739473342895508e-06, -3.077089786529541e-06, -2.9802322387695312e-06, -2.8833746910095215e-06, -2.7865171432495117e-06, -2.689659595489502e-06, -2.592802047729492e-06, -2.4959444999694824e-06, -2.3990869522094727e-06, -2.302229404449463e-06, -2.205371856689453e-06, -2.1085143089294434e-06, -2.0116567611694336e-06, -1.914799213409424e-06, -1.817941665649414e-06, -1.7210841178894043e-06, -1.6242265701293945e-06, -1.5273690223693848e-06, -1.430511474609375e-06, -1.3336539268493652e-06, -1.2367963790893555e-06, -1.1399388313293457e-06, -1.043081283569336e-06, -9.462237358093262e-07, -8.493661880493164e-07, -7.525086402893066e-07, -6.556510925292969e-07, -5.587935447692871e-07, -4.6193599700927734e-07, -3.650784492492676e-07, -2.682209014892578e-07, -1.7136335372924805e-07, -7.450580596923828e-08, 2.2351741790771484e-08, 1.1920928955078125e-07, 2.1606683731079102e-07, 3.129243850708008e-07, 4.0978193283081055e-07, 5.066394805908203e-07, 6.034970283508301e-07, 7.003545761108398e-07, 7.972121238708496e-07, 8.940696716308594e-07, 9.909272193908691e-07, 1.087784767150879e-06, 1.1846423149108887e-06, 1.2814998626708984e-06, 1.3783574104309082e-06, 1.475214958190918e-06, 1.5720725059509277e-06, 1.6689300537109375e-06, 1.7657876014709473e-06, 1.862645149230957e-06, 1.959502696990967e-06, 2.0563602447509766e-06, 2.1532177925109863e-06, 2.250075340270996e-06, 2.346932888031006e-06, 2.4437904357910156e-06]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 4.0, 8.0, 8.0, 4.0, 12.0, 9.0, 15.0, 13.0, 16.0, 19.0, 24.0, 19.0, 32.0, 30.0, 34.0, 36.0, 45.0, 38.0, 33.0, 43.0, 50.0, 41.0, 43.0, 42.0, 37.0, 36.0, 39.0, 36.0, 30.0, 36.0, 30.0, 26.0, 18.0, 21.0, 15.0, 10.0, 7.0, 10.0, 7.0, 5.0, 4.0, 5.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.51953125, -2.436309814453125, -2.35308837890625, -2.269866943359375, -2.1866455078125, -2.103424072265625, -2.02020263671875, -1.936981201171875, -1.853759765625, -1.770538330078125, -1.68731689453125, -1.604095458984375, -1.5208740234375, -1.437652587890625, -1.35443115234375, -1.271209716796875, -1.18798828125, -1.104766845703125, -1.02154541015625, -0.938323974609375, -0.8551025390625, -0.771881103515625, -0.68865966796875, -0.605438232421875, -0.522216796875, -0.438995361328125, -0.35577392578125, -0.272552490234375, -0.1893310546875, -0.106109619140625, -0.02288818359375, 0.060333251953125, 0.1435546875, 0.226776123046875, 0.30999755859375, 0.393218994140625, 0.4764404296875, 0.559661865234375, 0.64288330078125, 0.726104736328125, 0.809326171875, 0.892547607421875, 0.97576904296875, 1.058990478515625, 1.1422119140625, 1.225433349609375, 1.30865478515625, 1.391876220703125, 1.47509765625, 1.558319091796875, 1.64154052734375, 1.724761962890625, 1.8079833984375, 1.891204833984375, 1.97442626953125, 2.057647705078125, 2.140869140625, 2.224090576171875, 2.30731201171875, 2.390533447265625, 2.4737548828125, 2.556976318359375, 2.64019775390625, 2.723419189453125, 2.806640625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 7.0, 14.0, 8.0, 18.0, 28.0, 50.0, 79.0, 117.0, 214.0, 294.0, 482.0, 700.0, 1053.0, 1685.0, 2555.0, 3662.0, 5641.0, 8608.0, 13509.0, 23390.0, 45808.0, 110490.0, 331359.0, 297673.0, 99670.0, 42131.0, 21985.0, 12964.0, 8418.0, 5465.0, 3564.0, 2361.0, 1609.0, 1016.0, 647.0, 459.0, 305.0, 193.0, 119.0, 82.0, 52.0, 25.0, 21.0, 12.0, 12.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9248046875, -1.8506317138671875, -1.776458740234375, -1.7022857666015625, -1.62811279296875, -1.5539398193359375, -1.479766845703125, -1.4055938720703125, -1.3314208984375, -1.2572479248046875, -1.183074951171875, -1.1089019775390625, -1.03472900390625, -0.9605560302734375, -0.886383056640625, -0.8122100830078125, -0.738037109375, -0.6638641357421875, -0.589691162109375, -0.5155181884765625, -0.44134521484375, -0.3671722412109375, -0.292999267578125, -0.2188262939453125, -0.1446533203125, -0.0704803466796875, 0.003692626953125, 0.0778656005859375, 0.15203857421875, 0.2262115478515625, 0.300384521484375, 0.3745574951171875, 0.44873046875, 0.5229034423828125, 0.597076416015625, 0.6712493896484375, 0.74542236328125, 0.8195953369140625, 0.893768310546875, 0.9679412841796875, 1.0421142578125, 1.1162872314453125, 1.190460205078125, 1.2646331787109375, 1.33880615234375, 1.4129791259765625, 1.487152099609375, 1.5613250732421875, 1.635498046875, 1.7096710205078125, 1.783843994140625, 1.8580169677734375, 1.93218994140625, 2.0063629150390625, 2.080535888671875, 2.1547088623046875, 2.2288818359375, 2.3030548095703125, 2.377227783203125, 2.4514007568359375, 2.52557373046875, 2.5997467041015625, 2.673919677734375, 2.7480926513671875, 2.822265625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 1.0, 4.0, 1.0, 11.0, 4.0, 6.0, 7.0, 8.0, 10.0, 22.0, 22.0, 31.0, 27.0, 30.0, 34.0, 41.0, 49.0, 33.0, 74.0, 102.0, 226.0, 1545.0, 208.0, 107.0, 58.0, 67.0, 56.0, 38.0, 32.0, 43.0, 27.0, 25.0, 22.0, 13.0, 13.0, 17.0, 9.0, 8.0, 5.0, 4.0, 1.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.0234375, -9.741455078125, -9.45947265625, -9.177490234375, -8.8955078125, -8.613525390625, -8.33154296875, -8.049560546875, -7.767578125, -7.485595703125, -7.20361328125, -6.921630859375, -6.6396484375, -6.357666015625, -6.07568359375, -5.793701171875, -5.51171875, -5.229736328125, -4.94775390625, -4.665771484375, -4.3837890625, -4.101806640625, -3.81982421875, -3.537841796875, -3.255859375, -2.973876953125, -2.69189453125, -2.409912109375, -2.1279296875, -1.845947265625, -1.56396484375, -1.281982421875, -1.0, -0.718017578125, -0.43603515625, -0.154052734375, 0.1279296875, 0.409912109375, 0.69189453125, 0.973876953125, 1.255859375, 1.537841796875, 1.81982421875, 2.101806640625, 2.3837890625, 2.665771484375, 2.94775390625, 3.229736328125, 3.51171875, 3.793701171875, 4.07568359375, 4.357666015625, 4.6396484375, 4.921630859375, 5.20361328125, 5.485595703125, 5.767578125, 6.049560546875, 6.33154296875, 6.613525390625, 6.8955078125, 7.177490234375, 7.45947265625, 7.741455078125, 8.0234375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 3.0, 4.0, 7.0, 12.0, 12.0, 14.0, 25.0, 32.0, 38.0, 53.0, 62.0, 68.0, 108.0, 134.0, 174.0, 241.0, 399.0, 1074.0, 7221.0, 225166.0, 2880887.0, 25974.0, 2355.0, 489.0, 279.0, 206.0, 167.0, 98.0, 88.0, 70.0, 59.0, 42.0, 36.0, 17.0, 14.0, 20.0, 11.0, 9.0, 16.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3984375, -13.8885498046875, -13.378662109375, -12.8687744140625, -12.35888671875, -11.8489990234375, -11.339111328125, -10.8292236328125, -10.3193359375, -9.8094482421875, -9.299560546875, -8.7896728515625, -8.27978515625, -7.7698974609375, -7.260009765625, -6.7501220703125, -6.240234375, -5.7303466796875, -5.220458984375, -4.7105712890625, -4.20068359375, -3.6907958984375, -3.180908203125, -2.6710205078125, -2.1611328125, -1.6512451171875, -1.141357421875, -0.6314697265625, -0.12158203125, 0.3883056640625, 0.898193359375, 1.4080810546875, 1.91796875, 2.4278564453125, 2.937744140625, 3.4476318359375, 3.95751953125, 4.4674072265625, 4.977294921875, 5.4871826171875, 5.9970703125, 6.5069580078125, 7.016845703125, 7.5267333984375, 8.03662109375, 8.5465087890625, 9.056396484375, 9.5662841796875, 10.076171875, 10.5860595703125, 11.095947265625, 11.6058349609375, 12.11572265625, 12.6256103515625, 13.135498046875, 13.6453857421875, 14.1552734375, 14.6651611328125, 15.175048828125, 15.6849365234375, 16.19482421875, 16.7047119140625, 17.214599609375, 17.7244873046875, 18.234375]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 25.0, 122.0, 291.0, 340.0, 182.0, 48.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.730520248413086, -7.510559558868408, -6.2905988693237305, -5.0706377029418945, -3.850677013397217, -2.630716323852539, -1.4107551574707031, -0.1907949447631836, 1.0291662216186523, 2.24912691116333, 3.469087839126587, 4.689048767089844, 5.9090094566345215, 7.128970146179199, 8.348931312561035, 9.568891525268555, 10.78885269165039, 12.008813858032227, 13.228774070739746, 14.448735237121582, 15.668695449829102, 16.888656616210938, 18.108617782592773, 19.32857894897461, 20.548538208007812, 21.76849937438965, 22.988460540771484, 24.208419799804688, 25.428380966186523, 26.64834213256836, 27.868303298950195, 29.08826446533203, 30.308223724365234, 31.52818489074707, 32.748146057128906, 33.96810531616211, 35.18806838989258, 36.40802764892578, 37.62799072265625, 38.84794998168945, 40.067909240722656, 41.28786849975586, 42.50783157348633, 43.72779083251953, 44.94775390625, 46.1677131652832, 47.387672424316406, 48.607635498046875, 49.827598571777344, 51.04755783081055, 52.267520904541016, 53.48748016357422, 54.70744323730469, 55.92740249633789, 57.147361755371094, 58.36732482910156, 59.587284088134766, 60.80724334716797, 62.02720642089844, 63.24716567993164, 64.46712493896484, 65.68708801269531, 66.90705108642578, 68.12700653076172, 69.34696960449219]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 2.0, 4.0, 7.0, 9.0, 7.0, 9.0, 20.0, 14.0, 20.0, 17.0, 21.0, 24.0, 30.0, 31.0, 41.0, 41.0, 30.0, 40.0, 49.0, 37.0, 46.0, 55.0, 47.0, 51.0, 36.0, 38.0, 36.0, 40.0, 31.0, 33.0, 17.0, 18.0, 17.0, 13.0, 12.0, 13.0, 10.0, 9.0, 6.0, 3.0, 7.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.985671997070312, -23.186918258666992, -22.388166427612305, -21.589412689208984, -20.790658950805664, -19.991907119750977, -19.193153381347656, -18.39440155029297, -17.59564781188965, -16.796894073486328, -15.998141288757324, -15.19938850402832, -14.400635719299316, -13.601882934570312, -12.803129196166992, -12.004376411437988, -11.205622673034668, -10.406869888305664, -9.608116149902344, -8.80936336517334, -8.010610580444336, -7.211857318878174, -6.413104057312012, -5.614351272583008, -4.815598011016846, -4.016844749450684, -3.2180919647216797, -2.4193387031555176, -1.6205856800079346, -0.8218326568603516, -0.023079395294189453, 0.7756733894348145, 1.5744266510009766, 2.3731796741485596, 3.1719326972961426, 3.9706859588623047, 4.769438743591309, 5.568192005157471, 6.366945266723633, 7.165698051452637, 7.964451313018799, 8.763204574584961, 9.561957359313965, 10.360710144042969, 11.159463882446289, 11.958216667175293, 12.756969451904297, 13.555723190307617, 14.354475975036621, 15.153228759765625, 15.951982498168945, 16.750736236572266, 17.549488067626953, 18.348241806030273, 19.146995544433594, 19.94574737548828, 20.7445011138916, 21.543254852294922, 22.34200668334961, 23.14076042175293, 23.93951416015625, 24.738265991210938, 25.537019729614258, 26.335773468017578, 27.134525299072266]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 9.0, 9.0, 8.0, 7.0, 10.0, 12.0, 12.0, 16.0, 22.0, 21.0, 25.0, 28.0, 31.0, 30.0, 34.0, 40.0, 34.0, 44.0, 41.0, 47.0, 53.0, 29.0, 41.0, 44.0, 39.0, 35.0, 38.0, 31.0, 27.0, 30.0, 29.0, 18.0, 26.0, 12.0, 12.0, 13.0, 9.0, 6.0, 5.0, 5.0, 3.0, 3.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.6015625, -2.516021728515625, -2.43048095703125, -2.344940185546875, -2.2593994140625, -2.173858642578125, -2.08831787109375, -2.002777099609375, -1.917236328125, -1.831695556640625, -1.74615478515625, -1.660614013671875, -1.5750732421875, -1.489532470703125, -1.40399169921875, -1.318450927734375, -1.23291015625, -1.147369384765625, -1.06182861328125, -0.976287841796875, -0.8907470703125, -0.805206298828125, -0.71966552734375, -0.634124755859375, -0.548583984375, -0.463043212890625, -0.37750244140625, -0.291961669921875, -0.2064208984375, -0.120880126953125, -0.03533935546875, 0.050201416015625, 0.1357421875, 0.221282958984375, 0.30682373046875, 0.392364501953125, 0.4779052734375, 0.563446044921875, 0.64898681640625, 0.734527587890625, 0.820068359375, 0.905609130859375, 0.99114990234375, 1.076690673828125, 1.1622314453125, 1.247772216796875, 1.33331298828125, 1.418853759765625, 1.50439453125, 1.589935302734375, 1.67547607421875, 1.761016845703125, 1.8465576171875, 1.932098388671875, 2.01763916015625, 2.103179931640625, 2.188720703125, 2.274261474609375, 2.35980224609375, 2.445343017578125, 2.5308837890625, 2.616424560546875, 2.70196533203125, 2.787506103515625, 2.873046875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 8.0, 6.0, 17.0, 7.0, 9.0, 24.0, 39.0, 35.0, 68.0, 99.0, 233.0, 383.0, 828.0, 1741.0, 4370.0, 12456.0, 43219.0, 190694.0, 1057691.0, 2141286.0, 588223.0, 110633.0, 27777.0, 8451.0, 3151.0, 1368.0, 633.0, 303.0, 180.0, 100.0, 71.0, 56.0, 25.0, 19.0, 13.0, 14.0, 7.0, 6.0, 3.0, 3.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.3125, -5.1373291015625, -4.962158203125, -4.7869873046875, -4.61181640625, -4.4366455078125, -4.261474609375, -4.0863037109375, -3.9111328125, -3.7359619140625, -3.560791015625, -3.3856201171875, -3.21044921875, -3.0352783203125, -2.860107421875, -2.6849365234375, -2.509765625, -2.3345947265625, -2.159423828125, -1.9842529296875, -1.80908203125, -1.6339111328125, -1.458740234375, -1.2835693359375, -1.1083984375, -0.9332275390625, -0.758056640625, -0.5828857421875, -0.40771484375, -0.2325439453125, -0.057373046875, 0.1177978515625, 0.29296875, 0.4681396484375, 0.643310546875, 0.8184814453125, 0.99365234375, 1.1688232421875, 1.343994140625, 1.5191650390625, 1.6943359375, 1.8695068359375, 2.044677734375, 2.2198486328125, 2.39501953125, 2.5701904296875, 2.745361328125, 2.9205322265625, 3.095703125, 3.2708740234375, 3.446044921875, 3.6212158203125, 3.79638671875, 3.9715576171875, 4.146728515625, 4.3218994140625, 4.4970703125, 4.6722412109375, 4.847412109375, 5.0225830078125, 5.19775390625, 5.3729248046875, 5.548095703125, 5.7232666015625, 5.8984375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 7.0, 3.0, 11.0, 5.0, 13.0, 22.0, 27.0, 51.0, 56.0, 73.0, 83.0, 133.0, 206.0, 253.0, 310.0, 380.0, 442.0, 448.0, 380.0, 325.0, 247.0, 167.0, 123.0, 84.0, 73.0, 44.0, 34.0, 18.0, 16.0, 10.0, 13.0, 9.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3125, -5.13507080078125, -4.9576416015625, -4.78021240234375, -4.602783203125, -4.42535400390625, -4.2479248046875, -4.07049560546875, -3.89306640625, -3.71563720703125, -3.5382080078125, -3.36077880859375, -3.183349609375, -3.00592041015625, -2.8284912109375, -2.65106201171875, -2.4736328125, -2.29620361328125, -2.1187744140625, -1.94134521484375, -1.763916015625, -1.58648681640625, -1.4090576171875, -1.23162841796875, -1.05419921875, -0.87677001953125, -0.6993408203125, -0.52191162109375, -0.344482421875, -0.16705322265625, 0.0103759765625, 0.18780517578125, 0.365234375, 0.54266357421875, 0.7200927734375, 0.89752197265625, 1.074951171875, 1.25238037109375, 1.4298095703125, 1.60723876953125, 1.78466796875, 1.96209716796875, 2.1395263671875, 2.31695556640625, 2.494384765625, 2.67181396484375, 2.8492431640625, 3.02667236328125, 3.2041015625, 3.38153076171875, 3.5589599609375, 3.73638916015625, 3.913818359375, 4.09124755859375, 4.2686767578125, 4.44610595703125, 4.62353515625, 4.80096435546875, 4.9783935546875, 5.15582275390625, 5.333251953125, 5.51068115234375, 5.6881103515625, 5.86553955078125, 6.04296875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 8.0, 10.0, 3.0, 14.0, 30.0, 36.0, 56.0, 71.0, 98.0, 154.0, 199.0, 345.0, 671.0, 3431.0, 74683.0, 3127225.0, 963465.0, 20616.0, 1644.0, 513.0, 314.0, 201.0, 134.0, 83.0, 80.0, 57.0, 50.0, 33.0, 15.0, 8.0, 9.0, 8.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.046875, -19.4541015625, -18.861328125, -18.2685546875, -17.67578125, -17.0830078125, -16.490234375, -15.8974609375, -15.3046875, -14.7119140625, -14.119140625, -13.5263671875, -12.93359375, -12.3408203125, -11.748046875, -11.1552734375, -10.5625, -9.9697265625, -9.376953125, -8.7841796875, -8.19140625, -7.5986328125, -7.005859375, -6.4130859375, -5.8203125, -5.2275390625, -4.634765625, -4.0419921875, -3.44921875, -2.8564453125, -2.263671875, -1.6708984375, -1.078125, -0.4853515625, 0.107421875, 0.7001953125, 1.29296875, 1.8857421875, 2.478515625, 3.0712890625, 3.6640625, 4.2568359375, 4.849609375, 5.4423828125, 6.03515625, 6.6279296875, 7.220703125, 7.8134765625, 8.40625, 8.9990234375, 9.591796875, 10.1845703125, 10.77734375, 11.3701171875, 11.962890625, 12.5556640625, 13.1484375, 13.7412109375, 14.333984375, 14.9267578125, 15.51953125, 16.1123046875, 16.705078125, 17.2978515625, 17.890625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 14.0, 26.0, 37.0, 71.0, 99.0, 114.0, 132.0, 155.0, 136.0, 85.0, 54.0, 39.0, 24.0, 14.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.38740158081055, -34.17501449584961, -32.962623596191406, -31.75023651123047, -30.5378475189209, -29.325458526611328, -28.11307144165039, -26.90068244934082, -25.68829345703125, -24.47590446472168, -23.26351547241211, -22.051128387451172, -20.8387393951416, -19.62635040283203, -18.413963317871094, -17.201574325561523, -15.989185333251953, -14.776796340942383, -13.564408302307129, -12.352020263671875, -11.139631271362305, -9.927242279052734, -8.71485424041748, -7.502466201782227, -6.290077209472656, -5.077688694000244, -3.865300178527832, -2.65291166305542, -1.4405231475830078, -0.2281346321105957, 0.9842538833618164, 2.1966419219970703, 3.409027099609375, 4.621415615081787, 5.833804130554199, 7.046192646026611, 8.258581161499023, 9.470970153808594, 10.683358192443848, 11.895746231079102, 13.108135223388672, 14.320524215698242, 15.532912254333496, 16.74530029296875, 17.95768928527832, 19.17007827758789, 20.382465362548828, 21.5948543548584, 22.80724334716797, 24.01963233947754, 25.23202133178711, 26.444408416748047, 27.656797409057617, 28.869186401367188, 30.081573486328125, 31.293962478637695, 32.506351470947266, 33.7187385559082, 34.931129455566406, 36.143516540527344, 37.35590362548828, 38.568294525146484, 39.78068161010742, 40.993072509765625, 42.20545959472656]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 4.0, 9.0, 11.0, 9.0, 19.0, 16.0, 17.0, 22.0, 27.0, 33.0, 23.0, 21.0, 28.0, 34.0, 30.0, 47.0, 31.0, 34.0, 45.0, 44.0, 35.0, 50.0, 39.0, 39.0, 32.0, 42.0, 32.0, 24.0, 24.0, 37.0, 25.0, 12.0, 17.0, 16.0, 14.0, 14.0, 3.0, 6.0, 4.0, 5.0, 6.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.936317443847656, -17.336288452148438, -16.73625946044922, -16.13623046875, -15.536201477050781, -14.936172485351562, -14.336143493652344, -13.736114501953125, -13.136085510253906, -12.536056518554688, -11.936027526855469, -11.33599853515625, -10.735969543457031, -10.135940551757812, -9.535911560058594, -8.935882568359375, -8.335853576660156, -7.7358245849609375, -7.135795593261719, -6.5357666015625, -5.935737609863281, -5.3357086181640625, -4.735679626464844, -4.135650634765625, -3.5356216430664062, -2.9355926513671875, -2.3355636596679688, -1.73553466796875, -1.1355056762695312, -0.5354766845703125, 0.06455230712890625, 0.664581298828125, 1.2646102905273438, 1.8646392822265625, 2.4646682739257812, 3.064697265625, 3.6647262573242188, 4.2647552490234375, 4.864784240722656, 5.464813232421875, 6.064842224121094, 6.6648712158203125, 7.264900207519531, 7.86492919921875, 8.464958190917969, 9.064987182617188, 9.665016174316406, 10.265045166015625, 10.865074157714844, 11.465103149414062, 12.065132141113281, 12.6651611328125, 13.265190124511719, 13.865219116210938, 14.465248107910156, 15.065277099609375, 15.665306091308594, 16.265335083007812, 16.86536407470703, 17.46539306640625, 18.06542205810547, 18.665451049804688, 19.265480041503906, 19.865509033203125, 20.465538024902344]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 7.0, 6.0, 14.0, 18.0, 20.0, 19.0, 12.0, 21.0, 25.0, 30.0, 24.0, 27.0, 25.0, 40.0, 43.0, 38.0, 54.0, 34.0, 55.0, 38.0, 43.0, 42.0, 46.0, 32.0, 34.0, 36.0, 31.0, 27.0, 15.0, 26.0, 18.0, 15.0, 15.0, 9.0, 14.0, 6.0, 11.0, 9.0, 5.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.568359375, -2.481689453125, -2.39501953125, -2.308349609375, -2.2216796875, -2.135009765625, -2.04833984375, -1.961669921875, -1.875, -1.788330078125, -1.70166015625, -1.614990234375, -1.5283203125, -1.441650390625, -1.35498046875, -1.268310546875, -1.181640625, -1.094970703125, -1.00830078125, -0.921630859375, -0.8349609375, -0.748291015625, -0.66162109375, -0.574951171875, -0.48828125, -0.401611328125, -0.31494140625, -0.228271484375, -0.1416015625, -0.054931640625, 0.03173828125, 0.118408203125, 0.205078125, 0.291748046875, 0.37841796875, 0.465087890625, 0.5517578125, 0.638427734375, 0.72509765625, 0.811767578125, 0.8984375, 0.985107421875, 1.07177734375, 1.158447265625, 1.2451171875, 1.331787109375, 1.41845703125, 1.505126953125, 1.591796875, 1.678466796875, 1.76513671875, 1.851806640625, 1.9384765625, 2.025146484375, 2.11181640625, 2.198486328125, 2.28515625, 2.371826171875, 2.45849609375, 2.545166015625, 2.6318359375, 2.718505859375, 2.80517578125, 2.891845703125, 2.978515625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 14.0, 9.0, 18.0, 22.0, 44.0, 55.0, 88.0, 127.0, 171.0, 271.0, 344.0, 555.0, 821.0, 1236.0, 1791.0, 2620.0, 3814.0, 5661.0, 8678.0, 12995.0, 19501.0, 30771.0, 49934.0, 87234.0, 189151.0, 312299.0, 134232.0, 68983.0, 40954.0, 25738.0, 16615.0, 11204.0, 7446.0, 4840.0, 3219.0, 2326.0, 1543.0, 1045.0, 708.0, 451.0, 321.0, 239.0, 130.0, 112.0, 80.0, 47.0, 39.0, 21.0, 17.0, 12.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0141143798828125, -0.013663530349731445, -0.01321268081665039, -0.012761831283569336, -0.012310981750488281, -0.011860132217407227, -0.011409282684326172, -0.010958433151245117, -0.010507583618164062, -0.010056734085083008, -0.009605884552001953, -0.009155035018920898, -0.008704185485839844, -0.008253335952758789, -0.007802486419677734, -0.00735163688659668, -0.006900787353515625, -0.00644993782043457, -0.005999088287353516, -0.005548238754272461, -0.005097389221191406, -0.0046465396881103516, -0.004195690155029297, -0.003744840621948242, -0.0032939910888671875, -0.002843141555786133, -0.002392292022705078, -0.0019414424896240234, -0.0014905929565429688, -0.001039743423461914, -0.0005888938903808594, -0.0001380443572998047, 0.00031280517578125, 0.0007636547088623047, 0.0012145042419433594, 0.001665353775024414, 0.0021162033081054688, 0.0025670528411865234, 0.003017902374267578, 0.003468751907348633, 0.0039196014404296875, 0.004370450973510742, 0.004821300506591797, 0.0052721500396728516, 0.005722999572753906, 0.006173849105834961, 0.006624698638916016, 0.00707554817199707, 0.007526397705078125, 0.00797724723815918, 0.008428096771240234, 0.008878946304321289, 0.009329795837402344, 0.009780645370483398, 0.010231494903564453, 0.010682344436645508, 0.011133193969726562, 0.011584043502807617, 0.012034893035888672, 0.012485742568969727, 0.012936592102050781, 0.013387441635131836, 0.01383829116821289, 0.014289140701293945, 0.014739990234375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 12.0, 4.0, 3.0, 11.0, 17.0, 11.0, 17.0, 13.0, 12.0, 27.0, 29.0, 33.0, 31.0, 26.0, 24.0, 29.0, 36.0, 42.0, 35.0, 34.0, 47.0, 1071.0, 36.0, 37.0, 41.0, 37.0, 23.0, 30.0, 31.0, 33.0, 21.0, 28.0, 15.0, 19.0, 16.0, 11.0, 17.0, 10.0, 11.0, 11.0, 10.0, 5.0, 7.0, 1.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-1.7587890625, -1.7071685791015625, -1.655548095703125, -1.6039276123046875, -1.55230712890625, -1.5006866455078125, -1.449066162109375, -1.3974456787109375, -1.3458251953125, -1.2942047119140625, -1.242584228515625, -1.1909637451171875, -1.13934326171875, -1.0877227783203125, -1.036102294921875, -0.9844818115234375, -0.932861328125, -0.8812408447265625, -0.829620361328125, -0.7779998779296875, -0.72637939453125, -0.6747589111328125, -0.623138427734375, -0.5715179443359375, -0.5198974609375, -0.4682769775390625, -0.416656494140625, -0.3650360107421875, -0.31341552734375, -0.2617950439453125, -0.210174560546875, -0.1585540771484375, -0.10693359375, -0.0553131103515625, -0.003692626953125, 0.0479278564453125, 0.09954833984375, 0.1511688232421875, 0.202789306640625, 0.2544097900390625, 0.3060302734375, 0.3576507568359375, 0.409271240234375, 0.4608917236328125, 0.51251220703125, 0.5641326904296875, 0.615753173828125, 0.6673736572265625, 0.718994140625, 0.7706146240234375, 0.822235107421875, 0.8738555908203125, 0.92547607421875, 0.9770965576171875, 1.028717041015625, 1.0803375244140625, 1.1319580078125, 1.1835784912109375, 1.235198974609375, 1.2868194580078125, 1.33843994140625, 1.3900604248046875, 1.441680908203125, 1.4933013916015625, 1.544921875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 5.0, 8.0, 11.0, 9.0, 16.0, 31.0, 47.0, 62.0, 100.0, 137.0, 219.0, 298.0, 537.0, 724.0, 1084.0, 1675.0, 2488.0, 3649.0, 5660.0, 8604.0, 13041.0, 20521.0, 31927.0, 51204.0, 86162.0, 179175.0, 1342780.0, 145159.0, 75069.0, 45057.0, 28705.0, 18420.0, 11851.0, 7598.0, 4977.0, 3347.0, 2238.0, 1476.0, 1027.0, 647.0, 426.0, 325.0, 227.0, 131.0, 95.0, 62.0, 46.0, 32.0, 22.0, 7.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.009490966796875, -0.009178519248962402, -0.008866071701049805, -0.008553624153137207, -0.00824117660522461, -0.007928729057312012, -0.007616281509399414, -0.007303833961486816, -0.006991386413574219, -0.006678938865661621, -0.0063664913177490234, -0.006054043769836426, -0.005741596221923828, -0.0054291486740112305, -0.005116701126098633, -0.004804253578186035, -0.0044918060302734375, -0.00417935848236084, -0.003866910934448242, -0.0035544633865356445, -0.003242015838623047, -0.0029295682907104492, -0.0026171207427978516, -0.002304673194885254, -0.0019922256469726562, -0.0016797780990600586, -0.001367330551147461, -0.0010548830032348633, -0.0007424354553222656, -0.00042998790740966797, -0.00011754035949707031, 0.00019490718841552734, 0.000507354736328125, 0.0008198022842407227, 0.0011322498321533203, 0.001444697380065918, 0.0017571449279785156, 0.0020695924758911133, 0.002382040023803711, 0.0026944875717163086, 0.0030069351196289062, 0.003319382667541504, 0.0036318302154541016, 0.003944277763366699, 0.004256725311279297, 0.0045691728591918945, 0.004881620407104492, 0.00519406795501709, 0.0055065155029296875, 0.005818963050842285, 0.006131410598754883, 0.0064438581466674805, 0.006756305694580078, 0.007068753242492676, 0.0073812007904052734, 0.007693648338317871, 0.008006095886230469, 0.008318543434143066, 0.008630990982055664, 0.008943438529968262, 0.00925588607788086, 0.009568333625793457, 0.009880781173706055, 0.010193228721618652, 0.01050567626953125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 931.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 11.0, 4.0, 0.0, 1.0, 20.0, 4.0, 0.0, 1.0, 1.0, 0.0, 47.0, 19.0, 21.0, 304.0, 2163.0, 20974.0, 1001317.0, 23287.0, 151.0, 98.0, 58.0, 26.0, 10.0, 1.0, 1.0, 1.0, 0.0, 11.0, 0.0, 0.0, 5.0, 0.0, 16.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2649765014648438e-06, -2.187676727771759e-06, -2.1103769540786743e-06, -2.0330771803855896e-06, -1.955777406692505e-06, -1.8784776329994202e-06, -1.8011778593063354e-06, -1.7238780856132507e-06, -1.646578311920166e-06, -1.5692785382270813e-06, -1.4919787645339966e-06, -1.4146789908409119e-06, -1.3373792171478271e-06, -1.2600794434547424e-06, -1.1827796697616577e-06, -1.105479896068573e-06, -1.0281801223754883e-06, -9.508803486824036e-07, -8.735805749893188e-07, -7.962808012962341e-07, -7.189810276031494e-07, -6.416812539100647e-07, -5.6438148021698e-07, -4.870817065238953e-07, -4.0978193283081055e-07, -3.3248215913772583e-07, -2.551823854446411e-07, -1.778826117515564e-07, -1.0058283805847168e-07, -2.3283064365386963e-08, 5.4016709327697754e-08, 1.3131648302078247e-07, 2.086162567138672e-07, 2.859160304069519e-07, 3.632158041000366e-07, 4.4051557779312134e-07, 5.178153514862061e-07, 5.951151251792908e-07, 6.724148988723755e-07, 7.497146725654602e-07, 8.270144462585449e-07, 9.043142199516296e-07, 9.816139936447144e-07, 1.058913767337799e-06, 1.1362135410308838e-06, 1.2135133147239685e-06, 1.2908130884170532e-06, 1.368112862110138e-06, 1.4454126358032227e-06, 1.5227124094963074e-06, 1.600012183189392e-06, 1.6773119568824768e-06, 1.7546117305755615e-06, 1.8319115042686462e-06, 1.909211277961731e-06, 1.9865110516548157e-06, 2.0638108253479004e-06, 2.141110599040985e-06, 2.21841037273407e-06, 2.2957101464271545e-06, 2.3730099201202393e-06, 2.450309693813324e-06, 2.5276094675064087e-06, 2.6049092411994934e-06, 2.682209014892578e-06]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 7.0, 6.0, 14.0, 18.0, 20.0, 19.0, 12.0, 21.0, 25.0, 30.0, 24.0, 27.0, 25.0, 40.0, 43.0, 38.0, 54.0, 34.0, 55.0, 38.0, 43.0, 42.0, 46.0, 32.0, 34.0, 36.0, 31.0, 27.0, 15.0, 26.0, 18.0, 15.0, 15.0, 9.0, 14.0, 6.0, 11.0, 9.0, 5.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.568359375, -2.481689453125, -2.39501953125, -2.308349609375, -2.2216796875, -2.135009765625, -2.04833984375, -1.961669921875, -1.875, -1.788330078125, -1.70166015625, -1.614990234375, -1.5283203125, -1.441650390625, -1.35498046875, -1.268310546875, -1.181640625, -1.094970703125, -1.00830078125, -0.921630859375, -0.8349609375, -0.748291015625, -0.66162109375, -0.574951171875, -0.48828125, -0.401611328125, -0.31494140625, -0.228271484375, -0.1416015625, -0.054931640625, 0.03173828125, 0.118408203125, 0.205078125, 0.291748046875, 0.37841796875, 0.465087890625, 0.5517578125, 0.638427734375, 0.72509765625, 0.811767578125, 0.8984375, 0.985107421875, 1.07177734375, 1.158447265625, 1.2451171875, 1.331787109375, 1.41845703125, 1.505126953125, 1.591796875, 1.678466796875, 1.76513671875, 1.851806640625, 1.9384765625, 2.025146484375, 2.11181640625, 2.198486328125, 2.28515625, 2.371826171875, 2.45849609375, 2.545166015625, 2.6318359375, 2.718505859375, 2.80517578125, 2.891845703125, 2.978515625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 8.0, 4.0, 19.0, 21.0, 28.0, 43.0, 67.0, 100.0, 142.0, 179.0, 271.0, 442.0, 661.0, 1022.0, 1445.0, 2268.0, 3553.0, 6085.0, 11404.0, 24282.0, 59980.0, 168454.0, 403906.0, 221807.0, 79166.0, 30564.0, 13773.0, 7207.0, 4191.0, 2528.0, 1666.0, 1050.0, 719.0, 493.0, 332.0, 209.0, 152.0, 93.0, 65.0, 45.0, 32.0, 28.0, 23.0, 8.0, 7.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.154296875, -2.08160400390625, -2.0089111328125, -1.93621826171875, -1.863525390625, -1.79083251953125, -1.7181396484375, -1.64544677734375, -1.57275390625, -1.50006103515625, -1.4273681640625, -1.35467529296875, -1.281982421875, -1.20928955078125, -1.1365966796875, -1.06390380859375, -0.9912109375, -0.91851806640625, -0.8458251953125, -0.77313232421875, -0.700439453125, -0.62774658203125, -0.5550537109375, -0.48236083984375, -0.40966796875, -0.33697509765625, -0.2642822265625, -0.19158935546875, -0.118896484375, -0.04620361328125, 0.0264892578125, 0.09918212890625, 0.171875, 0.24456787109375, 0.3172607421875, 0.38995361328125, 0.462646484375, 0.53533935546875, 0.6080322265625, 0.68072509765625, 0.75341796875, 0.82611083984375, 0.8988037109375, 0.97149658203125, 1.044189453125, 1.11688232421875, 1.1895751953125, 1.26226806640625, 1.3349609375, 1.40765380859375, 1.4803466796875, 1.55303955078125, 1.625732421875, 1.69842529296875, 1.7711181640625, 1.84381103515625, 1.91650390625, 1.98919677734375, 2.0618896484375, 2.13458251953125, 2.207275390625, 2.27996826171875, 2.3526611328125, 2.42535400390625, 2.498046875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 10.0, 11.0, 9.0, 13.0, 21.0, 12.0, 17.0, 29.0, 23.0, 42.0, 32.0, 41.0, 37.0, 42.0, 70.0, 129.0, 352.0, 1559.0, 173.0, 63.0, 62.0, 48.0, 38.0, 39.0, 26.0, 28.0, 20.0, 23.0, 12.0, 10.0, 9.0, 11.0, 10.0, 4.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.921875, -9.593017578125, -9.26416015625, -8.935302734375, -8.6064453125, -8.277587890625, -7.94873046875, -7.619873046875, -7.291015625, -6.962158203125, -6.63330078125, -6.304443359375, -5.9755859375, -5.646728515625, -5.31787109375, -4.989013671875, -4.66015625, -4.331298828125, -4.00244140625, -3.673583984375, -3.3447265625, -3.015869140625, -2.68701171875, -2.358154296875, -2.029296875, -1.700439453125, -1.37158203125, -1.042724609375, -0.7138671875, -0.385009765625, -0.05615234375, 0.272705078125, 0.6015625, 0.930419921875, 1.25927734375, 1.588134765625, 1.9169921875, 2.245849609375, 2.57470703125, 2.903564453125, 3.232421875, 3.561279296875, 3.89013671875, 4.218994140625, 4.5478515625, 4.876708984375, 5.20556640625, 5.534423828125, 5.86328125, 6.192138671875, 6.52099609375, 6.849853515625, 7.1787109375, 7.507568359375, 7.83642578125, 8.165283203125, 8.494140625, 8.822998046875, 9.15185546875, 9.480712890625, 9.8095703125, 10.138427734375, 10.46728515625, 10.796142578125, 11.125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 7.0, 5.0, 7.0, 7.0, 16.0, 12.0, 15.0, 16.0, 20.0, 38.0, 45.0, 64.0, 77.0, 108.0, 183.0, 262.0, 487.0, 1729.0, 25190.0, 3073128.0, 40612.0, 2150.0, 548.0, 279.0, 177.0, 140.0, 112.0, 69.0, 52.0, 23.0, 25.0, 17.0, 27.0, 10.0, 13.0, 13.0, 10.0, 2.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.90625, -20.283203125, -19.66015625, -19.037109375, -18.4140625, -17.791015625, -17.16796875, -16.544921875, -15.921875, -15.298828125, -14.67578125, -14.052734375, -13.4296875, -12.806640625, -12.18359375, -11.560546875, -10.9375, -10.314453125, -9.69140625, -9.068359375, -8.4453125, -7.822265625, -7.19921875, -6.576171875, -5.953125, -5.330078125, -4.70703125, -4.083984375, -3.4609375, -2.837890625, -2.21484375, -1.591796875, -0.96875, -0.345703125, 0.27734375, 0.900390625, 1.5234375, 2.146484375, 2.76953125, 3.392578125, 4.015625, 4.638671875, 5.26171875, 5.884765625, 6.5078125, 7.130859375, 7.75390625, 8.376953125, 9.0, 9.623046875, 10.24609375, 10.869140625, 11.4921875, 12.115234375, 12.73828125, 13.361328125, 13.984375, 14.607421875, 15.23046875, 15.853515625, 16.4765625, 17.099609375, 17.72265625, 18.345703125, 18.96875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 15.0, 53.0, 163.0, 300.0, 271.0, 146.0, 54.0, 12.0, 3.0], "bins": [-49.93052673339844, -49.08224105834961, -48.23395919799805, -47.38567352294922, -46.537391662597656, -45.68910598754883, -44.840824127197266, -43.99253845214844, -43.144256591796875, -42.29597091674805, -41.447689056396484, -40.599403381347656, -39.751121520996094, -38.902835845947266, -38.0545539855957, -37.206268310546875, -36.35798645019531, -35.509700775146484, -34.66141891479492, -33.813133239746094, -32.96485137939453, -32.1165657043457, -31.26828384399414, -30.420000076293945, -29.571714401245117, -28.723430633544922, -27.875146865844727, -27.02686309814453, -26.178579330444336, -25.33029556274414, -24.482011795043945, -23.63372802734375, -22.785446166992188, -21.937162399291992, -21.088878631591797, -20.2405948638916, -19.392311096191406, -18.54402732849121, -17.695743560791016, -16.84745979309082, -15.999174118041992, -15.150890350341797, -14.302606582641602, -13.454322814941406, -12.606039047241211, -11.757755279541016, -10.90947151184082, -10.061187744140625, -9.21290397644043, -8.364620208740234, -7.516336441040039, -6.668052673339844, -5.819768905639648, -4.971484661102295, -4.1232008934021, -3.2749171257019043, -2.426633358001709, -1.5783495903015137, -0.7300657033920288, 0.11821818351745605, 0.9665019512176514, 1.8147859573364258, 2.663069725036621, 3.5113534927368164, 4.359637260437012]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 8.0, 7.0, 6.0, 9.0, 11.0, 6.0, 12.0, 14.0, 15.0, 22.0, 22.0, 24.0, 30.0, 30.0, 18.0, 31.0, 21.0, 35.0, 41.0, 50.0, 39.0, 47.0, 43.0, 34.0, 40.0, 38.0, 41.0, 51.0, 50.0, 27.0, 32.0, 21.0, 17.0, 24.0, 12.0, 16.0, 10.0, 9.0, 8.0, 8.0, 6.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.588218688964844, -21.821998596191406, -21.05577850341797, -20.2895565032959, -19.52333641052246, -18.757116317749023, -17.990896224975586, -17.224674224853516, -16.458454132080078, -15.69223403930664, -14.926012992858887, -14.15979290008545, -13.393571853637695, -12.627351760864258, -11.86113166809082, -11.094910621643066, -10.328690528869629, -9.562470436096191, -8.796249389648438, -8.030029296875, -7.263808250427246, -6.497588157653809, -5.731367588043213, -4.965147018432617, -4.1989264488220215, -3.432705879211426, -2.66648530960083, -1.9002649784088135, -1.1340444087982178, -0.36782383918762207, 0.39839649200439453, 1.1646170616149902, 1.930837631225586, 2.6970582008361816, 3.4632787704467773, 4.229498863220215, 4.995719909667969, 5.761940002441406, 6.528160572052002, 7.294381141662598, 8.060602188110352, 8.826822280883789, 9.593043327331543, 10.35926342010498, 11.125484466552734, 11.891704559326172, 12.65792465209961, 13.424145698547363, 14.1903657913208, 14.956585884094238, 15.722806930541992, 16.48902702331543, 17.255247116088867, 18.021469116210938, 18.787689208984375, 19.553909301757812, 20.32012939453125, 21.086349487304688, 21.852569580078125, 22.618791580200195, 23.385011672973633, 24.15123176574707, 24.917451858520508, 25.683673858642578, 26.449893951416016]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 8.0, 3.0, 4.0, 21.0, 16.0, 12.0, 17.0, 26.0, 17.0, 19.0, 31.0, 25.0, 29.0, 40.0, 34.0, 41.0, 41.0, 51.0, 55.0, 26.0, 53.0, 53.0, 33.0, 41.0, 41.0, 32.0, 27.0, 29.0, 31.0, 17.0, 20.0, 19.0, 19.0, 7.0, 15.0, 11.0, 10.0, 9.0, 7.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.58203125, -2.4912109375, -2.400390625, -2.3095703125, -2.21875, -2.1279296875, -2.037109375, -1.9462890625, -1.85546875, -1.7646484375, -1.673828125, -1.5830078125, -1.4921875, -1.4013671875, -1.310546875, -1.2197265625, -1.12890625, -1.0380859375, -0.947265625, -0.8564453125, -0.765625, -0.6748046875, -0.583984375, -0.4931640625, -0.40234375, -0.3115234375, -0.220703125, -0.1298828125, -0.0390625, 0.0517578125, 0.142578125, 0.2333984375, 0.32421875, 0.4150390625, 0.505859375, 0.5966796875, 0.6875, 0.7783203125, 0.869140625, 0.9599609375, 1.05078125, 1.1416015625, 1.232421875, 1.3232421875, 1.4140625, 1.5048828125, 1.595703125, 1.6865234375, 1.77734375, 1.8681640625, 1.958984375, 2.0498046875, 2.140625, 2.2314453125, 2.322265625, 2.4130859375, 2.50390625, 2.5947265625, 2.685546875, 2.7763671875, 2.8671875, 2.9580078125, 3.048828125, 3.1396484375, 3.23046875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 3.0, 3.0, 10.0, 9.0, 17.0, 26.0, 23.0, 39.0, 45.0, 79.0, 93.0, 128.0, 225.0, 365.0, 749.0, 1821.0, 4851.0, 15661.0, 60400.0, 315908.0, 1685059.0, 1706224.0, 317064.0, 60947.0, 15781.0, 5065.0, 1802.0, 808.0, 361.0, 221.0, 121.0, 92.0, 70.0, 48.0, 45.0, 30.0, 21.0, 20.0, 11.0, 8.0, 8.0, 4.0, 9.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.45703125, -5.275146484375, -5.09326171875, -4.911376953125, -4.7294921875, -4.547607421875, -4.36572265625, -4.183837890625, -4.001953125, -3.820068359375, -3.63818359375, -3.456298828125, -3.2744140625, -3.092529296875, -2.91064453125, -2.728759765625, -2.546875, -2.364990234375, -2.18310546875, -2.001220703125, -1.8193359375, -1.637451171875, -1.45556640625, -1.273681640625, -1.091796875, -0.909912109375, -0.72802734375, -0.546142578125, -0.3642578125, -0.182373046875, -0.00048828125, 0.181396484375, 0.36328125, 0.545166015625, 0.72705078125, 0.908935546875, 1.0908203125, 1.272705078125, 1.45458984375, 1.636474609375, 1.818359375, 2.000244140625, 2.18212890625, 2.364013671875, 2.5458984375, 2.727783203125, 2.90966796875, 3.091552734375, 3.2734375, 3.455322265625, 3.63720703125, 3.819091796875, 4.0009765625, 4.182861328125, 4.36474609375, 4.546630859375, 4.728515625, 4.910400390625, 5.09228515625, 5.274169921875, 5.4560546875, 5.637939453125, 5.81982421875, 6.001708984375, 6.18359375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 7.0, 6.0, 10.0, 11.0, 19.0, 19.0, 25.0, 32.0, 45.0, 56.0, 80.0, 89.0, 92.0, 138.0, 151.0, 158.0, 220.0, 301.0, 311.0, 322.0, 344.0, 312.0, 209.0, 218.0, 168.0, 133.0, 122.0, 88.0, 66.0, 61.0, 45.0, 43.0, 25.0, 28.0, 20.0, 22.0, 17.0, 8.0, 11.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.94921875, -3.820556640625, -3.69189453125, -3.563232421875, -3.4345703125, -3.305908203125, -3.17724609375, -3.048583984375, -2.919921875, -2.791259765625, -2.66259765625, -2.533935546875, -2.4052734375, -2.276611328125, -2.14794921875, -2.019287109375, -1.890625, -1.761962890625, -1.63330078125, -1.504638671875, -1.3759765625, -1.247314453125, -1.11865234375, -0.989990234375, -0.861328125, -0.732666015625, -0.60400390625, -0.475341796875, -0.3466796875, -0.218017578125, -0.08935546875, 0.039306640625, 0.16796875, 0.296630859375, 0.42529296875, 0.553955078125, 0.6826171875, 0.811279296875, 0.93994140625, 1.068603515625, 1.197265625, 1.325927734375, 1.45458984375, 1.583251953125, 1.7119140625, 1.840576171875, 1.96923828125, 2.097900390625, 2.2265625, 2.355224609375, 2.48388671875, 2.612548828125, 2.7412109375, 2.869873046875, 2.99853515625, 3.127197265625, 3.255859375, 3.384521484375, 3.51318359375, 3.641845703125, 3.7705078125, 3.899169921875, 4.02783203125, 4.156494140625, 4.28515625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 2.0, 5.0, 8.0, 13.0, 12.0, 18.0, 15.0, 22.0, 32.0, 29.0, 57.0, 61.0, 81.0, 85.0, 137.0, 162.0, 221.0, 261.0, 459.0, 1990.0, 45640.0, 2631462.0, 1484296.0, 26174.0, 1508.0, 371.0, 245.0, 183.0, 160.0, 122.0, 112.0, 101.0, 47.0, 39.0, 34.0, 23.0, 26.0, 10.0, 12.0, 6.0, 11.0, 10.0, 3.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-20.671875, -20.0625, -19.453125, -18.84375, -18.234375, -17.625, -17.015625, -16.40625, -15.796875, -15.1875, -14.578125, -13.96875, -13.359375, -12.75, -12.140625, -11.53125, -10.921875, -10.3125, -9.703125, -9.09375, -8.484375, -7.875, -7.265625, -6.65625, -6.046875, -5.4375, -4.828125, -4.21875, -3.609375, -3.0, -2.390625, -1.78125, -1.171875, -0.5625, 0.046875, 0.65625, 1.265625, 1.875, 2.484375, 3.09375, 3.703125, 4.3125, 4.921875, 5.53125, 6.140625, 6.75, 7.359375, 7.96875, 8.578125, 9.1875, 9.796875, 10.40625, 11.015625, 11.625, 12.234375, 12.84375, 13.453125, 14.0625, 14.671875, 15.28125, 15.890625, 16.5, 17.109375, 17.71875, 18.328125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 11.0, 22.0, 56.0, 118.0, 188.0, 249.0, 182.0, 105.0, 55.0, 21.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.02879333496094, -81.19861602783203, -79.36843872070312, -77.53826141357422, -75.70808410644531, -73.8779067993164, -72.0477294921875, -70.21754455566406, -68.38737487792969, -66.55719757080078, -64.72702026367188, -62.89684295654297, -61.06666564941406, -59.236488342285156, -57.406307220458984, -55.57612991333008, -53.745948791503906, -51.915771484375, -50.085594177246094, -48.25541687011719, -46.42523956298828, -44.595062255859375, -42.7648811340332, -40.9347038269043, -39.10452651977539, -37.274349212646484, -35.44417190551758, -33.61399459838867, -31.783815383911133, -29.953638076782227, -28.123458862304688, -26.29328155517578, -24.46310043334961, -22.632923126220703, -20.802745819091797, -18.972566604614258, -17.14238929748535, -15.312211990356445, -13.482033729553223, -11.65185546875, -9.821678161621094, -7.991500377655029, -6.161322593688965, -4.3311448097229, -2.500967025756836, -0.6707897186279297, 1.159388542175293, 2.9895668029785156, 4.819744110107422, 6.649921894073486, 8.48009967803955, 10.310277938842773, 12.14045524597168, 13.970632553100586, 15.800810813903809, 17.63098907470703, 19.461166381835938, 21.291343688964844, 23.12152099609375, 24.95170021057129, 26.781877517700195, 28.6120548248291, 30.44223403930664, 32.27241134643555, 34.10258865356445]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 9.0, 7.0, 8.0, 7.0, 10.0, 10.0, 10.0, 11.0, 22.0, 33.0, 27.0, 26.0, 27.0, 22.0, 26.0, 33.0, 48.0, 40.0, 34.0, 42.0, 34.0, 39.0, 34.0, 43.0, 37.0, 29.0, 42.0, 34.0, 22.0, 32.0, 27.0, 23.0, 28.0, 13.0, 17.0, 15.0, 10.0, 13.0, 7.0, 8.0, 9.0, 5.0, 4.0, 5.0, 5.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.77703857421875, -16.23661994934082, -15.69620132446289, -15.155782699584961, -14.615364074707031, -14.074945449829102, -13.534526824951172, -12.994108200073242, -12.453689575195312, -11.913270950317383, -11.372852325439453, -10.832433700561523, -10.292015075683594, -9.751596450805664, -9.211177825927734, -8.670759201049805, -8.130340576171875, -7.589921951293945, -7.049503326416016, -6.509084701538086, -5.968666076660156, -5.428247451782227, -4.887828826904297, -4.347410202026367, -3.8069915771484375, -3.266572952270508, -2.726154327392578, -2.1857357025146484, -1.6453170776367188, -1.104898452758789, -0.5644798278808594, -0.024061203002929688, 0.516357421875, 1.0567760467529297, 1.5971946716308594, 2.137613296508789, 2.6780319213867188, 3.2184505462646484, 3.758869171142578, 4.299287796020508, 4.8397064208984375, 5.380125045776367, 5.920543670654297, 6.460962295532227, 7.001380920410156, 7.541799545288086, 8.082218170166016, 8.622636795043945, 9.163055419921875, 9.703474044799805, 10.243892669677734, 10.784311294555664, 11.324729919433594, 11.865148544311523, 12.405567169189453, 12.945985794067383, 13.486404418945312, 14.026823043823242, 14.567241668701172, 15.107660293579102, 15.648078918457031, 16.18849754333496, 16.72891616821289, 17.26933479309082, 17.80975341796875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 6.0, 6.0, 6.0, 7.0, 5.0, 14.0, 18.0, 11.0, 14.0, 30.0, 40.0, 26.0, 36.0, 30.0, 35.0, 34.0, 32.0, 38.0, 52.0, 44.0, 56.0, 44.0, 39.0, 46.0, 34.0, 33.0, 34.0, 25.0, 20.0, 27.0, 26.0, 17.0, 16.0, 20.0, 8.0, 11.0, 12.0, 13.0, 4.0, 6.0, 8.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.75390625, -2.66571044921875, -2.5775146484375, -2.48931884765625, -2.401123046875, -2.31292724609375, -2.2247314453125, -2.13653564453125, -2.04833984375, -1.96014404296875, -1.8719482421875, -1.78375244140625, -1.695556640625, -1.60736083984375, -1.5191650390625, -1.43096923828125, -1.3427734375, -1.25457763671875, -1.1663818359375, -1.07818603515625, -0.989990234375, -0.90179443359375, -0.8135986328125, -0.72540283203125, -0.63720703125, -0.54901123046875, -0.4608154296875, -0.37261962890625, -0.284423828125, -0.19622802734375, -0.1080322265625, -0.01983642578125, 0.068359375, 0.15655517578125, 0.2447509765625, 0.33294677734375, 0.421142578125, 0.50933837890625, 0.5975341796875, 0.68572998046875, 0.77392578125, 0.86212158203125, 0.9503173828125, 1.03851318359375, 1.126708984375, 1.21490478515625, 1.3031005859375, 1.39129638671875, 1.4794921875, 1.56768798828125, 1.6558837890625, 1.74407958984375, 1.832275390625, 1.92047119140625, 2.0086669921875, 2.09686279296875, 2.18505859375, 2.27325439453125, 2.3614501953125, 2.44964599609375, 2.537841796875, 2.62603759765625, 2.7142333984375, 2.80242919921875, 2.890625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 6.0, 12.0, 12.0, 18.0, 42.0, 56.0, 79.0, 122.0, 176.0, 282.0, 431.0, 581.0, 876.0, 1344.0, 2039.0, 2975.0, 4507.0, 6917.0, 10704.0, 16764.0, 26411.0, 42110.0, 70216.0, 135766.0, 322124.0, 184042.0, 84473.0, 49321.0, 30772.0, 19492.0, 12337.0, 7922.0, 5230.0, 3476.0, 2248.0, 1548.0, 1058.0, 680.0, 459.0, 338.0, 192.0, 139.0, 89.0, 62.0, 31.0, 29.0, 22.0, 13.0, 7.0, 4.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01522064208984375, -0.014754652976989746, -0.014288663864135742, -0.013822674751281738, -0.013356685638427734, -0.01289069652557373, -0.012424707412719727, -0.011958718299865723, -0.011492729187011719, -0.011026740074157715, -0.010560750961303711, -0.010094761848449707, -0.009628772735595703, -0.0091627836227417, -0.008696794509887695, -0.008230805397033691, -0.0077648162841796875, -0.007298827171325684, -0.00683283805847168, -0.006366848945617676, -0.005900859832763672, -0.005434870719909668, -0.004968881607055664, -0.00450289249420166, -0.004036903381347656, -0.0035709142684936523, -0.0031049251556396484, -0.0026389360427856445, -0.0021729469299316406, -0.0017069578170776367, -0.0012409687042236328, -0.0007749795913696289, -0.000308990478515625, 0.0001569986343383789, 0.0006229877471923828, 0.0010889768600463867, 0.0015549659729003906, 0.0020209550857543945, 0.0024869441986083984, 0.0029529333114624023, 0.0034189224243164062, 0.00388491153717041, 0.004350900650024414, 0.004816889762878418, 0.005282878875732422, 0.005748867988586426, 0.00621485710144043, 0.006680846214294434, 0.0071468353271484375, 0.007612824440002441, 0.008078813552856445, 0.00854480266571045, 0.009010791778564453, 0.009476780891418457, 0.009942770004272461, 0.010408759117126465, 0.010874748229980469, 0.011340737342834473, 0.011806726455688477, 0.01227271556854248, 0.012738704681396484, 0.013204693794250488, 0.013670682907104492, 0.014136672019958496, 0.0146026611328125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 5.0, 3.0, 5.0, 9.0, 11.0, 8.0, 20.0, 11.0, 24.0, 23.0, 24.0, 37.0, 30.0, 37.0, 34.0, 34.0, 41.0, 40.0, 47.0, 45.0, 1068.0, 37.0, 46.0, 36.0, 44.0, 35.0, 28.0, 30.0, 42.0, 33.0, 23.0, 19.0, 20.0, 20.0, 14.0, 11.0, 11.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.21875, -2.15606689453125, -2.0933837890625, -2.03070068359375, -1.968017578125, -1.90533447265625, -1.8426513671875, -1.77996826171875, -1.71728515625, -1.65460205078125, -1.5919189453125, -1.52923583984375, -1.466552734375, -1.40386962890625, -1.3411865234375, -1.27850341796875, -1.2158203125, -1.15313720703125, -1.0904541015625, -1.02777099609375, -0.965087890625, -0.90240478515625, -0.8397216796875, -0.77703857421875, -0.71435546875, -0.65167236328125, -0.5889892578125, -0.52630615234375, -0.463623046875, -0.40093994140625, -0.3382568359375, -0.27557373046875, -0.212890625, -0.15020751953125, -0.0875244140625, -0.02484130859375, 0.037841796875, 0.10052490234375, 0.1632080078125, 0.22589111328125, 0.28857421875, 0.35125732421875, 0.4139404296875, 0.47662353515625, 0.539306640625, 0.60198974609375, 0.6646728515625, 0.72735595703125, 0.7900390625, 0.85272216796875, 0.9154052734375, 0.97808837890625, 1.040771484375, 1.10345458984375, 1.1661376953125, 1.22882080078125, 1.29150390625, 1.35418701171875, 1.4168701171875, 1.47955322265625, 1.542236328125, 1.60491943359375, 1.6676025390625, 1.73028564453125, 1.79296875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 6.0, 9.0, 7.0, 6.0, 21.0, 23.0, 26.0, 49.0, 94.0, 111.0, 174.0, 243.0, 436.0, 637.0, 1105.0, 1766.0, 2642.0, 4671.0, 7694.0, 13119.0, 22561.0, 39368.0, 69282.0, 134906.0, 1366793.0, 212532.0, 94432.0, 52037.0, 29769.0, 17200.0, 10004.0, 6030.0, 3504.0, 2226.0, 1362.0, 835.0, 525.0, 324.0, 195.0, 157.0, 94.0, 66.0, 32.0, 25.0, 22.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01184844970703125, -0.01145017147064209, -0.01105189323425293, -0.01065361499786377, -0.01025533676147461, -0.00985705852508545, -0.009458780288696289, -0.009060502052307129, -0.008662223815917969, -0.008263945579528809, -0.007865667343139648, -0.007467389106750488, -0.007069110870361328, -0.006670832633972168, -0.006272554397583008, -0.005874276161193848, -0.0054759979248046875, -0.005077719688415527, -0.004679441452026367, -0.004281163215637207, -0.003882884979248047, -0.0034846067428588867, -0.0030863285064697266, -0.0026880502700805664, -0.0022897720336914062, -0.001891493797302246, -0.001493215560913086, -0.0010949373245239258, -0.0006966590881347656, -0.00029838085174560547, 9.989738464355469e-05, 0.0004981756210327148, 0.000896453857421875, 0.0012947320938110352, 0.0016930103302001953, 0.0020912885665893555, 0.0024895668029785156, 0.0028878450393676758, 0.003286123275756836, 0.003684401512145996, 0.004082679748535156, 0.004480957984924316, 0.0048792362213134766, 0.005277514457702637, 0.005675792694091797, 0.006074070930480957, 0.006472349166870117, 0.006870627403259277, 0.0072689056396484375, 0.007667183876037598, 0.008065462112426758, 0.008463740348815918, 0.008862018585205078, 0.009260296821594238, 0.009658575057983398, 0.010056853294372559, 0.010455131530761719, 0.010853409767150879, 0.011251688003540039, 0.0116499662399292, 0.01204824447631836, 0.01244652271270752, 0.01284480094909668, 0.01324307918548584, 0.013641357421875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 927.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.0], "bins": [-1.1920928955078125e-07, -1.1641532182693481e-07, -1.1362135410308838e-07, -1.1082738637924194e-07, -1.0803341865539551e-07, -1.0523945093154907e-07, -1.0244548320770264e-07, -9.96515154838562e-08, -9.685754776000977e-08, -9.406358003616333e-08, -9.12696123123169e-08, -8.847564458847046e-08, -8.568167686462402e-08, -8.288770914077759e-08, -8.009374141693115e-08, -7.729977369308472e-08, -7.450580596923828e-08, -7.171183824539185e-08, -6.891787052154541e-08, -6.612390279769897e-08, -6.332993507385254e-08, -6.05359673500061e-08, -5.774199962615967e-08, -5.494803190231323e-08, -5.21540641784668e-08, -4.936009645462036e-08, -4.6566128730773926e-08, -4.377216100692749e-08, -4.0978193283081055e-08, -3.818422555923462e-08, -3.5390257835388184e-08, -3.259629011154175e-08, -2.9802322387695312e-08, -2.7008354663848877e-08, -2.421438694000244e-08, -2.1420419216156006e-08, -1.862645149230957e-08, -1.5832483768463135e-08, -1.30385160446167e-08, -1.0244548320770264e-08, -7.450580596923828e-09, -4.6566128730773926e-09, -1.862645149230957e-09, 9.313225746154785e-10, 3.725290298461914e-09, 6.51925802230835e-09, 9.313225746154785e-09, 1.210719347000122e-08, 1.4901161193847656e-08, 1.7695128917694092e-08, 2.0489096641540527e-08, 2.3283064365386963e-08, 2.60770320892334e-08, 2.8870999813079834e-08, 3.166496753692627e-08, 3.4458935260772705e-08, 3.725290298461914e-08, 4.0046870708465576e-08, 4.284083843231201e-08, 4.563480615615845e-08, 4.842877388000488e-08, 5.122274160385132e-08, 5.4016709327697754e-08, 5.681067705154419e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [11.0, 0.0, 0.0, 0.0, 1.0, 0.0, 22.0, 0.0, 13.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 22.0, 26.0, 23.0, 23.0, 89.0, 212.0, 2942.0, 0.0, 23400.0, 994937.0, 23486.0, 2909.0, 224.0, 97.0, 13.0, 0.0, 24.0, 24.0, 22.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 12.0, 21.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3113021850585938e-06, -1.259148120880127e-06, -1.2069940567016602e-06, -1.1548399925231934e-06, -1.1026859283447266e-06, -1.0505318641662598e-06, -9.98377799987793e-07, -9.462237358093262e-07, -8.940696716308594e-07, -8.419156074523926e-07, -7.897615432739258e-07, -7.37607479095459e-07, -6.854534149169922e-07, -6.332993507385254e-07, -5.811452865600586e-07, -5.289912223815918e-07, -4.76837158203125e-07, -4.246830940246582e-07, -3.725290298461914e-07, -3.203749656677246e-07, -2.682209014892578e-07, -2.1606683731079102e-07, -1.6391277313232422e-07, -1.1175870895385742e-07, -5.960464477539063e-08, -7.450580596923828e-09, 4.470348358154297e-08, 9.685754776000977e-08, 1.4901161193847656e-07, 2.0116567611694336e-07, 2.5331974029541016e-07, 3.0547380447387695e-07, 3.5762786865234375e-07, 4.0978193283081055e-07, 4.6193599700927734e-07, 5.140900611877441e-07, 5.662441253662109e-07, 6.183981895446777e-07, 6.705522537231445e-07, 7.227063179016113e-07, 7.748603820800781e-07, 8.270144462585449e-07, 8.791685104370117e-07, 9.313225746154785e-07, 9.834766387939453e-07, 1.0356307029724121e-06, 1.087784767150879e-06, 1.1399388313293457e-06, 1.1920928955078125e-06, 1.2442469596862793e-06, 1.296401023864746e-06, 1.3485550880432129e-06, 1.4007091522216797e-06, 1.4528632164001465e-06, 1.5050172805786133e-06, 1.55717134475708e-06, 1.6093254089355469e-06, 1.6614794731140137e-06, 1.7136335372924805e-06, 1.7657876014709473e-06, 1.817941665649414e-06, 1.8700957298278809e-06, 1.9222497940063477e-06, 1.9744038581848145e-06, 2.0265579223632812e-06]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 6.0, 6.0, 6.0, 7.0, 5.0, 14.0, 18.0, 11.0, 14.0, 30.0, 40.0, 26.0, 36.0, 30.0, 35.0, 34.0, 32.0, 38.0, 52.0, 44.0, 56.0, 44.0, 39.0, 46.0, 34.0, 33.0, 34.0, 25.0, 20.0, 27.0, 26.0, 17.0, 16.0, 20.0, 8.0, 11.0, 12.0, 13.0, 4.0, 6.0, 8.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.75390625, -2.66571044921875, -2.5775146484375, -2.48931884765625, -2.401123046875, -2.31292724609375, -2.2247314453125, -2.13653564453125, -2.04833984375, -1.96014404296875, -1.8719482421875, -1.78375244140625, -1.695556640625, -1.60736083984375, -1.5191650390625, -1.43096923828125, -1.3427734375, -1.25457763671875, -1.1663818359375, -1.07818603515625, -0.989990234375, -0.90179443359375, -0.8135986328125, -0.72540283203125, -0.63720703125, -0.54901123046875, -0.4608154296875, -0.37261962890625, -0.284423828125, -0.19622802734375, -0.1080322265625, -0.01983642578125, 0.068359375, 0.15655517578125, 0.2447509765625, 0.33294677734375, 0.421142578125, 0.50933837890625, 0.5975341796875, 0.68572998046875, 0.77392578125, 0.86212158203125, 0.9503173828125, 1.03851318359375, 1.126708984375, 1.21490478515625, 1.3031005859375, 1.39129638671875, 1.4794921875, 1.56768798828125, 1.6558837890625, 1.74407958984375, 1.832275390625, 1.92047119140625, 2.0086669921875, 2.09686279296875, 2.18505859375, 2.27325439453125, 2.3614501953125, 2.44964599609375, 2.537841796875, 2.62603759765625, 2.7142333984375, 2.80242919921875, 2.890625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 7.0, 7.0, 12.0, 24.0, 23.0, 58.0, 74.0, 115.0, 219.0, 307.0, 553.0, 942.0, 1611.0, 2909.0, 4965.0, 8927.0, 17020.0, 34403.0, 83773.0, 320838.0, 396891.0, 96053.0, 37849.0, 18234.0, 9954.0, 5441.0, 3086.0, 1755.0, 938.0, 575.0, 365.0, 217.0, 147.0, 75.0, 57.0, 46.0, 33.0, 19.0, 15.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.90625, -2.81561279296875, -2.7249755859375, -2.63433837890625, -2.543701171875, -2.45306396484375, -2.3624267578125, -2.27178955078125, -2.18115234375, -2.09051513671875, -1.9998779296875, -1.90924072265625, -1.818603515625, -1.72796630859375, -1.6373291015625, -1.54669189453125, -1.4560546875, -1.36541748046875, -1.2747802734375, -1.18414306640625, -1.093505859375, -1.00286865234375, -0.9122314453125, -0.82159423828125, -0.73095703125, -0.64031982421875, -0.5496826171875, -0.45904541015625, -0.368408203125, -0.27777099609375, -0.1871337890625, -0.09649658203125, -0.005859375, 0.08477783203125, 0.1754150390625, 0.26605224609375, 0.356689453125, 0.44732666015625, 0.5379638671875, 0.62860107421875, 0.71923828125, 0.80987548828125, 0.9005126953125, 0.99114990234375, 1.081787109375, 1.17242431640625, 1.2630615234375, 1.35369873046875, 1.4443359375, 1.53497314453125, 1.6256103515625, 1.71624755859375, 1.806884765625, 1.89752197265625, 1.9881591796875, 2.07879638671875, 2.16943359375, 2.26007080078125, 2.3507080078125, 2.44134521484375, 2.531982421875, 2.62261962890625, 2.7132568359375, 2.80389404296875, 2.89453125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 5.0, 5.0, 6.0, 4.0, 11.0, 10.0, 12.0, 19.0, 16.0, 20.0, 21.0, 24.0, 37.0, 41.0, 42.0, 44.0, 55.0, 46.0, 77.0, 171.0, 1653.0, 215.0, 100.0, 58.0, 48.0, 42.0, 40.0, 31.0, 34.0, 20.0, 29.0, 28.0, 9.0, 13.0, 17.0, 10.0, 10.0, 10.0, 11.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.6171875, -10.3006591796875, -9.984130859375, -9.6676025390625, -9.35107421875, -9.0345458984375, -8.718017578125, -8.4014892578125, -8.0849609375, -7.7684326171875, -7.451904296875, -7.1353759765625, -6.81884765625, -6.5023193359375, -6.185791015625, -5.8692626953125, -5.552734375, -5.2362060546875, -4.919677734375, -4.6031494140625, -4.28662109375, -3.9700927734375, -3.653564453125, -3.3370361328125, -3.0205078125, -2.7039794921875, -2.387451171875, -2.0709228515625, -1.75439453125, -1.4378662109375, -1.121337890625, -0.8048095703125, -0.48828125, -0.1717529296875, 0.144775390625, 0.4613037109375, 0.77783203125, 1.0943603515625, 1.410888671875, 1.7274169921875, 2.0439453125, 2.3604736328125, 2.677001953125, 2.9935302734375, 3.31005859375, 3.6265869140625, 3.943115234375, 4.2596435546875, 4.576171875, 4.8927001953125, 5.209228515625, 5.5257568359375, 5.84228515625, 6.1588134765625, 6.475341796875, 6.7918701171875, 7.1083984375, 7.4249267578125, 7.741455078125, 8.0579833984375, 8.37451171875, 8.6910400390625, 9.007568359375, 9.3240966796875, 9.640625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 11.0, 12.0, 14.0, 11.0, 19.0, 16.0, 18.0, 35.0, 43.0, 53.0, 79.0, 86.0, 119.0, 148.0, 233.0, 455.0, 1725.0, 39345.0, 3068999.0, 31416.0, 1505.0, 435.0, 254.0, 146.0, 122.0, 100.0, 84.0, 55.0, 26.0, 35.0, 16.0, 29.0, 13.0, 15.0, 7.0, 5.0, 6.0, 8.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.859375, -21.14208984375, -20.4248046875, -19.70751953125, -18.990234375, -18.27294921875, -17.5556640625, -16.83837890625, -16.12109375, -15.40380859375, -14.6865234375, -13.96923828125, -13.251953125, -12.53466796875, -11.8173828125, -11.10009765625, -10.3828125, -9.66552734375, -8.9482421875, -8.23095703125, -7.513671875, -6.79638671875, -6.0791015625, -5.36181640625, -4.64453125, -3.92724609375, -3.2099609375, -2.49267578125, -1.775390625, -1.05810546875, -0.3408203125, 0.37646484375, 1.09375, 1.81103515625, 2.5283203125, 3.24560546875, 3.962890625, 4.68017578125, 5.3974609375, 6.11474609375, 6.83203125, 7.54931640625, 8.2666015625, 8.98388671875, 9.701171875, 10.41845703125, 11.1357421875, 11.85302734375, 12.5703125, 13.28759765625, 14.0048828125, 14.72216796875, 15.439453125, 16.15673828125, 16.8740234375, 17.59130859375, 18.30859375, 19.02587890625, 19.7431640625, 20.46044921875, 21.177734375, 21.89501953125, 22.6123046875, 23.32958984375, 24.046875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [195.0, 808.0, 15.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.190304756164551, -1.1983695030212402, 2.7935657501220703, 6.785500526428223, 10.777436256408691, 14.76937198638916, 18.761306762695312, 22.75324249267578, 26.74517822265625, 30.73711395263672, 34.72904968261719, 38.720985412597656, 42.712921142578125, 46.704856872558594, 50.6967887878418, 54.688724517822266, 58.680660247802734, 62.6725959777832, 66.6645278930664, 70.65646362304688, 74.64839935302734, 78.64033508300781, 82.63227081298828, 86.62420654296875, 90.61614227294922, 94.60807800292969, 98.60001373291016, 102.59194946289062, 106.5838851928711, 110.57582092285156, 114.5677490234375, 118.5596923828125, 122.55162048339844, 126.5435562133789, 130.53549194335938, 134.5274200439453, 138.5193634033203, 142.51129150390625, 146.50323486328125, 150.4951629638672, 154.4871063232422, 158.47903442382812, 162.47097778320312, 166.46290588378906, 170.45484924316406, 174.44677734375, 178.438720703125, 182.43064880371094, 186.42257690429688, 190.4145050048828, 194.4064483642578, 198.39837646484375, 202.39031982421875, 206.3822479248047, 210.3741912841797, 214.36611938476562, 218.35806274414062, 222.34999084472656, 226.34193420410156, 230.3338623046875, 234.3258056640625, 238.31773376464844, 242.30967712402344, 246.30160522460938, 250.29354858398438]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 5.0, 3.0, 8.0, 7.0, 12.0, 15.0, 12.0, 17.0, 13.0, 22.0, 32.0, 23.0, 25.0, 31.0, 34.0, 46.0, 30.0, 36.0, 32.0, 33.0, 51.0, 37.0, 52.0, 33.0, 31.0, 31.0, 30.0, 36.0, 28.0, 27.0, 26.0, 22.0, 24.0, 17.0, 14.0, 16.0, 13.0, 16.0, 6.0, 4.0, 17.0, 7.0, 3.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-24.78132438659668, -24.04560089111328, -23.309879302978516, -22.574155807495117, -21.83843231201172, -21.10270881652832, -20.366985321044922, -19.631263732910156, -18.895540237426758, -18.15981674194336, -17.424095153808594, -16.688371658325195, -15.952648162841797, -15.216924667358398, -14.481202125549316, -13.745479583740234, -13.009756088256836, -12.274032592773438, -11.538310050964355, -10.802587509155273, -10.066864013671875, -9.331140518188477, -8.595417976379395, -7.859694957733154, -7.123971939086914, -6.388248920440674, -5.652525901794434, -4.916802883148193, -4.181079864501953, -3.445356845855713, -2.7096338272094727, -1.9739108085632324, -1.2381877899169922, -0.502464771270752, 0.23325824737548828, 0.9689812660217285, 1.7047042846679688, 2.440427303314209, 3.176150321960449, 3.9118733406066895, 4.64759635925293, 5.38331937789917, 6.11904239654541, 6.85476541519165, 7.590488433837891, 8.326211929321289, 9.061934471130371, 9.797657012939453, 10.533380508422852, 11.26910400390625, 12.004826545715332, 12.740549087524414, 13.476272583007812, 14.211996078491211, 14.947718620300293, 15.683441162109375, 16.419164657592773, 17.154888153076172, 17.890609741210938, 18.626333236694336, 19.362056732177734, 20.097780227661133, 20.83350372314453, 21.569225311279297, 22.304948806762695]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 5.0, 3.0, 10.0, 10.0, 10.0, 16.0, 17.0, 22.0, 25.0, 24.0, 39.0, 36.0, 20.0, 40.0, 37.0, 48.0, 46.0, 47.0, 40.0, 44.0, 49.0, 50.0, 42.0, 29.0, 32.0, 30.0, 31.0, 25.0, 21.0, 24.0, 19.0, 15.0, 11.0, 11.0, 18.0, 13.0, 7.0, 4.0, 7.0, 5.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.892578125, -2.79925537109375, -2.7059326171875, -2.61260986328125, -2.519287109375, -2.42596435546875, -2.3326416015625, -2.23931884765625, -2.14599609375, -2.05267333984375, -1.9593505859375, -1.86602783203125, -1.772705078125, -1.67938232421875, -1.5860595703125, -1.49273681640625, -1.3994140625, -1.30609130859375, -1.2127685546875, -1.11944580078125, -1.026123046875, -0.93280029296875, -0.8394775390625, -0.74615478515625, -0.65283203125, -0.55950927734375, -0.4661865234375, -0.37286376953125, -0.279541015625, -0.18621826171875, -0.0928955078125, 0.00042724609375, 0.09375, 0.18707275390625, 0.2803955078125, 0.37371826171875, 0.467041015625, 0.56036376953125, 0.6536865234375, 0.74700927734375, 0.84033203125, 0.93365478515625, 1.0269775390625, 1.12030029296875, 1.213623046875, 1.30694580078125, 1.4002685546875, 1.49359130859375, 1.5869140625, 1.68023681640625, 1.7735595703125, 1.86688232421875, 1.960205078125, 2.05352783203125, 2.1468505859375, 2.24017333984375, 2.33349609375, 2.42681884765625, 2.5201416015625, 2.61346435546875, 2.706787109375, 2.80010986328125, 2.8934326171875, 2.98675537109375, 3.080078125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 6.0, 1.0, 8.0, 10.0, 16.0, 18.0, 21.0, 28.0, 35.0, 59.0, 78.0, 121.0, 299.0, 704.0, 1765.0, 5808.0, 24413.0, 139936.0, 1240918.0, 2380134.0, 336585.0, 48048.0, 10392.0, 2907.0, 1006.0, 428.0, 186.0, 100.0, 66.0, 43.0, 31.0, 13.0, 17.0, 17.0, 10.0, 11.0, 6.0, 8.0, 5.0, 2.0, 2.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.015625, -6.78338623046875, -6.5511474609375, -6.31890869140625, -6.086669921875, -5.85443115234375, -5.6221923828125, -5.38995361328125, -5.15771484375, -4.92547607421875, -4.6932373046875, -4.46099853515625, -4.228759765625, -3.99652099609375, -3.7642822265625, -3.53204345703125, -3.2998046875, -3.06756591796875, -2.8353271484375, -2.60308837890625, -2.370849609375, -2.13861083984375, -1.9063720703125, -1.67413330078125, -1.44189453125, -1.20965576171875, -0.9774169921875, -0.74517822265625, -0.512939453125, -0.28070068359375, -0.0484619140625, 0.18377685546875, 0.416015625, 0.64825439453125, 0.8804931640625, 1.11273193359375, 1.344970703125, 1.57720947265625, 1.8094482421875, 2.04168701171875, 2.27392578125, 2.50616455078125, 2.7384033203125, 2.97064208984375, 3.202880859375, 3.43511962890625, 3.6673583984375, 3.89959716796875, 4.1318359375, 4.36407470703125, 4.5963134765625, 4.82855224609375, 5.060791015625, 5.29302978515625, 5.5252685546875, 5.75750732421875, 5.98974609375, 6.22198486328125, 6.4542236328125, 6.68646240234375, 6.918701171875, 7.15093994140625, 7.3831787109375, 7.61541748046875, 7.84765625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 2.0, 9.0, 8.0, 14.0, 18.0, 25.0, 37.0, 36.0, 67.0, 86.0, 106.0, 150.0, 158.0, 254.0, 380.0, 396.0, 488.0, 440.0, 340.0, 238.0, 207.0, 171.0, 118.0, 90.0, 65.0, 45.0, 36.0, 36.0, 16.0, 11.0, 7.0, 2.0, 6.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.54296875, -5.36737060546875, -5.1917724609375, -5.01617431640625, -4.840576171875, -4.66497802734375, -4.4893798828125, -4.31378173828125, -4.13818359375, -3.96258544921875, -3.7869873046875, -3.61138916015625, -3.435791015625, -3.26019287109375, -3.0845947265625, -2.90899658203125, -2.7333984375, -2.55780029296875, -2.3822021484375, -2.20660400390625, -2.031005859375, -1.85540771484375, -1.6798095703125, -1.50421142578125, -1.32861328125, -1.15301513671875, -0.9774169921875, -0.80181884765625, -0.626220703125, -0.45062255859375, -0.2750244140625, -0.09942626953125, 0.076171875, 0.25177001953125, 0.4273681640625, 0.60296630859375, 0.778564453125, 0.95416259765625, 1.1297607421875, 1.30535888671875, 1.48095703125, 1.65655517578125, 1.8321533203125, 2.00775146484375, 2.183349609375, 2.35894775390625, 2.5345458984375, 2.71014404296875, 2.8857421875, 3.06134033203125, 3.2369384765625, 3.41253662109375, 3.588134765625, 3.76373291015625, 3.9393310546875, 4.11492919921875, 4.29052734375, 4.46612548828125, 4.6417236328125, 4.81732177734375, 4.992919921875, 5.16851806640625, 5.3441162109375, 5.51971435546875, 5.6953125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 10.0, 16.0, 9.0, 25.0, 33.0, 28.0, 75.0, 87.0, 122.0, 166.0, 249.0, 309.0, 482.0, 2192.0, 109337.0, 3897362.0, 179165.0, 2906.0, 565.0, 300.0, 248.0, 154.0, 122.0, 90.0, 55.0, 41.0, 32.0, 29.0, 21.0, 11.0, 10.0, 6.0, 5.0, 4.0, 8.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.640625, -23.859619140625, -23.07861328125, -22.297607421875, -21.5166015625, -20.735595703125, -19.95458984375, -19.173583984375, -18.392578125, -17.611572265625, -16.83056640625, -16.049560546875, -15.2685546875, -14.487548828125, -13.70654296875, -12.925537109375, -12.14453125, -11.363525390625, -10.58251953125, -9.801513671875, -9.0205078125, -8.239501953125, -7.45849609375, -6.677490234375, -5.896484375, -5.115478515625, -4.33447265625, -3.553466796875, -2.7724609375, -1.991455078125, -1.21044921875, -0.429443359375, 0.3515625, 1.132568359375, 1.91357421875, 2.694580078125, 3.4755859375, 4.256591796875, 5.03759765625, 5.818603515625, 6.599609375, 7.380615234375, 8.16162109375, 8.942626953125, 9.7236328125, 10.504638671875, 11.28564453125, 12.066650390625, 12.84765625, 13.628662109375, 14.40966796875, 15.190673828125, 15.9716796875, 16.752685546875, 17.53369140625, 18.314697265625, 19.095703125, 19.876708984375, 20.65771484375, 21.438720703125, 22.2197265625, 23.000732421875, 23.78173828125, 24.562744140625, 25.34375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 9.0, 18.0, 49.0, 60.0, 113.0, 172.0, 179.0, 142.0, 109.0, 86.0, 43.0, 17.0, 10.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.216331481933594, -14.920907020568848, -13.625482559204102, -12.330058097839355, -11.03463363647461, -9.739209175109863, -8.443784713745117, -7.148360252380371, -5.852935791015625, -4.557511329650879, -3.262086868286133, -1.9666624069213867, -0.6712379455566406, 0.6241865158081055, 1.9196109771728516, 3.2150354385375977, 4.510459899902344, 5.80588436126709, 7.101308822631836, 8.396733283996582, 9.692157745361328, 10.987582206726074, 12.28300666809082, 13.578431129455566, 14.873855590820312, 16.169281005859375, 17.464704513549805, 18.760128021240234, 20.055553436279297, 21.35097885131836, 22.64640235900879, 23.94182586669922, 25.23725128173828, 26.532676696777344, 27.828100204467773, 29.123523712158203, 30.418949127197266, 31.714374542236328, 33.009796142578125, 34.30522155761719, 35.60064697265625, 36.89607238769531, 38.191497802734375, 39.48691940307617, 40.782344818115234, 42.0777702331543, 43.373191833496094, 44.668617248535156, 45.96404266357422, 47.25946807861328, 48.554893493652344, 49.85031509399414, 51.1457405090332, 52.441165924072266, 53.73658752441406, 55.032012939453125, 56.32743835449219, 57.62286376953125, 58.91828918457031, 60.21371078491211, 61.50913619995117, 62.804561614990234, 64.09998321533203, 65.3954086303711, 66.69083404541016]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 7.0, 9.0, 4.0, 6.0, 8.0, 7.0, 21.0, 18.0, 17.0, 30.0, 26.0, 23.0, 32.0, 37.0, 36.0, 42.0, 58.0, 47.0, 55.0, 42.0, 47.0, 46.0, 49.0, 54.0, 26.0, 32.0, 34.0, 24.0, 13.0, 32.0, 24.0, 20.0, 15.0, 12.0, 12.0, 6.0, 11.0, 7.0, 10.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.41748046875, -18.791841506958008, -18.166202545166016, -17.540563583374023, -16.91492462158203, -16.289287567138672, -15.66364860534668, -15.038009643554688, -14.412370681762695, -13.786731719970703, -13.161092758178711, -12.535454750061035, -11.909815788269043, -11.28417682647705, -10.658538818359375, -10.032899856567383, -9.40726089477539, -8.781621932983398, -8.155982971191406, -7.5303449630737305, -6.904706001281738, -6.279067039489746, -5.653428554534912, -5.027790069580078, -4.402151107788086, -3.776512384414673, -3.1508736610412598, -2.5252349376678467, -1.8995962142944336, -1.2739574909210205, -0.6483187675476074, -0.022680282592773438, 0.6029586791992188, 1.2285974025726318, 1.854236125946045, 2.479874849319458, 3.105513572692871, 3.731152296066284, 4.356791019439697, 4.982429504394531, 5.608068466186523, 6.233707427978516, 6.85934591293335, 7.484984397888184, 8.110623359680176, 8.736262321472168, 9.361900329589844, 9.987539291381836, 10.613178253173828, 11.23881721496582, 11.864456176757812, 12.490094184875488, 13.11573314666748, 13.741372108459473, 14.367010116577148, 14.99264907836914, 15.618288040161133, 16.243927001953125, 16.869565963745117, 17.49520492553711, 18.12084197998047, 18.74648094177246, 19.372119903564453, 19.997758865356445, 20.623397827148438]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 4.0, 11.0, 11.0, 18.0, 20.0, 12.0, 25.0, 25.0, 33.0, 17.0, 22.0, 27.0, 34.0, 37.0, 44.0, 38.0, 55.0, 47.0, 44.0, 33.0, 37.0, 43.0, 32.0, 45.0, 32.0, 31.0, 25.0, 19.0, 23.0, 28.0, 20.0, 19.0, 11.0, 10.0, 9.0, 9.0, 11.0, 7.0, 2.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-2.955078125, -2.86663818359375, -2.7781982421875, -2.68975830078125, -2.601318359375, -2.51287841796875, -2.4244384765625, -2.33599853515625, -2.24755859375, -2.15911865234375, -2.0706787109375, -1.98223876953125, -1.893798828125, -1.80535888671875, -1.7169189453125, -1.62847900390625, -1.5400390625, -1.45159912109375, -1.3631591796875, -1.27471923828125, -1.186279296875, -1.09783935546875, -1.0093994140625, -0.92095947265625, -0.83251953125, -0.74407958984375, -0.6556396484375, -0.56719970703125, -0.478759765625, -0.39031982421875, -0.3018798828125, -0.21343994140625, -0.125, -0.03656005859375, 0.0518798828125, 0.14031982421875, 0.228759765625, 0.31719970703125, 0.4056396484375, 0.49407958984375, 0.58251953125, 0.67095947265625, 0.7593994140625, 0.84783935546875, 0.936279296875, 1.02471923828125, 1.1131591796875, 1.20159912109375, 1.2900390625, 1.37847900390625, 1.4669189453125, 1.55535888671875, 1.643798828125, 1.73223876953125, 1.8206787109375, 1.90911865234375, 1.99755859375, 2.08599853515625, 2.1744384765625, 2.26287841796875, 2.351318359375, 2.43975830078125, 2.5281982421875, 2.61663818359375, 2.705078125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 11.0, 20.0, 22.0, 31.0, 46.0, 62.0, 103.0, 141.0, 194.0, 264.0, 391.0, 559.0, 723.0, 1131.0, 1519.0, 2231.0, 3094.0, 4395.0, 6449.0, 9088.0, 12969.0, 18412.0, 26455.0, 38911.0, 61798.0, 105708.0, 231272.0, 229154.0, 105630.0, 60819.0, 38741.0, 26600.0, 18530.0, 12963.0, 9026.0, 6216.0, 4353.0, 3027.0, 2180.0, 1464.0, 1118.0, 772.0, 567.0, 417.0, 280.0, 209.0, 142.0, 114.0, 78.0, 47.0, 36.0, 30.0, 15.0, 11.0, 8.0, 5.0, 2.0, 2.0], "bins": [-0.0134124755859375, -0.013005971908569336, -0.012599468231201172, -0.012192964553833008, -0.011786460876464844, -0.01137995719909668, -0.010973453521728516, -0.010566949844360352, -0.010160446166992188, -0.009753942489624023, -0.00934743881225586, -0.008940935134887695, -0.008534431457519531, -0.008127927780151367, -0.007721424102783203, -0.007314920425415039, -0.006908416748046875, -0.006501913070678711, -0.006095409393310547, -0.005688905715942383, -0.005282402038574219, -0.004875898361206055, -0.004469394683837891, -0.0040628910064697266, -0.0036563873291015625, -0.0032498836517333984, -0.0028433799743652344, -0.0024368762969970703, -0.0020303726196289062, -0.0016238689422607422, -0.0012173652648925781, -0.0008108615875244141, -0.00040435791015625, 2.1457672119140625e-06, 0.0004086494445800781, 0.0008151531219482422, 0.0012216567993164062, 0.0016281604766845703, 0.0020346641540527344, 0.0024411678314208984, 0.0028476715087890625, 0.0032541751861572266, 0.0036606788635253906, 0.004067182540893555, 0.004473686218261719, 0.004880189895629883, 0.005286693572998047, 0.005693197250366211, 0.006099700927734375, 0.006506204605102539, 0.006912708282470703, 0.007319211959838867, 0.007725715637207031, 0.008132219314575195, 0.00853872299194336, 0.008945226669311523, 0.009351730346679688, 0.009758234024047852, 0.010164737701416016, 0.01057124137878418, 0.010977745056152344, 0.011384248733520508, 0.011790752410888672, 0.012197256088256836, 0.012603759765625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 8.0, 2.0, 6.0, 13.0, 20.0, 25.0, 23.0, 20.0, 25.0, 24.0, 35.0, 38.0, 52.0, 46.0, 42.0, 54.0, 50.0, 53.0, 1066.0, 39.0, 36.0, 41.0, 42.0, 31.0, 38.0, 27.0, 23.0, 27.0, 25.0, 19.0, 20.0, 10.0, 11.0, 12.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.18359375, -2.115631103515625, -2.04766845703125, -1.979705810546875, -1.9117431640625, -1.843780517578125, -1.77581787109375, -1.707855224609375, -1.639892578125, -1.571929931640625, -1.50396728515625, -1.436004638671875, -1.3680419921875, -1.300079345703125, -1.23211669921875, -1.164154052734375, -1.09619140625, -1.028228759765625, -0.96026611328125, -0.892303466796875, -0.8243408203125, -0.756378173828125, -0.68841552734375, -0.620452880859375, -0.552490234375, -0.484527587890625, -0.41656494140625, -0.348602294921875, -0.2806396484375, -0.212677001953125, -0.14471435546875, -0.076751708984375, -0.0087890625, 0.059173583984375, 0.12713623046875, 0.195098876953125, 0.2630615234375, 0.331024169921875, 0.39898681640625, 0.466949462890625, 0.534912109375, 0.602874755859375, 0.67083740234375, 0.738800048828125, 0.8067626953125, 0.874725341796875, 0.94268798828125, 1.010650634765625, 1.07861328125, 1.146575927734375, 1.21453857421875, 1.282501220703125, 1.3504638671875, 1.418426513671875, 1.48638916015625, 1.554351806640625, 1.622314453125, 1.690277099609375, 1.75823974609375, 1.826202392578125, 1.8941650390625, 1.962127685546875, 2.03009033203125, 2.098052978515625, 2.166015625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 9.0, 11.0, 13.0, 22.0, 41.0, 33.0, 70.0, 119.0, 181.0, 263.0, 407.0, 635.0, 1027.0, 1726.0, 2865.0, 4354.0, 7653.0, 12496.0, 21738.0, 37289.0, 67708.0, 134305.0, 1364971.0, 221020.0, 96199.0, 51020.0, 28958.0, 16738.0, 9940.0, 5922.0, 3583.0, 2166.0, 1381.0, 771.0, 498.0, 363.0, 217.0, 150.0, 95.0, 58.0, 40.0, 29.0, 17.0, 9.0, 18.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01311492919921875, -0.012702107429504395, -0.012289285659790039, -0.011876463890075684, -0.011463642120361328, -0.011050820350646973, -0.010637998580932617, -0.010225176811218262, -0.009812355041503906, -0.00939953327178955, -0.008986711502075195, -0.00857388973236084, -0.008161067962646484, -0.007748246192932129, -0.0073354244232177734, -0.006922602653503418, -0.0065097808837890625, -0.006096959114074707, -0.0056841373443603516, -0.005271315574645996, -0.004858493804931641, -0.004445672035217285, -0.00403285026550293, -0.0036200284957885742, -0.0032072067260742188, -0.0027943849563598633, -0.002381563186645508, -0.0019687414169311523, -0.0015559196472167969, -0.0011430978775024414, -0.0007302761077880859, -0.00031745433807373047, 9.5367431640625e-05, 0.0005081892013549805, 0.0009210109710693359, 0.0013338327407836914, 0.0017466545104980469, 0.0021594762802124023, 0.002572298049926758, 0.0029851198196411133, 0.0033979415893554688, 0.0038107633590698242, 0.00422358512878418, 0.004636406898498535, 0.005049228668212891, 0.005462050437927246, 0.0058748722076416016, 0.006287693977355957, 0.0067005157470703125, 0.007113337516784668, 0.0075261592864990234, 0.007938981056213379, 0.008351802825927734, 0.00876462459564209, 0.009177446365356445, 0.0095902681350708, 0.010003089904785156, 0.010415911674499512, 0.010828733444213867, 0.011241555213928223, 0.011654376983642578, 0.012067198753356934, 0.012480020523071289, 0.012892842292785645, 0.0133056640625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 881.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-07, -1.1455267667770386e-07, -1.0989606380462646e-07, -1.0523945093154907e-07, -1.0058283805847168e-07, -9.592622518539429e-08, -9.12696123123169e-08, -8.66129994392395e-08, -8.195638656616211e-08, -7.729977369308472e-08, -7.264316082000732e-08, -6.798654794692993e-08, -6.332993507385254e-08, -5.8673322200775146e-08, -5.4016709327697754e-08, -4.936009645462036e-08, -4.470348358154297e-08, -4.0046870708465576e-08, -3.5390257835388184e-08, -3.073364496231079e-08, -2.60770320892334e-08, -2.1420419216156006e-08, -1.6763806343078613e-08, -1.210719347000122e-08, -7.450580596923828e-09, -2.7939677238464355e-09, 1.862645149230957e-09, 6.51925802230835e-09, 1.1175870895385742e-08, 1.5832483768463135e-08, 2.0489096641540527e-08, 2.514570951461792e-08, 2.9802322387695312e-08, 3.4458935260772705e-08, 3.91155481338501e-08, 4.377216100692749e-08, 4.842877388000488e-08, 5.3085386753082275e-08, 5.774199962615967e-08, 6.239861249923706e-08, 6.705522537231445e-08, 7.171183824539185e-08, 7.636845111846924e-08, 8.102506399154663e-08, 8.568167686462402e-08, 9.033828973770142e-08, 9.499490261077881e-08, 9.96515154838562e-08, 1.043081283569336e-07, 1.0896474123001099e-07, 1.1362135410308838e-07, 1.1827796697616577e-07, 1.2293457984924316e-07, 1.2759119272232056e-07, 1.3224780559539795e-07, 1.3690441846847534e-07, 1.4156103134155273e-07, 1.4621764421463013e-07, 1.5087425708770752e-07, 1.555308699607849e-07, 1.601874828338623e-07, 1.648440957069397e-07, 1.695007085800171e-07, 1.7415732145309448e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 13.0, 2.0, 24.0, 17.0, 2.0, 0.0, 2.0, 6.0, 67.0, 51.0, 157.0, 3992.0, 32987.0, 1006890.0, 3978.0, 138.0, 72.0, 76.0, 3.0, 4.0, 1.0, 0.0, 11.0, 31.0, 1.0, 19.0, 12.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.993511199951172e-06, -3.893859684467316e-06, -3.7942081689834595e-06, -3.6945566534996033e-06, -3.594905138015747e-06, -3.495253622531891e-06, -3.3956021070480347e-06, -3.2959505915641785e-06, -3.1962990760803223e-06, -3.096647560596466e-06, -2.99699604511261e-06, -2.8973445296287537e-06, -2.7976930141448975e-06, -2.6980414986610413e-06, -2.598389983177185e-06, -2.498738467693329e-06, -2.3990869522094727e-06, -2.2994354367256165e-06, -2.1997839212417603e-06, -2.100132405757904e-06, -2.000480890274048e-06, -1.9008293747901917e-06, -1.8011778593063354e-06, -1.7015263438224792e-06, -1.601874828338623e-06, -1.5022233128547668e-06, -1.4025717973709106e-06, -1.3029202818870544e-06, -1.2032687664031982e-06, -1.103617250919342e-06, -1.0039657354354858e-06, -9.043142199516296e-07, -8.046627044677734e-07, -7.050111889839172e-07, -6.05359673500061e-07, -5.057081580162048e-07, -4.0605664253234863e-07, -3.0640512704849243e-07, -2.0675361156463623e-07, -1.0710209608078003e-07, -7.450580596923828e-09, 9.220093488693237e-08, 1.9185245037078857e-07, 2.915039658546448e-07, 3.91155481338501e-07, 4.908069968223572e-07, 5.904585123062134e-07, 6.901100277900696e-07, 7.897615432739258e-07, 8.89413058757782e-07, 9.890645742416382e-07, 1.0887160897254944e-06, 1.1883676052093506e-06, 1.2880191206932068e-06, 1.387670636177063e-06, 1.4873221516609192e-06, 1.5869736671447754e-06, 1.6866251826286316e-06, 1.7862766981124878e-06, 1.885928213596344e-06, 1.9855797290802e-06, 2.0852312445640564e-06, 2.1848827600479126e-06, 2.284534275531769e-06, 2.384185791015625e-06]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1022.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 9.063336747772155e-10, 1.812667349554431e-09, 2.7190010243316465e-09, 3.625334699108862e-09, 4.5316683738860775e-09, 5.438002048663293e-09, 6.3443357234405084e-09, 7.250669398217724e-09, 8.15700307299494e-09, 9.063336747772155e-09, 9.96967042254937e-09, 1.0876004097326586e-08, 1.1782337772103801e-08, 1.2688671446881017e-08, 1.3595005121658232e-08, 1.4501338796435448e-08, 1.5407671583034244e-08, 1.631400614598988e-08, 1.7220340708945514e-08, 1.812667349554431e-08, 1.9033006282143106e-08, 1.993934084509874e-08, 2.0845675408054376e-08, 2.1752008194653172e-08, 2.2658340981251968e-08, 2.3564675544207603e-08, 2.4471010107163238e-08, 2.5377342893762034e-08, 2.628367568036083e-08, 2.7190010243316465e-08, 2.80963448062721e-08, 2.9002677592870896e-08, 2.990901037946969e-08, 3.081534316606849e-08, 3.172167950538096e-08, 3.262801229197976e-08, 3.3534345078578554e-08, 3.444068141789103e-08, 3.5347014204489824e-08, 3.625334699108862e-08, 3.7159679777687415e-08, 3.806601256428621e-08, 3.8972348903598686e-08, 3.987868169019748e-08, 4.078501447679628e-08, 4.169135081610875e-08, 4.259768360270755e-08, 4.3504016389306344e-08, 4.441034917590514e-08, 4.5316681962503935e-08, 4.622301830181641e-08, 4.7129351088415206e-08, 4.8035683875014e-08, 4.8942020214326476e-08, 4.984835300092527e-08, 5.075468578752407e-08, 5.1661018574122863e-08, 5.256735136072166e-08, 5.3473687700034134e-08, 5.438002048663293e-08, 5.5286353273231725e-08, 5.61926896125442e-08, 5.7099022399142996e-08, 5.800535518574179e-08]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1022.0], "bins": [-5.960464477539063e-08, -5.8673322200775146e-08, -5.774199962615967e-08, -5.681067705154419e-08, -5.587935447692871e-08, -5.494803190231323e-08, -5.4016709327697754e-08, -5.3085386753082275e-08, -5.21540641784668e-08, -5.122274160385132e-08, -5.029141902923584e-08, -4.936009645462036e-08, -4.842877388000488e-08, -4.7497451305389404e-08, -4.6566128730773926e-08, -4.563480615615845e-08, -4.470348358154297e-08, -4.377216100692749e-08, -4.284083843231201e-08, -4.190951585769653e-08, -4.0978193283081055e-08, -4.0046870708465576e-08, -3.91155481338501e-08, -3.818422555923462e-08, -3.725290298461914e-08, -3.632158041000366e-08, -3.5390257835388184e-08, -3.4458935260772705e-08, -3.3527612686157227e-08, -3.259629011154175e-08, -3.166496753692627e-08, -3.073364496231079e-08, -2.9802322387695312e-08, -2.8870999813079834e-08, -2.7939677238464355e-08, -2.7008354663848877e-08, -2.60770320892334e-08, -2.514570951461792e-08, -2.421438694000244e-08, -2.3283064365386963e-08, -2.2351741790771484e-08, -2.1420419216156006e-08, -2.0489096641540527e-08, -1.955777406692505e-08, -1.862645149230957e-08, -1.7695128917694092e-08, -1.6763806343078613e-08, -1.5832483768463135e-08, -1.4901161193847656e-08, -1.3969838619232178e-08, -1.30385160446167e-08, -1.210719347000122e-08, -1.1175870895385742e-08, -1.0244548320770264e-08, -9.313225746154785e-09, -8.381903171539307e-09, -7.450580596923828e-09, -6.51925802230835e-09, -5.587935447692871e-09, -4.6566128730773926e-09, -3.725290298461914e-09, -2.7939677238464355e-09, -1.862645149230957e-09, -9.313225746154785e-10, 0.0]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 4.0, 11.0, 11.0, 18.0, 20.0, 12.0, 25.0, 25.0, 33.0, 17.0, 22.0, 27.0, 34.0, 37.0, 44.0, 38.0, 55.0, 47.0, 44.0, 33.0, 37.0, 43.0, 32.0, 45.0, 32.0, 31.0, 25.0, 19.0, 23.0, 28.0, 20.0, 19.0, 11.0, 10.0, 9.0, 9.0, 11.0, 7.0, 2.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-2.955078125, -2.86663818359375, -2.7781982421875, -2.68975830078125, -2.601318359375, -2.51287841796875, -2.4244384765625, -2.33599853515625, -2.24755859375, -2.15911865234375, -2.0706787109375, -1.98223876953125, -1.893798828125, -1.80535888671875, -1.7169189453125, -1.62847900390625, -1.5400390625, -1.45159912109375, -1.3631591796875, -1.27471923828125, -1.186279296875, -1.09783935546875, -1.0093994140625, -0.92095947265625, -0.83251953125, -0.74407958984375, -0.6556396484375, -0.56719970703125, -0.478759765625, -0.39031982421875, -0.3018798828125, -0.21343994140625, -0.125, -0.03656005859375, 0.0518798828125, 0.14031982421875, 0.228759765625, 0.31719970703125, 0.4056396484375, 0.49407958984375, 0.58251953125, 0.67095947265625, 0.7593994140625, 0.84783935546875, 0.936279296875, 1.02471923828125, 1.1131591796875, 1.20159912109375, 1.2900390625, 1.37847900390625, 1.4669189453125, 1.55535888671875, 1.643798828125, 1.73223876953125, 1.8206787109375, 1.90911865234375, 1.99755859375, 2.08599853515625, 2.1744384765625, 2.26287841796875, 2.351318359375, 2.43975830078125, 2.5281982421875, 2.61663818359375, 2.705078125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 6.0, 8.0, 4.0, 8.0, 11.0, 15.0, 24.0, 27.0, 38.0, 75.0, 112.0, 165.0, 286.0, 486.0, 757.0, 1297.0, 2229.0, 3887.0, 6853.0, 11985.0, 21515.0, 40704.0, 85746.0, 237032.0, 395872.0, 122653.0, 53959.0, 27429.0, 15174.0, 8462.0, 4966.0, 2741.0, 1555.0, 961.0, 553.0, 334.0, 186.0, 148.0, 99.0, 57.0, 44.0, 19.0, 18.0, 26.0, 13.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.814453125, -2.7242431640625, -2.634033203125, -2.5438232421875, -2.45361328125, -2.3634033203125, -2.273193359375, -2.1829833984375, -2.0927734375, -2.0025634765625, -1.912353515625, -1.8221435546875, -1.73193359375, -1.6417236328125, -1.551513671875, -1.4613037109375, -1.37109375, -1.2808837890625, -1.190673828125, -1.1004638671875, -1.01025390625, -0.9200439453125, -0.829833984375, -0.7396240234375, -0.6494140625, -0.5592041015625, -0.468994140625, -0.3787841796875, -0.28857421875, -0.1983642578125, -0.108154296875, -0.0179443359375, 0.072265625, 0.1624755859375, 0.252685546875, 0.3428955078125, 0.43310546875, 0.5233154296875, 0.613525390625, 0.7037353515625, 0.7939453125, 0.8841552734375, 0.974365234375, 1.0645751953125, 1.15478515625, 1.2449951171875, 1.335205078125, 1.4254150390625, 1.515625, 1.6058349609375, 1.696044921875, 1.7862548828125, 1.87646484375, 1.9666748046875, 2.056884765625, 2.1470947265625, 2.2373046875, 2.3275146484375, 2.417724609375, 2.5079345703125, 2.59814453125, 2.6883544921875, 2.778564453125, 2.8687744140625, 2.958984375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 9.0, 3.0, 7.0, 10.0, 14.0, 8.0, 10.0, 17.0, 16.0, 17.0, 38.0, 17.0, 31.0, 53.0, 46.0, 52.0, 64.0, 89.0, 214.0, 1598.0, 209.0, 85.0, 59.0, 49.0, 50.0, 51.0, 39.0, 36.0, 19.0, 31.0, 21.0, 14.0, 11.0, 23.0, 8.0, 13.0, 8.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1796875, -8.8885498046875, -8.597412109375, -8.3062744140625, -8.01513671875, -7.7239990234375, -7.432861328125, -7.1417236328125, -6.8505859375, -6.5594482421875, -6.268310546875, -5.9771728515625, -5.68603515625, -5.3948974609375, -5.103759765625, -4.8126220703125, -4.521484375, -4.2303466796875, -3.939208984375, -3.6480712890625, -3.35693359375, -3.0657958984375, -2.774658203125, -2.4835205078125, -2.1923828125, -1.9012451171875, -1.610107421875, -1.3189697265625, -1.02783203125, -0.7366943359375, -0.445556640625, -0.1544189453125, 0.13671875, 0.4278564453125, 0.718994140625, 1.0101318359375, 1.30126953125, 1.5924072265625, 1.883544921875, 2.1746826171875, 2.4658203125, 2.7569580078125, 3.048095703125, 3.3392333984375, 3.63037109375, 3.9215087890625, 4.212646484375, 4.5037841796875, 4.794921875, 5.0860595703125, 5.377197265625, 5.6683349609375, 5.95947265625, 6.2506103515625, 6.541748046875, 6.8328857421875, 7.1240234375, 7.4151611328125, 7.706298828125, 7.9974365234375, 8.28857421875, 8.5797119140625, 8.870849609375, 9.1619873046875, 9.453125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 6.0, 7.0, 6.0, 10.0, 13.0, 17.0, 25.0, 22.0, 30.0, 50.0, 61.0, 63.0, 99.0, 146.0, 182.0, 272.0, 452.0, 1532.0, 15282.0, 960764.0, 2142126.0, 21138.0, 1901.0, 463.0, 281.0, 195.0, 129.0, 98.0, 66.0, 58.0, 40.0, 34.0, 24.0, 20.0, 15.0, 19.0, 15.0, 8.0, 6.0, 7.0, 8.0, 3.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.78125, -16.2735595703125, -15.765869140625, -15.2581787109375, -14.75048828125, -14.2427978515625, -13.735107421875, -13.2274169921875, -12.7197265625, -12.2120361328125, -11.704345703125, -11.1966552734375, -10.68896484375, -10.1812744140625, -9.673583984375, -9.1658935546875, -8.658203125, -8.1505126953125, -7.642822265625, -7.1351318359375, -6.62744140625, -6.1197509765625, -5.612060546875, -5.1043701171875, -4.5966796875, -4.0889892578125, -3.581298828125, -3.0736083984375, -2.56591796875, -2.0582275390625, -1.550537109375, -1.0428466796875, -0.53515625, -0.0274658203125, 0.480224609375, 0.9879150390625, 1.49560546875, 2.0032958984375, 2.510986328125, 3.0186767578125, 3.5263671875, 4.0340576171875, 4.541748046875, 5.0494384765625, 5.55712890625, 6.0648193359375, 6.572509765625, 7.0802001953125, 7.587890625, 8.0955810546875, 8.603271484375, 9.1109619140625, 9.61865234375, 10.1263427734375, 10.634033203125, 11.1417236328125, 11.6494140625, 12.1571044921875, 12.664794921875, 13.1724853515625, 13.68017578125, 14.1878662109375, 14.695556640625, 15.2032470703125, 15.7109375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 60.0, 284.0, 454.0, 193.0, 17.0, 2.0, 1.0], "bins": [-98.02595520019531, -96.37340545654297, -94.7208480834961, -93.06829833984375, -91.4157485961914, -89.76319885253906, -88.11064147949219, -86.45809173583984, -84.8055419921875, -83.15299224853516, -81.50043487548828, -79.84788513183594, -78.1953353881836, -76.54278564453125, -74.89022827148438, -73.23767852783203, -71.58512115478516, -69.93257141113281, -68.28001403808594, -66.6274642944336, -64.97491455078125, -63.32236099243164, -61.66980743408203, -60.01725769042969, -58.36470413208008, -56.71215057373047, -55.059600830078125, -53.407047271728516, -51.754493713378906, -50.10194396972656, -48.44939041137695, -46.796836853027344, -45.144290924072266, -43.491737365722656, -41.83918762207031, -40.1866340637207, -38.534080505371094, -36.88153076171875, -35.22897720336914, -33.57642364501953, -31.923873901367188, -30.27132225036621, -28.618770599365234, -26.966217041015625, -25.31366539001465, -23.661113739013672, -22.008560180664062, -20.356008529663086, -18.70345687866211, -17.050905227661133, -15.39835262298584, -13.745800018310547, -12.09324836730957, -10.440696716308594, -8.7881441116333, -7.135591506958008, -5.483038902282715, -3.83048677444458, -2.1779346466064453, -0.5253825187683105, 1.1271696090698242, 2.779721260070801, 4.432273864746094, 6.084826469421387, 7.737378120422363]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 8.0, 4.0, 8.0, 10.0, 6.0, 9.0, 16.0, 17.0, 17.0, 18.0, 27.0, 19.0, 32.0, 40.0, 31.0, 40.0, 31.0, 37.0, 43.0, 49.0, 44.0, 51.0, 38.0, 39.0, 41.0, 46.0, 33.0, 32.0, 34.0, 31.0, 25.0, 27.0, 18.0, 18.0, 13.0, 12.0, 7.0, 8.0, 7.0, 8.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.095500946044922, -20.347705841064453, -19.59990882873535, -18.85211181640625, -18.10431671142578, -17.356521606445312, -16.60872459411621, -15.860928535461426, -15.11313247680664, -14.365336418151855, -13.61754035949707, -12.869744300842285, -12.1219482421875, -11.374152183532715, -10.62635612487793, -9.878560066223145, -9.13076400756836, -8.382967948913574, -7.635171890258789, -6.887375831604004, -6.139579772949219, -5.391783714294434, -4.643987655639648, -3.8961915969848633, -3.148395538330078, -2.400599479675293, -1.6528034210205078, -0.9050073623657227, -0.1572113037109375, 0.5905847549438477, 1.3383808135986328, 2.086176872253418, 2.833972930908203, 3.5817689895629883, 4.329565048217773, 5.077361106872559, 5.825157165527344, 6.572953224182129, 7.320749282836914, 8.0685453414917, 8.816341400146484, 9.56413745880127, 10.311933517456055, 11.05972957611084, 11.807525634765625, 12.55532169342041, 13.303117752075195, 14.05091381072998, 14.798709869384766, 15.54650592803955, 16.294301986694336, 17.042098999023438, 17.789894104003906, 18.537689208984375, 19.285486221313477, 20.033283233642578, 20.781078338623047, 21.528873443603516, 22.276670455932617, 23.02446746826172, 23.772262573242188, 24.520057678222656, 25.267854690551758, 26.01565170288086, 26.763446807861328]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 8.0, 14.0, 18.0, 18.0, 16.0, 23.0, 19.0, 25.0, 27.0, 28.0, 40.0, 41.0, 40.0, 45.0, 36.0, 50.0, 40.0, 48.0, 41.0, 41.0, 38.0, 37.0, 36.0, 39.0, 28.0, 26.0, 26.0, 30.0, 17.0, 19.0, 20.0, 10.0, 6.0, 8.0, 8.0, 12.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.19140625, -3.09185791015625, -2.9923095703125, -2.89276123046875, -2.793212890625, -2.69366455078125, -2.5941162109375, -2.49456787109375, -2.39501953125, -2.29547119140625, -2.1959228515625, -2.09637451171875, -1.996826171875, -1.89727783203125, -1.7977294921875, -1.69818115234375, -1.5986328125, -1.49908447265625, -1.3995361328125, -1.29998779296875, -1.200439453125, -1.10089111328125, -1.0013427734375, -0.90179443359375, -0.80224609375, -0.70269775390625, -0.6031494140625, -0.50360107421875, -0.404052734375, -0.30450439453125, -0.2049560546875, -0.10540771484375, -0.005859375, 0.09368896484375, 0.1932373046875, 0.29278564453125, 0.392333984375, 0.49188232421875, 0.5914306640625, 0.69097900390625, 0.79052734375, 0.89007568359375, 0.9896240234375, 1.08917236328125, 1.188720703125, 1.28826904296875, 1.3878173828125, 1.48736572265625, 1.5869140625, 1.68646240234375, 1.7860107421875, 1.88555908203125, 1.985107421875, 2.08465576171875, 2.1842041015625, 2.28375244140625, 2.38330078125, 2.48284912109375, 2.5823974609375, 2.68194580078125, 2.781494140625, 2.88104248046875, 2.9805908203125, 3.08013916015625, 3.1796875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 4.0, 7.0, 8.0, 9.0, 10.0, 15.0, 15.0, 15.0, 22.0, 29.0, 41.0, 75.0, 105.0, 281.0, 868.0, 3163.0, 16501.0, 131020.0, 1822234.0, 2046196.0, 149737.0, 18582.0, 3672.0, 960.0, 299.0, 129.0, 66.0, 53.0, 34.0, 20.0, 27.0, 19.0, 12.0, 8.0, 11.0, 10.0, 7.0, 7.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.25, -8.961181640625, -8.67236328125, -8.383544921875, -8.0947265625, -7.805908203125, -7.51708984375, -7.228271484375, -6.939453125, -6.650634765625, -6.36181640625, -6.072998046875, -5.7841796875, -5.495361328125, -5.20654296875, -4.917724609375, -4.62890625, -4.340087890625, -4.05126953125, -3.762451171875, -3.4736328125, -3.184814453125, -2.89599609375, -2.607177734375, -2.318359375, -2.029541015625, -1.74072265625, -1.451904296875, -1.1630859375, -0.874267578125, -0.58544921875, -0.296630859375, -0.0078125, 0.281005859375, 0.56982421875, 0.858642578125, 1.1474609375, 1.436279296875, 1.72509765625, 2.013916015625, 2.302734375, 2.591552734375, 2.88037109375, 3.169189453125, 3.4580078125, 3.746826171875, 4.03564453125, 4.324462890625, 4.61328125, 4.902099609375, 5.19091796875, 5.479736328125, 5.7685546875, 6.057373046875, 6.34619140625, 6.635009765625, 6.923828125, 7.212646484375, 7.50146484375, 7.790283203125, 8.0791015625, 8.367919921875, 8.65673828125, 8.945556640625, 9.234375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 8.0, 13.0, 17.0, 6.0, 17.0, 34.0, 27.0, 48.0, 48.0, 67.0, 73.0, 84.0, 150.0, 177.0, 231.0, 278.0, 348.0, 416.0, 361.0, 354.0, 308.0, 225.0, 171.0, 128.0, 83.0, 86.0, 73.0, 49.0, 37.0, 43.0, 20.0, 22.0, 16.0, 14.0, 14.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-4.3125, -4.169189453125, -4.02587890625, -3.882568359375, -3.7392578125, -3.595947265625, -3.45263671875, -3.309326171875, -3.166015625, -3.022705078125, -2.87939453125, -2.736083984375, -2.5927734375, -2.449462890625, -2.30615234375, -2.162841796875, -2.01953125, -1.876220703125, -1.73291015625, -1.589599609375, -1.4462890625, -1.302978515625, -1.15966796875, -1.016357421875, -0.873046875, -0.729736328125, -0.58642578125, -0.443115234375, -0.2998046875, -0.156494140625, -0.01318359375, 0.130126953125, 0.2734375, 0.416748046875, 0.56005859375, 0.703369140625, 0.8466796875, 0.989990234375, 1.13330078125, 1.276611328125, 1.419921875, 1.563232421875, 1.70654296875, 1.849853515625, 1.9931640625, 2.136474609375, 2.27978515625, 2.423095703125, 2.56640625, 2.709716796875, 2.85302734375, 2.996337890625, 3.1396484375, 3.282958984375, 3.42626953125, 3.569580078125, 3.712890625, 3.856201171875, 3.99951171875, 4.142822265625, 4.2861328125, 4.429443359375, 4.57275390625, 4.716064453125, 4.859375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 6.0, 16.0, 13.0, 18.0, 21.0, 25.0, 26.0, 51.0, 63.0, 82.0, 111.0, 125.0, 189.0, 252.0, 345.0, 1056.0, 24246.0, 3364574.0, 794177.0, 6955.0, 627.0, 329.0, 241.0, 196.0, 138.0, 81.0, 75.0, 65.0, 43.0, 38.0, 23.0, 19.0, 8.0, 9.0, 15.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.109375, -27.27880859375, -26.4482421875, -25.61767578125, -24.787109375, -23.95654296875, -23.1259765625, -22.29541015625, -21.46484375, -20.63427734375, -19.8037109375, -18.97314453125, -18.142578125, -17.31201171875, -16.4814453125, -15.65087890625, -14.8203125, -13.98974609375, -13.1591796875, -12.32861328125, -11.498046875, -10.66748046875, -9.8369140625, -9.00634765625, -8.17578125, -7.34521484375, -6.5146484375, -5.68408203125, -4.853515625, -4.02294921875, -3.1923828125, -2.36181640625, -1.53125, -0.70068359375, 0.1298828125, 0.96044921875, 1.791015625, 2.62158203125, 3.4521484375, 4.28271484375, 5.11328125, 5.94384765625, 6.7744140625, 7.60498046875, 8.435546875, 9.26611328125, 10.0966796875, 10.92724609375, 11.7578125, 12.58837890625, 13.4189453125, 14.24951171875, 15.080078125, 15.91064453125, 16.7412109375, 17.57177734375, 18.40234375, 19.23291015625, 20.0634765625, 20.89404296875, 21.724609375, 22.55517578125, 23.3857421875, 24.21630859375, 25.046875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 15.0, 16.0, 23.0, 34.0, 45.0, 66.0, 102.0, 103.0, 103.0, 103.0, 96.0, 93.0, 71.0, 52.0, 29.0, 23.0, 10.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.040903091430664, -24.22721290588379, -23.413524627685547, -22.599834442138672, -21.786144256591797, -20.972455978393555, -20.15876579284668, -19.345077514648438, -18.531387329101562, -17.717697143554688, -16.904008865356445, -16.09031867980957, -15.276629447937012, -14.462940216064453, -13.649250030517578, -12.83556079864502, -12.021871566772461, -11.208182334899902, -10.394493103027344, -9.580802917480469, -8.76711368560791, -7.953424453735352, -7.139734745025635, -6.326045036315918, -5.512355804443359, -4.698666572570801, -3.884976863861084, -3.0712873935699463, -2.2575979232788086, -1.44390869140625, -0.6302189826965332, 0.1834707260131836, 0.997161865234375, 1.8108513355255127, 2.6245408058166504, 3.438230276107788, 4.251919746398926, 5.065608978271484, 5.879298686981201, 6.692988395690918, 7.506677627563477, 8.320366859436035, 9.134056091308594, 9.947746276855469, 10.761435508728027, 11.575124740600586, 12.388814926147461, 13.20250415802002, 14.016193389892578, 14.829882621765137, 15.643571853637695, 16.45726203918457, 17.270950317382812, 18.084640502929688, 18.898330688476562, 19.712020874023438, 20.52570915222168, 21.339399337768555, 22.153087615966797, 22.966777801513672, 23.780467987060547, 24.59415626525879, 25.407846450805664, 26.221534729003906, 27.03522491455078]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 9.0, 3.0, 8.0, 9.0, 9.0, 12.0, 20.0, 18.0, 23.0, 27.0, 34.0, 35.0, 35.0, 43.0, 43.0, 45.0, 38.0, 46.0, 30.0, 46.0, 47.0, 46.0, 40.0, 35.0, 42.0, 39.0, 33.0, 29.0, 23.0, 26.0, 25.0, 17.0, 16.0, 16.0, 8.0, 9.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.3619384765625, -21.730127334594727, -21.098318099975586, -20.466506958007812, -19.834697723388672, -19.2028865814209, -18.571075439453125, -17.939266204833984, -17.30745506286621, -16.675643920898438, -16.043834686279297, -15.412023544311523, -14.780213356018066, -14.14840316772461, -13.516592025756836, -12.884781837463379, -12.252971649169922, -11.621161460876465, -10.989351272583008, -10.357540130615234, -9.725729942321777, -9.09391975402832, -8.462108612060547, -7.83029842376709, -7.198488235473633, -6.566678047180176, -5.9348673820495605, -5.303056716918945, -4.671246528625488, -4.039436340332031, -3.407625675201416, -2.775815010070801, -2.1440048217773438, -1.5121943950653076, -0.8803839683532715, -0.24857354164123535, 0.3832368850708008, 1.015047311782837, 1.646857738494873, 2.2786684036254883, 2.9104785919189453, 3.5422890186309814, 4.174099445343018, 4.805910110473633, 5.43772029876709, 6.069530487060547, 6.701341152191162, 7.333151817321777, 7.964962005615234, 8.596772193908691, 9.228582382202148, 9.860393524169922, 10.492203712463379, 11.124013900756836, 11.75582504272461, 12.387635231018066, 13.019445419311523, 13.65125560760498, 14.283065795898438, 14.914876937866211, 15.546687126159668, 16.178497314453125, 16.8103084564209, 17.442119598388672, 18.073928833007812]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 7.0, 11.0, 7.0, 16.0, 25.0, 35.0, 22.0, 41.0, 31.0, 30.0, 41.0, 38.0, 38.0, 47.0, 58.0, 54.0, 55.0, 53.0, 46.0, 40.0, 43.0, 40.0, 36.0, 32.0, 19.0, 31.0, 26.0, 20.0, 9.0, 8.0, 10.0, 8.0, 6.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03515625, -3.919189453125, -3.80322265625, -3.687255859375, -3.5712890625, -3.455322265625, -3.33935546875, -3.223388671875, -3.107421875, -2.991455078125, -2.87548828125, -2.759521484375, -2.6435546875, -2.527587890625, -2.41162109375, -2.295654296875, -2.1796875, -2.063720703125, -1.94775390625, -1.831787109375, -1.7158203125, -1.599853515625, -1.48388671875, -1.367919921875, -1.251953125, -1.135986328125, -1.02001953125, -0.904052734375, -0.7880859375, -0.672119140625, -0.55615234375, -0.440185546875, -0.32421875, -0.208251953125, -0.09228515625, 0.023681640625, 0.1396484375, 0.255615234375, 0.37158203125, 0.487548828125, 0.603515625, 0.719482421875, 0.83544921875, 0.951416015625, 1.0673828125, 1.183349609375, 1.29931640625, 1.415283203125, 1.53125, 1.647216796875, 1.76318359375, 1.879150390625, 1.9951171875, 2.111083984375, 2.22705078125, 2.343017578125, 2.458984375, 2.574951171875, 2.69091796875, 2.806884765625, 2.9228515625, 3.038818359375, 3.15478515625, 3.270751953125, 3.38671875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 4.0, 16.0, 15.0, 22.0, 34.0, 60.0, 82.0, 145.0, 216.0, 321.0, 610.0, 960.0, 1604.0, 2674.0, 4767.0, 8167.0, 14516.0, 25665.0, 47695.0, 94517.0, 229987.0, 352576.0, 126914.0, 61727.0, 32694.0, 18127.0, 10178.0, 6031.0, 3317.0, 1916.0, 1157.0, 715.0, 395.0, 235.0, 187.0, 93.0, 81.0, 41.0, 27.0, 22.0, 14.0, 14.0, 7.0, 4.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0242767333984375, -0.02358698844909668, -0.02289724349975586, -0.02220749855041504, -0.02151775360107422, -0.0208280086517334, -0.020138263702392578, -0.019448518753051758, -0.018758773803710938, -0.018069028854370117, -0.017379283905029297, -0.016689538955688477, -0.015999794006347656, -0.015310049057006836, -0.014620304107666016, -0.013930559158325195, -0.013240814208984375, -0.012551069259643555, -0.011861324310302734, -0.011171579360961914, -0.010481834411621094, -0.009792089462280273, -0.009102344512939453, -0.008412599563598633, -0.0077228546142578125, -0.007033109664916992, -0.006343364715576172, -0.0056536197662353516, -0.004963874816894531, -0.004274129867553711, -0.0035843849182128906, -0.0028946399688720703, -0.00220489501953125, -0.0015151500701904297, -0.0008254051208496094, -0.00013566017150878906, 0.0005540847778320312, 0.0012438297271728516, 0.0019335746765136719, 0.002623319625854492, 0.0033130645751953125, 0.004002809524536133, 0.004692554473876953, 0.0053822994232177734, 0.006072044372558594, 0.006761789321899414, 0.007451534271240234, 0.008141279220581055, 0.008831024169921875, 0.009520769119262695, 0.010210514068603516, 0.010900259017944336, 0.011590003967285156, 0.012279748916625977, 0.012969493865966797, 0.013659238815307617, 0.014348983764648438, 0.015038728713989258, 0.015728473663330078, 0.0164182186126709, 0.01710796356201172, 0.01779770851135254, 0.01848745346069336, 0.01917719841003418, 0.019866943359375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 4.0, 3.0, 3.0, 8.0, 8.0, 16.0, 16.0, 12.0, 19.0, 27.0, 24.0, 27.0, 21.0, 32.0, 39.0, 36.0, 29.0, 34.0, 27.0, 30.0, 46.0, 1061.0, 42.0, 42.0, 32.0, 37.0, 28.0, 39.0, 38.0, 27.0, 33.0, 31.0, 23.0, 26.0, 17.0, 13.0, 13.0, 12.0, 12.0, 6.0, 11.0, 4.0, 6.0, 7.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8779296875, -1.8183441162109375, -1.758758544921875, -1.6991729736328125, -1.63958740234375, -1.5800018310546875, -1.520416259765625, -1.4608306884765625, -1.4012451171875, -1.3416595458984375, -1.282073974609375, -1.2224884033203125, -1.16290283203125, -1.1033172607421875, -1.043731689453125, -0.9841461181640625, -0.924560546875, -0.8649749755859375, -0.805389404296875, -0.7458038330078125, -0.68621826171875, -0.6266326904296875, -0.567047119140625, -0.5074615478515625, -0.4478759765625, -0.3882904052734375, -0.328704833984375, -0.2691192626953125, -0.20953369140625, -0.1499481201171875, -0.090362548828125, -0.0307769775390625, 0.02880859375, 0.0883941650390625, 0.147979736328125, 0.2075653076171875, 0.26715087890625, 0.3267364501953125, 0.386322021484375, 0.4459075927734375, 0.5054931640625, 0.5650787353515625, 0.624664306640625, 0.6842498779296875, 0.74383544921875, 0.8034210205078125, 0.863006591796875, 0.9225921630859375, 0.982177734375, 1.0417633056640625, 1.101348876953125, 1.1609344482421875, 1.22052001953125, 1.2801055908203125, 1.339691162109375, 1.3992767333984375, 1.4588623046875, 1.5184478759765625, 1.578033447265625, 1.6376190185546875, 1.69720458984375, 1.7567901611328125, 1.816375732421875, 1.8759613037109375, 1.935546875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 4.0, 14.0, 29.0, 35.0, 46.0, 48.0, 95.0, 168.0, 247.0, 358.0, 506.0, 797.0, 1264.0, 1928.0, 2914.0, 4449.0, 7161.0, 11035.0, 17574.0, 28485.0, 46274.0, 77277.0, 142260.0, 1338332.0, 182168.0, 91030.0, 53894.0, 32694.0, 20331.0, 12802.0, 8132.0, 5059.0, 3361.0, 2196.0, 1377.0, 918.0, 610.0, 451.0, 276.0, 185.0, 119.0, 89.0, 43.0, 30.0, 23.0, 19.0, 9.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0118408203125, -0.011478185653686523, -0.011115550994873047, -0.01075291633605957, -0.010390281677246094, -0.010027647018432617, -0.00966501235961914, -0.009302377700805664, -0.008939743041992188, -0.008577108383178711, -0.008214473724365234, -0.007851839065551758, -0.007489204406738281, -0.007126569747924805, -0.006763935089111328, -0.0064013004302978516, -0.006038665771484375, -0.0056760311126708984, -0.005313396453857422, -0.004950761795043945, -0.004588127136230469, -0.004225492477416992, -0.0038628578186035156, -0.003500223159790039, -0.0031375885009765625, -0.002774953842163086, -0.0024123191833496094, -0.002049684524536133, -0.0016870498657226562, -0.0013244152069091797, -0.0009617805480957031, -0.0005991458892822266, -0.00023651123046875, 0.00012612342834472656, 0.0004887580871582031, 0.0008513927459716797, 0.0012140274047851562, 0.0015766620635986328, 0.0019392967224121094, 0.002301931381225586, 0.0026645660400390625, 0.003027200698852539, 0.0033898353576660156, 0.003752470016479492, 0.004115104675292969, 0.004477739334106445, 0.004840373992919922, 0.0052030086517333984, 0.005565643310546875, 0.0059282779693603516, 0.006290912628173828, 0.006653547286987305, 0.007016181945800781, 0.007378816604614258, 0.007741451263427734, 0.008104085922241211, 0.008466720581054688, 0.008829355239868164, 0.00919198989868164, 0.009554624557495117, 0.009917259216308594, 0.01027989387512207, 0.010642528533935547, 0.011005163192749023, 0.0113677978515625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 839.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-07, -1.7229467630386353e-07, -1.6577541828155518e-07, -1.5925616025924683e-07, -1.5273690223693848e-07, -1.4621764421463013e-07, -1.3969838619232178e-07, -1.3317912817001343e-07, -1.2665987014770508e-07, -1.2014061212539673e-07, -1.1362135410308838e-07, -1.0710209608078003e-07, -1.0058283805847168e-07, -9.406358003616333e-08, -8.754432201385498e-08, -8.102506399154663e-08, -7.450580596923828e-08, -6.798654794692993e-08, -6.146728992462158e-08, -5.494803190231323e-08, -4.842877388000488e-08, -4.190951585769653e-08, -3.5390257835388184e-08, -2.8870999813079834e-08, -2.2351741790771484e-08, -1.5832483768463135e-08, -9.313225746154785e-09, -2.7939677238464355e-09, 3.725290298461914e-09, 1.0244548320770264e-08, 1.6763806343078613e-08, 2.3283064365386963e-08, 2.9802322387695312e-08, 3.632158041000366e-08, 4.284083843231201e-08, 4.936009645462036e-08, 5.587935447692871e-08, 6.239861249923706e-08, 6.891787052154541e-08, 7.543712854385376e-08, 8.195638656616211e-08, 8.847564458847046e-08, 9.499490261077881e-08, 1.0151416063308716e-07, 1.0803341865539551e-07, 1.1455267667770386e-07, 1.210719347000122e-07, 1.2759119272232056e-07, 1.341104507446289e-07, 1.4062970876693726e-07, 1.471489667892456e-07, 1.5366822481155396e-07, 1.601874828338623e-07, 1.6670674085617065e-07, 1.73225998878479e-07, 1.7974525690078735e-07, 1.862645149230957e-07, 1.9278377294540405e-07, 1.993030309677124e-07, 2.0582228899002075e-07, 2.123415470123291e-07, 2.1886080503463745e-07, 2.253800630569458e-07, 2.3189932107925415e-07, 2.384185791015625e-07]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 14.0, 25.0, 30.0, 22.0, 1.0, 2.0, 11.0, 85.0, 116.0, 558.0, 46634.0, 1000180.0, 573.0, 112.0, 52.0, 50.0, 3.0, 0.0, 21.0, 19.0, 34.0, 17.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-06, -4.636123776435852e-06, -4.503875970840454e-06, -4.371628165245056e-06, -4.239380359649658e-06, -4.10713255405426e-06, -3.974884748458862e-06, -3.842636942863464e-06, -3.7103891372680664e-06, -3.5781413316726685e-06, -3.4458935260772705e-06, -3.3136457204818726e-06, -3.1813979148864746e-06, -3.0491501092910767e-06, -2.9169023036956787e-06, -2.7846544981002808e-06, -2.652406692504883e-06, -2.520158886909485e-06, -2.387911081314087e-06, -2.255663275718689e-06, -2.123415470123291e-06, -1.991167664527893e-06, -1.8589198589324951e-06, -1.7266720533370972e-06, -1.5944242477416992e-06, -1.4621764421463013e-06, -1.3299286365509033e-06, -1.1976808309555054e-06, -1.0654330253601074e-06, -9.331852197647095e-07, -8.009374141693115e-07, -6.686896085739136e-07, -5.364418029785156e-07, -4.041939973831177e-07, -2.7194619178771973e-07, -1.3969838619232178e-07, -7.450580596923828e-09, 1.2479722499847412e-07, 2.5704503059387207e-07, 3.8929283618927e-07, 5.21540641784668e-07, 6.537884473800659e-07, 7.860362529754639e-07, 9.182840585708618e-07, 1.0505318641662598e-06, 1.1827796697616577e-06, 1.3150274753570557e-06, 1.4472752809524536e-06, 1.5795230865478516e-06, 1.7117708921432495e-06, 1.8440186977386475e-06, 1.9762665033340454e-06, 2.1085143089294434e-06, 2.2407621145248413e-06, 2.3730099201202393e-06, 2.505257725715637e-06, 2.637505531311035e-06, 2.769753336906433e-06, 2.902001142501831e-06, 3.034248948097229e-06, 3.166496753692627e-06, 3.298744559288025e-06, 3.430992364883423e-06, 3.563240170478821e-06, 3.6954879760742188e-06]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1023.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 2.3011285932295067e-10, 4.6022571864590134e-10, 6.903385640910642e-10, 9.204514372918027e-10, 1.1505643104925412e-09, 1.3806771281821284e-09, 1.6107900568940181e-09, 1.8409028745836054e-09, 2.071015803295495e-09, 2.3011286209850823e-09, 2.5312414386746696e-09, 2.761354256364257e-09, 2.991467074053844e-09, 3.2215798917434313e-09, 3.4516929314776235e-09, 3.6818057491672107e-09, 3.911918788901403e-09, 4.14203160659099e-09, 4.372144424280577e-09, 4.602257241970165e-09, 4.832370059659752e-09, 5.062482877349339e-09, 5.292595695038926e-09, 5.522708512728514e-09, 5.752821330418101e-09, 5.982934148107688e-09, 6.213046965797275e-09, 6.4431597834868626e-09, 6.67327260117645e-09, 6.903385418866037e-09, 7.133498680644834e-09, 7.363611498334421e-09, 7.593724760113219e-09, 7.823837577802806e-09, 8.053950395492393e-09, 8.28406321318198e-09, 8.514176030871567e-09, 8.744288848561155e-09, 8.974401666250742e-09, 9.20451448394033e-09, 9.434627301629916e-09, 9.664740119319504e-09, 9.894852937009091e-09, 1.0124965754698678e-08, 1.0355078572388265e-08, 1.0585191390077853e-08, 1.081530420776744e-08, 1.1045417025457027e-08, 1.1275529843146614e-08, 1.1505642660836202e-08, 1.1735755478525789e-08, 1.1965868296215376e-08, 1.2195981113904963e-08, 1.242609393159455e-08, 1.2656206749284138e-08, 1.2886320455152145e-08, 1.3116433272841732e-08, 1.334654609053132e-08, 1.3576658908220907e-08, 1.3806771725910494e-08, 1.4036884543600081e-08, 1.4266997361289668e-08, 1.4497110178979256e-08, 1.4727222996668843e-08]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1023.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 9.313225746154785e-10, 1.862645149230957e-09, 2.7939677238464355e-09, 3.725290298461914e-09, 4.6566128730773926e-09, 5.587935447692871e-09, 6.51925802230835e-09, 7.450580596923828e-09, 8.381903171539307e-09, 9.313225746154785e-09, 1.0244548320770264e-08, 1.1175870895385742e-08, 1.210719347000122e-08, 1.30385160446167e-08, 1.3969838619232178e-08, 1.4901161193847656e-08, 1.5832483768463135e-08, 1.6763806343078613e-08, 1.7695128917694092e-08, 1.862645149230957e-08, 1.955777406692505e-08, 2.0489096641540527e-08, 2.1420419216156006e-08, 2.2351741790771484e-08, 2.3283064365386963e-08, 2.421438694000244e-08, 2.514570951461792e-08, 2.60770320892334e-08, 2.7008354663848877e-08, 2.7939677238464355e-08, 2.8870999813079834e-08, 2.9802322387695312e-08, 3.073364496231079e-08, 3.166496753692627e-08, 3.259629011154175e-08, 3.3527612686157227e-08, 3.4458935260772705e-08, 3.5390257835388184e-08, 3.632158041000366e-08, 3.725290298461914e-08, 3.818422555923462e-08, 3.91155481338501e-08, 4.0046870708465576e-08, 4.0978193283081055e-08, 4.190951585769653e-08, 4.284083843231201e-08, 4.377216100692749e-08, 4.470348358154297e-08, 4.563480615615845e-08, 4.6566128730773926e-08, 4.7497451305389404e-08, 4.842877388000488e-08, 4.936009645462036e-08, 5.029141902923584e-08, 5.122274160385132e-08, 5.21540641784668e-08, 5.3085386753082275e-08, 5.4016709327697754e-08, 5.494803190231323e-08, 5.587935447692871e-08, 5.681067705154419e-08, 5.774199962615967e-08, 5.8673322200775146e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 7.0, 11.0, 7.0, 16.0, 25.0, 35.0, 22.0, 41.0, 31.0, 30.0, 41.0, 38.0, 38.0, 47.0, 58.0, 54.0, 55.0, 53.0, 46.0, 40.0, 43.0, 40.0, 36.0, 32.0, 19.0, 31.0, 26.0, 20.0, 9.0, 8.0, 10.0, 8.0, 6.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03515625, -3.919189453125, -3.80322265625, -3.687255859375, -3.5712890625, -3.455322265625, -3.33935546875, -3.223388671875, -3.107421875, -2.991455078125, -2.87548828125, -2.759521484375, -2.6435546875, -2.527587890625, -2.41162109375, -2.295654296875, -2.1796875, -2.063720703125, -1.94775390625, -1.831787109375, -1.7158203125, -1.599853515625, -1.48388671875, -1.367919921875, -1.251953125, -1.135986328125, -1.02001953125, -0.904052734375, -0.7880859375, -0.672119140625, -0.55615234375, -0.440185546875, -0.32421875, -0.208251953125, -0.09228515625, 0.023681640625, 0.1396484375, 0.255615234375, 0.37158203125, 0.487548828125, 0.603515625, 0.719482421875, 0.83544921875, 0.951416015625, 1.0673828125, 1.183349609375, 1.29931640625, 1.415283203125, 1.53125, 1.647216796875, 1.76318359375, 1.879150390625, 1.9951171875, 2.111083984375, 2.22705078125, 2.343017578125, 2.458984375, 2.574951171875, 2.69091796875, 2.806884765625, 2.9228515625, 3.038818359375, 3.15478515625, 3.270751953125, 3.38671875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 8.0, 13.0, 15.0, 14.0, 27.0, 49.0, 62.0, 85.0, 132.0, 216.0, 442.0, 1056.0, 2814.0, 7952.0, 22928.0, 100084.0, 715148.0, 152961.0, 28944.0, 9695.0, 3434.0, 1301.0, 503.0, 252.0, 135.0, 77.0, 53.0, 51.0, 28.0, 16.0, 16.0, 11.0, 9.0, 6.0, 10.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69921875, -5.53448486328125, -5.3697509765625, -5.20501708984375, -5.040283203125, -4.87554931640625, -4.7108154296875, -4.54608154296875, -4.38134765625, -4.21661376953125, -4.0518798828125, -3.88714599609375, -3.722412109375, -3.55767822265625, -3.3929443359375, -3.22821044921875, -3.0634765625, -2.89874267578125, -2.7340087890625, -2.56927490234375, -2.404541015625, -2.23980712890625, -2.0750732421875, -1.91033935546875, -1.74560546875, -1.58087158203125, -1.4161376953125, -1.25140380859375, -1.086669921875, -0.92193603515625, -0.7572021484375, -0.59246826171875, -0.427734375, -0.26300048828125, -0.0982666015625, 0.06646728515625, 0.231201171875, 0.39593505859375, 0.5606689453125, 0.72540283203125, 0.89013671875, 1.05487060546875, 1.2196044921875, 1.38433837890625, 1.549072265625, 1.71380615234375, 1.8785400390625, 2.04327392578125, 2.2080078125, 2.37274169921875, 2.5374755859375, 2.70220947265625, 2.866943359375, 3.03167724609375, 3.1964111328125, 3.36114501953125, 3.52587890625, 3.69061279296875, 3.8553466796875, 4.02008056640625, 4.184814453125, 4.34954833984375, 4.5142822265625, 4.67901611328125, 4.84375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 7.0, 6.0, 9.0, 8.0, 7.0, 5.0, 17.0, 11.0, 17.0, 10.0, 12.0, 17.0, 25.0, 28.0, 33.0, 38.0, 31.0, 33.0, 58.0, 55.0, 97.0, 221.0, 1656.0, 163.0, 75.0, 48.0, 35.0, 40.0, 35.0, 38.0, 22.0, 19.0, 31.0, 23.0, 20.0, 16.0, 20.0, 14.0, 10.0, 12.0, 11.0, 8.0, 5.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.78125, -8.4920654296875, -8.202880859375, -7.9136962890625, -7.62451171875, -7.3353271484375, -7.046142578125, -6.7569580078125, -6.4677734375, -6.1785888671875, -5.889404296875, -5.6002197265625, -5.31103515625, -5.0218505859375, -4.732666015625, -4.4434814453125, -4.154296875, -3.8651123046875, -3.575927734375, -3.2867431640625, -2.99755859375, -2.7083740234375, -2.419189453125, -2.1300048828125, -1.8408203125, -1.5516357421875, -1.262451171875, -0.9732666015625, -0.68408203125, -0.3948974609375, -0.105712890625, 0.1834716796875, 0.47265625, 0.7618408203125, 1.051025390625, 1.3402099609375, 1.62939453125, 1.9185791015625, 2.207763671875, 2.4969482421875, 2.7861328125, 3.0753173828125, 3.364501953125, 3.6536865234375, 3.94287109375, 4.2320556640625, 4.521240234375, 4.8104248046875, 5.099609375, 5.3887939453125, 5.677978515625, 5.9671630859375, 6.25634765625, 6.5455322265625, 6.834716796875, 7.1239013671875, 7.4130859375, 7.7022705078125, 7.991455078125, 8.2806396484375, 8.56982421875, 8.8590087890625, 9.148193359375, 9.4373779296875, 9.7265625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 0.0, 5.0, 4.0, 6.0, 14.0, 8.0, 15.0, 12.0, 24.0, 18.0, 23.0, 40.0, 29.0, 35.0, 49.0, 65.0, 115.0, 140.0, 255.0, 650.0, 4288.0, 703249.0, 2428852.0, 6155.0, 778.0, 262.0, 162.0, 109.0, 77.0, 51.0, 43.0, 27.0, 21.0, 14.0, 13.0, 16.0, 14.0, 14.0, 13.0, 6.0, 6.0, 12.0, 6.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-23.53125, -22.84033203125, -22.1494140625, -21.45849609375, -20.767578125, -20.07666015625, -19.3857421875, -18.69482421875, -18.00390625, -17.31298828125, -16.6220703125, -15.93115234375, -15.240234375, -14.54931640625, -13.8583984375, -13.16748046875, -12.4765625, -11.78564453125, -11.0947265625, -10.40380859375, -9.712890625, -9.02197265625, -8.3310546875, -7.64013671875, -6.94921875, -6.25830078125, -5.5673828125, -4.87646484375, -4.185546875, -3.49462890625, -2.8037109375, -2.11279296875, -1.421875, -0.73095703125, -0.0400390625, 0.65087890625, 1.341796875, 2.03271484375, 2.7236328125, 3.41455078125, 4.10546875, 4.79638671875, 5.4873046875, 6.17822265625, 6.869140625, 7.56005859375, 8.2509765625, 8.94189453125, 9.6328125, 10.32373046875, 11.0146484375, 11.70556640625, 12.396484375, 13.08740234375, 13.7783203125, 14.46923828125, 15.16015625, 15.85107421875, 16.5419921875, 17.23291015625, 17.923828125, 18.61474609375, 19.3056640625, 19.99658203125, 20.6875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 18.0, 39.0, 70.0, 96.0, 116.0, 152.0, 154.0, 139.0, 81.0, 65.0, 30.0, 23.0, 8.0, 8.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.624663352966309, -5.2265753746032715, -4.828487396240234, -4.4303998947143555, -4.032311916351318, -3.6342239379882812, -3.2361361980438232, -2.8380484580993652, -2.439960479736328, -2.041872501373291, -1.643784761428833, -1.2456969022750854, -0.8476090431213379, -0.44952118396759033, -0.05143332481384277, 0.34665441513061523, 0.7447423934936523, 1.1428302526474, 1.5409181118011475, 1.939005970954895, 2.3370938301086426, 2.7351818084716797, 3.1332695484161377, 3.5313572883605957, 3.929445266723633, 4.32753324508667, 4.725621223449707, 5.123708724975586, 5.521796703338623, 5.91988468170166, 6.317972183227539, 6.716060161590576, 7.11414909362793, 7.512237071990967, 7.910325050354004, 8.308412551879883, 8.706501007080078, 9.104588508605957, 9.502676010131836, 9.900764465332031, 10.29885196685791, 10.696939468383789, 11.095027923583984, 11.493115425109863, 11.891202926635742, 12.289291381835938, 12.687378883361816, 13.085466384887695, 13.48355484008789, 13.88164234161377, 14.279730796813965, 14.677818298339844, 15.075906753540039, 15.473994255065918, 15.872081756591797, 16.270170211791992, 16.668258666992188, 17.066347122192383, 17.464433670043945, 17.86252212524414, 18.260610580444336, 18.6586971282959, 19.056785583496094, 19.45487403869629, 19.85296058654785]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 9.0, 4.0, 9.0, 17.0, 14.0, 19.0, 17.0, 29.0, 22.0, 38.0, 29.0, 30.0, 38.0, 47.0, 49.0, 44.0, 44.0, 53.0, 44.0, 41.0, 44.0, 43.0, 46.0, 33.0, 44.0, 33.0, 25.0, 20.0, 19.0, 22.0, 15.0, 13.0, 8.0, 12.0, 5.0, 3.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.866119384765625, -33.842620849609375, -32.81912612915039, -31.79562759399414, -30.77212905883789, -29.748632431030273, -28.725135803222656, -27.701637268066406, -26.67814064025879, -25.654644012451172, -24.631145477294922, -23.607648849487305, -22.584152221679688, -21.560653686523438, -20.53715705871582, -19.513660430908203, -18.490161895751953, -17.466665267944336, -16.443166732788086, -15.419670104980469, -14.396172523498535, -13.372674942016602, -12.349178314208984, -11.32568073272705, -10.302183151245117, -9.278685569763184, -8.25518798828125, -7.231691360473633, -6.208193778991699, -5.184696197509766, -4.16119909286499, -3.137701988220215, -2.114208221435547, -1.0907108783721924, -0.06721353530883789, 0.9562838077545166, 1.979781150817871, 3.0032787322998047, 4.02677583694458, 5.0502729415893555, 6.073770523071289, 7.097268104553223, 8.120765686035156, 9.144262313842773, 10.167759895324707, 11.19125747680664, 12.214754104614258, 13.238251686096191, 14.261749267578125, 15.285246849060059, 16.308744430541992, 17.33224105834961, 18.35573959350586, 19.379236221313477, 20.402732849121094, 21.426231384277344, 22.44972801208496, 23.473224639892578, 24.496723175048828, 25.520219802856445, 26.543716430664062, 27.567214965820312, 28.59071159362793, 29.614208221435547, 30.637706756591797]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 9.0, 6.0, 5.0, 12.0, 9.0, 20.0, 32.0, 33.0, 26.0, 37.0, 34.0, 37.0, 41.0, 46.0, 40.0, 52.0, 57.0, 53.0, 48.0, 47.0, 52.0, 42.0, 30.0, 38.0, 28.0, 31.0, 30.0, 25.0, 29.0, 14.0, 8.0, 10.0, 10.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.083953857421875, -3.96087646484375, -3.837799072265625, -3.7147216796875, -3.591644287109375, -3.46856689453125, -3.345489501953125, -3.222412109375, -3.099334716796875, -2.97625732421875, -2.853179931640625, -2.7301025390625, -2.607025146484375, -2.48394775390625, -2.360870361328125, -2.23779296875, -2.114715576171875, -1.99163818359375, -1.868560791015625, -1.7454833984375, -1.622406005859375, -1.49932861328125, -1.376251220703125, -1.253173828125, -1.130096435546875, -1.00701904296875, -0.883941650390625, -0.7608642578125, -0.637786865234375, -0.51470947265625, -0.391632080078125, -0.2685546875, -0.145477294921875, -0.02239990234375, 0.100677490234375, 0.2237548828125, 0.346832275390625, 0.46990966796875, 0.592987060546875, 0.716064453125, 0.839141845703125, 0.96221923828125, 1.085296630859375, 1.2083740234375, 1.331451416015625, 1.45452880859375, 1.577606201171875, 1.70068359375, 1.823760986328125, 1.94683837890625, 2.069915771484375, 2.1929931640625, 2.316070556640625, 2.43914794921875, 2.562225341796875, 2.685302734375, 2.808380126953125, 2.93145751953125, 3.054534912109375, 3.1776123046875, 3.300689697265625, 3.42376708984375, 3.546844482421875, 3.669921875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 8.0, 22.0, 23.0, 33.0, 48.0, 75.0, 130.0, 212.0, 318.0, 485.0, 852.0, 1439.0, 2629.0, 5074.0, 10092.0, 20514.0, 44757.0, 104572.0, 266941.0, 675883.0, 1258672.0, 1037679.0, 452914.0, 175046.0, 72178.0, 31965.0, 15352.0, 7430.0, 3914.0, 2116.0, 1094.0, 678.0, 424.0, 254.0, 169.0, 97.0, 62.0, 43.0, 26.0, 22.0, 12.0, 7.0, 5.0, 8.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.625, -3.520782470703125, -3.41656494140625, -3.312347412109375, -3.2081298828125, -3.103912353515625, -2.99969482421875, -2.895477294921875, -2.791259765625, -2.687042236328125, -2.58282470703125, -2.478607177734375, -2.3743896484375, -2.270172119140625, -2.16595458984375, -2.061737060546875, -1.95751953125, -1.853302001953125, -1.74908447265625, -1.644866943359375, -1.5406494140625, -1.436431884765625, -1.33221435546875, -1.227996826171875, -1.123779296875, -1.019561767578125, -0.91534423828125, -0.811126708984375, -0.7069091796875, -0.602691650390625, -0.49847412109375, -0.394256591796875, -0.2900390625, -0.185821533203125, -0.08160400390625, 0.022613525390625, 0.1268310546875, 0.231048583984375, 0.33526611328125, 0.439483642578125, 0.543701171875, 0.647918701171875, 0.75213623046875, 0.856353759765625, 0.9605712890625, 1.064788818359375, 1.16900634765625, 1.273223876953125, 1.37744140625, 1.481658935546875, 1.58587646484375, 1.690093994140625, 1.7943115234375, 1.898529052734375, 2.00274658203125, 2.106964111328125, 2.211181640625, 2.315399169921875, 2.41961669921875, 2.523834228515625, 2.6280517578125, 2.732269287109375, 2.83648681640625, 2.940704345703125, 3.044921875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 6.0, 14.0, 15.0, 17.0, 28.0, 38.0, 38.0, 64.0, 69.0, 85.0, 102.0, 135.0, 180.0, 251.0, 272.0, 337.0, 372.0, 399.0, 318.0, 249.0, 228.0, 167.0, 132.0, 106.0, 92.0, 74.0, 50.0, 51.0, 42.0, 28.0, 13.0, 18.0, 19.0, 12.0, 4.0, 10.0, 11.0, 4.0, 5.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.77734375, -4.62762451171875, -4.4779052734375, -4.32818603515625, -4.178466796875, -4.02874755859375, -3.8790283203125, -3.72930908203125, -3.57958984375, -3.42987060546875, -3.2801513671875, -3.13043212890625, -2.980712890625, -2.83099365234375, -2.6812744140625, -2.53155517578125, -2.3818359375, -2.23211669921875, -2.0823974609375, -1.93267822265625, -1.782958984375, -1.63323974609375, -1.4835205078125, -1.33380126953125, -1.18408203125, -1.03436279296875, -0.8846435546875, -0.73492431640625, -0.585205078125, -0.43548583984375, -0.2857666015625, -0.13604736328125, 0.013671875, 0.16339111328125, 0.3131103515625, 0.46282958984375, 0.612548828125, 0.76226806640625, 0.9119873046875, 1.06170654296875, 1.21142578125, 1.36114501953125, 1.5108642578125, 1.66058349609375, 1.810302734375, 1.96002197265625, 2.1097412109375, 2.25946044921875, 2.4091796875, 2.55889892578125, 2.7086181640625, 2.85833740234375, 3.008056640625, 3.15777587890625, 3.3074951171875, 3.45721435546875, 3.60693359375, 3.75665283203125, 3.9063720703125, 4.05609130859375, 4.205810546875, 4.35552978515625, 4.5052490234375, 4.65496826171875, 4.8046875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 9.0, 5.0, 4.0, 9.0, 16.0, 6.0, 20.0, 21.0, 31.0, 29.0, 51.0, 64.0, 92.0, 98.0, 149.0, 197.0, 265.0, 379.0, 722.0, 3108.0, 76417.0, 3370893.0, 724153.0, 14518.0, 1361.0, 496.0, 325.0, 240.0, 136.0, 118.0, 103.0, 63.0, 50.0, 42.0, 28.0, 22.0, 16.0, 10.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.953125, -18.337158203125, -17.72119140625, -17.105224609375, -16.4892578125, -15.873291015625, -15.25732421875, -14.641357421875, -14.025390625, -13.409423828125, -12.79345703125, -12.177490234375, -11.5615234375, -10.945556640625, -10.32958984375, -9.713623046875, -9.09765625, -8.481689453125, -7.86572265625, -7.249755859375, -6.6337890625, -6.017822265625, -5.40185546875, -4.785888671875, -4.169921875, -3.553955078125, -2.93798828125, -2.322021484375, -1.7060546875, -1.090087890625, -0.47412109375, 0.141845703125, 0.7578125, 1.373779296875, 1.98974609375, 2.605712890625, 3.2216796875, 3.837646484375, 4.45361328125, 5.069580078125, 5.685546875, 6.301513671875, 6.91748046875, 7.533447265625, 8.1494140625, 8.765380859375, 9.38134765625, 9.997314453125, 10.61328125, 11.229248046875, 11.84521484375, 12.461181640625, 13.0771484375, 13.693115234375, 14.30908203125, 14.925048828125, 15.541015625, 16.156982421875, 16.77294921875, 17.388916015625, 18.0048828125, 18.620849609375, 19.23681640625, 19.852783203125, 20.46875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 12.0, 47.0, 166.0, 322.0, 263.0, 148.0, 38.0, 15.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.80194091796875, -109.36416625976562, -106.92639923095703, -104.4886245727539, -102.05085754394531, -99.61308288574219, -97.17530822753906, -94.73754119873047, -92.29976654052734, -89.86199188232422, -87.42422485351562, -84.9864501953125, -82.5486831665039, -80.11090850830078, -77.67314147949219, -75.23536682128906, -72.79759216308594, -70.35981750488281, -67.92205047607422, -65.4842758178711, -63.046504974365234, -60.608734130859375, -58.170963287353516, -55.733192443847656, -53.29542541503906, -50.8576545715332, -48.419883728027344, -45.98210906982422, -43.54433822631836, -41.1065673828125, -38.66879653930664, -36.23102569580078, -33.793251037597656, -31.355480194091797, -28.917707443237305, -26.479936599731445, -24.042163848876953, -21.604393005371094, -19.166622161865234, -16.728849411010742, -14.291078567504883, -11.853306770324707, -9.415534973144531, -6.977764129638672, -4.539992332458496, -2.1022205352783203, 0.33555030822753906, 2.7733230590820312, 5.211093902587891, 7.648865699768066, 10.086637496948242, 12.524408340454102, 14.962180137634277, 17.399951934814453, 19.837722778320312, 22.275495529174805, 24.713266372680664, 27.151037216186523, 29.588809967041016, 32.026580810546875, 34.464351654052734, 36.902122497558594, 39.33989715576172, 41.77766799926758, 44.21543884277344]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 1.0, 5.0, 10.0, 3.0, 9.0, 7.0, 18.0, 13.0, 14.0, 20.0, 20.0, 13.0, 23.0, 24.0, 36.0, 28.0, 34.0, 52.0, 38.0, 37.0, 38.0, 54.0, 39.0, 41.0, 38.0, 46.0, 41.0, 42.0, 36.0, 34.0, 32.0, 30.0, 21.0, 25.0, 17.0, 5.0, 12.0, 8.0, 9.0, 9.0, 8.0, 4.0, 5.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5845947265625, -18.91526222229004, -18.245929718017578, -17.576597213745117, -16.907264709472656, -16.237934112548828, -15.568601608276367, -14.899269104003906, -14.229936599731445, -13.560604095458984, -12.891271591186523, -12.221940040588379, -11.552607536315918, -10.883275032043457, -10.213943481445312, -9.544610977172852, -8.87527847290039, -8.20594596862793, -7.536613941192627, -6.867281913757324, -6.197949409484863, -5.528616905212402, -4.8592848777771, -4.189952850341797, -3.520620346069336, -2.851288080215454, -2.1819558143615723, -1.5126235485076904, -0.8432912826538086, -0.17395901679992676, 0.4953732490539551, 1.1647052764892578, 1.8340377807617188, 2.5033700466156006, 3.1727023124694824, 3.8420345783233643, 4.511366844177246, 5.180699348449707, 5.85003137588501, 6.5193634033203125, 7.188695907592773, 7.858028411865234, 8.527360916137695, 9.19669246673584, 9.8660249710083, 10.535357475280762, 11.204689025878906, 11.874021530151367, 12.543354034423828, 13.212686538696289, 13.88201904296875, 14.551350593566895, 15.220683097839355, 15.890015602111816, 16.55934715270996, 17.228679656982422, 17.898012161254883, 18.567344665527344, 19.236677169799805, 19.906009674072266, 20.575340270996094, 21.244672775268555, 21.914005279541016, 22.583337783813477, 23.252670288085938]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 11.0, 11.0, 7.0, 21.0, 12.0, 24.0, 45.0, 32.0, 25.0, 39.0, 42.0, 33.0, 35.0, 41.0, 58.0, 58.0, 55.0, 43.0, 42.0, 45.0, 45.0, 45.0, 37.0, 29.0, 28.0, 23.0, 23.0, 19.0, 19.0, 12.0, 15.0, 6.0, 8.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.08984375, -3.97320556640625, -3.8565673828125, -3.73992919921875, -3.623291015625, -3.50665283203125, -3.3900146484375, -3.27337646484375, -3.15673828125, -3.04010009765625, -2.9234619140625, -2.80682373046875, -2.690185546875, -2.57354736328125, -2.4569091796875, -2.34027099609375, -2.2236328125, -2.10699462890625, -1.9903564453125, -1.87371826171875, -1.757080078125, -1.64044189453125, -1.5238037109375, -1.40716552734375, -1.29052734375, -1.17388916015625, -1.0572509765625, -0.94061279296875, -0.823974609375, -0.70733642578125, -0.5906982421875, -0.47406005859375, -0.357421875, -0.24078369140625, -0.1241455078125, -0.00750732421875, 0.109130859375, 0.22576904296875, 0.3424072265625, 0.45904541015625, 0.57568359375, 0.69232177734375, 0.8089599609375, 0.92559814453125, 1.042236328125, 1.15887451171875, 1.2755126953125, 1.39215087890625, 1.5087890625, 1.62542724609375, 1.7420654296875, 1.85870361328125, 1.975341796875, 2.09197998046875, 2.2086181640625, 2.32525634765625, 2.44189453125, 2.55853271484375, 2.6751708984375, 2.79180908203125, 2.908447265625, 3.02508544921875, 3.1417236328125, 3.25836181640625, 3.375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 9.0, 20.0, 25.0, 32.0, 43.0, 63.0, 115.0, 155.0, 227.0, 309.0, 528.0, 805.0, 1330.0, 2078.0, 3358.0, 5349.0, 8659.0, 13979.0, 22794.0, 37245.0, 62672.0, 113493.0, 280613.0, 243714.0, 102683.0, 57764.0, 34673.0, 21025.0, 13150.0, 8210.0, 4954.0, 3078.0, 1933.0, 1244.0, 771.0, 459.0, 334.0, 213.0, 131.0, 94.0, 59.0, 47.0, 24.0, 26.0, 25.0, 14.0, 8.0, 6.0, 7.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.018951416015625, -0.01839280128479004, -0.017834186553955078, -0.017275571823120117, -0.016716957092285156, -0.016158342361450195, -0.015599727630615234, -0.015041112899780273, -0.014482498168945312, -0.013923883438110352, -0.01336526870727539, -0.01280665397644043, -0.012248039245605469, -0.011689424514770508, -0.011130809783935547, -0.010572195053100586, -0.010013580322265625, -0.009454965591430664, -0.008896350860595703, -0.008337736129760742, -0.007779121398925781, -0.00722050666809082, -0.006661891937255859, -0.0061032772064208984, -0.0055446624755859375, -0.0049860477447509766, -0.004427433013916016, -0.0038688182830810547, -0.0033102035522460938, -0.002751588821411133, -0.002192974090576172, -0.001634359359741211, -0.00107574462890625, -0.0005171298980712891, 4.1484832763671875e-05, 0.0006000995635986328, 0.0011587142944335938, 0.0017173290252685547, 0.0022759437561035156, 0.0028345584869384766, 0.0033931732177734375, 0.0039517879486083984, 0.004510402679443359, 0.00506901741027832, 0.005627632141113281, 0.006186246871948242, 0.006744861602783203, 0.007303476333618164, 0.007862091064453125, 0.008420705795288086, 0.008979320526123047, 0.009537935256958008, 0.010096549987792969, 0.01065516471862793, 0.01121377944946289, 0.011772394180297852, 0.012331008911132812, 0.012889623641967773, 0.013448238372802734, 0.014006853103637695, 0.014565467834472656, 0.015124082565307617, 0.015682697296142578, 0.01624131202697754, 0.0167999267578125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 6.0, 0.0, 6.0, 6.0, 9.0, 8.0, 14.0, 17.0, 16.0, 21.0, 28.0, 26.0, 30.0, 38.0, 37.0, 36.0, 37.0, 50.0, 45.0, 50.0, 1075.0, 38.0, 47.0, 47.0, 35.0, 37.0, 31.0, 39.0, 32.0, 22.0, 21.0, 19.0, 14.0, 22.0, 13.0, 9.0, 7.0, 10.0, 8.0, 7.0, 4.0, 3.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9892578125, -1.9214935302734375, -1.853729248046875, -1.7859649658203125, -1.71820068359375, -1.6504364013671875, -1.582672119140625, -1.5149078369140625, -1.4471435546875, -1.3793792724609375, -1.311614990234375, -1.2438507080078125, -1.17608642578125, -1.1083221435546875, -1.040557861328125, -0.9727935791015625, -0.905029296875, -0.8372650146484375, -0.769500732421875, -0.7017364501953125, -0.63397216796875, -0.5662078857421875, -0.498443603515625, -0.4306793212890625, -0.3629150390625, -0.2951507568359375, -0.227386474609375, -0.1596221923828125, -0.09185791015625, -0.0240936279296875, 0.043670654296875, 0.1114349365234375, 0.17919921875, 0.2469635009765625, 0.314727783203125, 0.3824920654296875, 0.45025634765625, 0.5180206298828125, 0.585784912109375, 0.6535491943359375, 0.7213134765625, 0.7890777587890625, 0.856842041015625, 0.9246063232421875, 0.99237060546875, 1.0601348876953125, 1.127899169921875, 1.1956634521484375, 1.263427734375, 1.3311920166015625, 1.398956298828125, 1.4667205810546875, 1.53448486328125, 1.6022491455078125, 1.670013427734375, 1.7377777099609375, 1.8055419921875, 1.8733062744140625, 1.941070556640625, 2.0088348388671875, 2.07659912109375, 2.1443634033203125, 2.212127685546875, 2.2798919677734375, 2.34765625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 11.0, 15.0, 32.0, 26.0, 50.0, 64.0, 109.0, 218.0, 326.0, 480.0, 742.0, 1237.0, 2025.0, 3129.0, 5036.0, 8290.0, 13582.0, 22869.0, 39567.0, 71621.0, 148211.0, 1388718.0, 192988.0, 84839.0, 46151.0, 26424.0, 15471.0, 9598.0, 5488.0, 3618.0, 2255.0, 1408.0, 908.0, 594.0, 367.0, 239.0, 168.0, 107.0, 44.0, 31.0, 26.0, 17.0, 15.0, 8.0, 9.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.014434814453125, -0.014005661010742188, -0.013576507568359375, -0.013147354125976562, -0.01271820068359375, -0.012289047241210938, -0.011859893798828125, -0.011430740356445312, -0.0110015869140625, -0.010572433471679688, -0.010143280029296875, -0.009714126586914062, -0.00928497314453125, -0.008855819702148438, -0.008426666259765625, -0.007997512817382812, -0.007568359375, -0.0071392059326171875, -0.006710052490234375, -0.0062808990478515625, -0.00585174560546875, -0.0054225921630859375, -0.004993438720703125, -0.0045642852783203125, -0.0041351318359375, -0.0037059783935546875, -0.003276824951171875, -0.0028476715087890625, -0.00241851806640625, -0.0019893646240234375, -0.001560211181640625, -0.0011310577392578125, -0.000701904296875, -0.0002727508544921875, 0.000156402587890625, 0.0005855560302734375, 0.00101470947265625, 0.0014438629150390625, 0.001873016357421875, 0.0023021697998046875, 0.0027313232421875, 0.0031604766845703125, 0.003589630126953125, 0.0040187835693359375, 0.00444793701171875, 0.0048770904541015625, 0.005306243896484375, 0.0057353973388671875, 0.00616455078125, 0.0065937042236328125, 0.007022857666015625, 0.0074520111083984375, 0.00788116455078125, 0.008310317993164062, 0.008739471435546875, 0.009168624877929688, 0.0095977783203125, 0.010026931762695312, 0.010456085205078125, 0.010885238647460938, 0.01131439208984375, 0.011743545532226562, 0.012172698974609375, 0.012601852416992188, 0.013031005859375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 815.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-07, -1.73225998878479e-07, -1.6763806343078613e-07, -1.6205012798309326e-07, -1.564621925354004e-07, -1.5087425708770752e-07, -1.4528632164001465e-07, -1.3969838619232178e-07, -1.341104507446289e-07, -1.2852251529693604e-07, -1.2293457984924316e-07, -1.1734664440155029e-07, -1.1175870895385742e-07, -1.0617077350616455e-07, -1.0058283805847168e-07, -9.499490261077881e-08, -8.940696716308594e-08, -8.381903171539307e-08, -7.82310962677002e-08, -7.264316082000732e-08, -6.705522537231445e-08, -6.146728992462158e-08, -5.587935447692871e-08, -5.029141902923584e-08, -4.470348358154297e-08, -3.91155481338501e-08, -3.3527612686157227e-08, -2.7939677238464355e-08, -2.2351741790771484e-08, -1.6763806343078613e-08, -1.1175870895385742e-08, -5.587935447692871e-09, 0.0, 5.587935447692871e-09, 1.1175870895385742e-08, 1.6763806343078613e-08, 2.2351741790771484e-08, 2.7939677238464355e-08, 3.3527612686157227e-08, 3.91155481338501e-08, 4.470348358154297e-08, 5.029141902923584e-08, 5.587935447692871e-08, 6.146728992462158e-08, 6.705522537231445e-08, 7.264316082000732e-08, 7.82310962677002e-08, 8.381903171539307e-08, 8.940696716308594e-08, 9.499490261077881e-08, 1.0058283805847168e-07, 1.0617077350616455e-07, 1.1175870895385742e-07, 1.1734664440155029e-07, 1.2293457984924316e-07, 1.2852251529693604e-07, 1.341104507446289e-07, 1.3969838619232178e-07, 1.4528632164001465e-07, 1.5087425708770752e-07, 1.564621925354004e-07, 1.6205012798309326e-07, 1.6763806343078613e-07, 1.73225998878479e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 13.0, 44.0, 15.0, 23.0, 10.0, 0.0, 7.0, 41.0, 67.0, 65.0, 257.0, 4954.0, 991059.0, 51461.0, 257.0, 48.0, 75.0, 41.0, 4.0, 2.0, 6.0, 21.0, 21.0, 37.0, 16.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.874301910400391e-06, -3.7513673305511475e-06, -3.6284327507019043e-06, -3.505498170852661e-06, -3.382563591003418e-06, -3.259629011154175e-06, -3.1366944313049316e-06, -3.0137598514556885e-06, -2.8908252716064453e-06, -2.767890691757202e-06, -2.644956111907959e-06, -2.522021532058716e-06, -2.3990869522094727e-06, -2.2761523723602295e-06, -2.1532177925109863e-06, -2.030283212661743e-06, -1.9073486328125e-06, -1.7844140529632568e-06, -1.6614794731140137e-06, -1.5385448932647705e-06, -1.4156103134155273e-06, -1.2926757335662842e-06, -1.169741153717041e-06, -1.0468065738677979e-06, -9.238719940185547e-07, -8.009374141693115e-07, -6.780028343200684e-07, -5.550682544708252e-07, -4.3213367462158203e-07, -3.0919909477233887e-07, -1.862645149230957e-07, -6.332993507385254e-08, 5.960464477539063e-08, 1.825392246246338e-07, 3.0547380447387695e-07, 4.284083843231201e-07, 5.513429641723633e-07, 6.742775440216064e-07, 7.972121238708496e-07, 9.201467037200928e-07, 1.043081283569336e-06, 1.166015863418579e-06, 1.2889504432678223e-06, 1.4118850231170654e-06, 1.5348196029663086e-06, 1.6577541828155518e-06, 1.780688762664795e-06, 1.903623342514038e-06, 2.0265579223632812e-06, 2.1494925022125244e-06, 2.2724270820617676e-06, 2.3953616619110107e-06, 2.518296241760254e-06, 2.641230821609497e-06, 2.7641654014587402e-06, 2.8870999813079834e-06, 3.0100345611572266e-06, 3.1329691410064697e-06, 3.255903720855713e-06, 3.378838300704956e-06, 3.5017728805541992e-06, 3.6247074604034424e-06, 3.7476420402526855e-06, 3.870576620101929e-06, 3.993511199951172e-06]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1022.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.357754773172019e-08, -5.245936307574084e-08, -5.134118197247517e-08, -5.022299731649582e-08, -4.910481266051647e-08, -4.7986628004537124e-08, -4.6868446901271454e-08, -4.5750262245292106e-08, -4.463207758931276e-08, -4.351389293333341e-08, -4.239571183006774e-08, -4.127752717408839e-08, -4.015934251810904e-08, -3.9041157862129694e-08, -3.7922976758864024e-08, -3.6804792102884676e-08, -3.5686610999619006e-08, -3.456842634363966e-08, -3.345024524037399e-08, -3.233206058439464e-08, -3.121387592841529e-08, -3.009569127243594e-08, -2.8977510169170273e-08, -2.7859325513190925e-08, -2.6741140857211576e-08, -2.5622957977589067e-08, -2.450477332160972e-08, -2.338659044198721e-08, -2.226840578600786e-08, -2.1150222906385352e-08, -2.0032040026762843e-08, -1.8913855370783494e-08, -1.7795668938447307e-08, -1.6677486058824798e-08, -1.555930140284545e-08, -1.444111852322294e-08, -1.3322933867243592e-08, -1.2204750987621082e-08, -1.1086567219820154e-08, -9.968383452019225e-09, -8.850199684218296e-09, -7.732015916417367e-09, -6.613832148616439e-09, -5.49564882490472e-09, -4.377465057103791e-09, -3.259281289302862e-09, -2.1410979655911433e-09, -1.0229141977902145e-09, 9.526957001071423e-11, 1.2134532267893405e-09, 2.331636883567967e-09, 3.4498204293242907e-09, 4.5680041971252194e-09, 5.686187964926148e-09, 6.804371288637867e-09, 7.922555056438796e-09, 9.040738824239725e-09, 1.0158922592040653e-08, 1.1277106359841582e-08, 1.2395290127642511e-08, 1.351347300726502e-08, 1.4631657663244368e-08, 1.5749840542866878e-08, 1.6868025198846226e-08, 1.7986208078468735e-08]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1022.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [0.0, 9.313225746154785e-10, 1.862645149230957e-09, 2.7939677238464355e-09, 3.725290298461914e-09, 4.6566128730773926e-09, 5.587935447692871e-09, 6.51925802230835e-09, 7.450580596923828e-09, 8.381903171539307e-09, 9.313225746154785e-09, 1.0244548320770264e-08, 1.1175870895385742e-08, 1.210719347000122e-08, 1.30385160446167e-08, 1.3969838619232178e-08, 1.4901161193847656e-08, 1.5832483768463135e-08, 1.6763806343078613e-08, 1.7695128917694092e-08, 1.862645149230957e-08, 1.955777406692505e-08, 2.0489096641540527e-08, 2.1420419216156006e-08, 2.2351741790771484e-08, 2.3283064365386963e-08, 2.421438694000244e-08, 2.514570951461792e-08, 2.60770320892334e-08, 2.7008354663848877e-08, 2.7939677238464355e-08, 2.8870999813079834e-08, 2.9802322387695312e-08, 3.073364496231079e-08, 3.166496753692627e-08, 3.259629011154175e-08, 3.3527612686157227e-08, 3.4458935260772705e-08, 3.5390257835388184e-08, 3.632158041000366e-08, 3.725290298461914e-08, 3.818422555923462e-08, 3.91155481338501e-08, 4.0046870708465576e-08, 4.0978193283081055e-08, 4.190951585769653e-08, 4.284083843231201e-08, 4.377216100692749e-08, 4.470348358154297e-08, 4.563480615615845e-08, 4.6566128730773926e-08, 4.7497451305389404e-08, 4.842877388000488e-08, 4.936009645462036e-08, 5.029141902923584e-08, 5.122274160385132e-08, 5.21540641784668e-08, 5.3085386753082275e-08, 5.4016709327697754e-08, 5.494803190231323e-08, 5.587935447692871e-08, 5.681067705154419e-08, 5.774199962615967e-08, 5.8673322200775146e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 11.0, 11.0, 7.0, 21.0, 12.0, 24.0, 45.0, 32.0, 25.0, 39.0, 42.0, 33.0, 35.0, 41.0, 58.0, 58.0, 55.0, 43.0, 42.0, 45.0, 45.0, 45.0, 37.0, 29.0, 28.0, 23.0, 23.0, 19.0, 19.0, 12.0, 15.0, 6.0, 8.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.08984375, -3.97320556640625, -3.8565673828125, -3.73992919921875, -3.623291015625, -3.50665283203125, -3.3900146484375, -3.27337646484375, -3.15673828125, -3.04010009765625, -2.9234619140625, -2.80682373046875, -2.690185546875, -2.57354736328125, -2.4569091796875, -2.34027099609375, -2.2236328125, -2.10699462890625, -1.9903564453125, -1.87371826171875, -1.757080078125, -1.64044189453125, -1.5238037109375, -1.40716552734375, -1.29052734375, -1.17388916015625, -1.0572509765625, -0.94061279296875, -0.823974609375, -0.70733642578125, -0.5906982421875, -0.47406005859375, -0.357421875, -0.24078369140625, -0.1241455078125, -0.00750732421875, 0.109130859375, 0.22576904296875, 0.3424072265625, 0.45904541015625, 0.57568359375, 0.69232177734375, 0.8089599609375, 0.92559814453125, 1.042236328125, 1.15887451171875, 1.2755126953125, 1.39215087890625, 1.5087890625, 1.62542724609375, 1.7420654296875, 1.85870361328125, 1.975341796875, 2.09197998046875, 2.2086181640625, 2.32525634765625, 2.44189453125, 2.55853271484375, 2.6751708984375, 2.79180908203125, 2.908447265625, 3.02508544921875, 3.1417236328125, 3.25836181640625, 3.375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 10.0, 22.0, 27.0, 48.0, 47.0, 89.0, 134.0, 244.0, 343.0, 551.0, 834.0, 1221.0, 1916.0, 2766.0, 4489.0, 6857.0, 10968.0, 18066.0, 29198.0, 50138.0, 92572.0, 191853.0, 287498.0, 157782.0, 78270.0, 43655.0, 25924.0, 15704.0, 9562.0, 6251.0, 4081.0, 2633.0, 1638.0, 1104.0, 695.0, 457.0, 324.0, 207.0, 116.0, 101.0, 57.0, 34.0, 19.0, 16.0, 9.0, 8.0, 5.0, 6.0, 2.0, 5.0, 0.0, 1.0], "bins": [-2.546875, -2.4727783203125, -2.398681640625, -2.3245849609375, -2.25048828125, -2.1763916015625, -2.102294921875, -2.0281982421875, -1.9541015625, -1.8800048828125, -1.805908203125, -1.7318115234375, -1.65771484375, -1.5836181640625, -1.509521484375, -1.4354248046875, -1.361328125, -1.2872314453125, -1.213134765625, -1.1390380859375, -1.06494140625, -0.9908447265625, -0.916748046875, -0.8426513671875, -0.7685546875, -0.6944580078125, -0.620361328125, -0.5462646484375, -0.47216796875, -0.3980712890625, -0.323974609375, -0.2498779296875, -0.17578125, -0.1016845703125, -0.027587890625, 0.0465087890625, 0.12060546875, 0.1947021484375, 0.268798828125, 0.3428955078125, 0.4169921875, 0.4910888671875, 0.565185546875, 0.6392822265625, 0.71337890625, 0.7874755859375, 0.861572265625, 0.9356689453125, 1.009765625, 1.0838623046875, 1.157958984375, 1.2320556640625, 1.30615234375, 1.3802490234375, 1.454345703125, 1.5284423828125, 1.6025390625, 1.6766357421875, 1.750732421875, 1.8248291015625, 1.89892578125, 1.9730224609375, 2.047119140625, 2.1212158203125, 2.1953125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 5.0, 3.0, 6.0, 8.0, 6.0, 7.0, 11.0, 5.0, 12.0, 12.0, 10.0, 13.0, 24.0, 25.0, 27.0, 32.0, 23.0, 24.0, 42.0, 35.0, 48.0, 58.0, 141.0, 329.0, 1411.0, 187.0, 85.0, 54.0, 49.0, 41.0, 34.0, 51.0, 28.0, 25.0, 21.0, 23.0, 17.0, 24.0, 24.0, 8.0, 11.0, 15.0, 10.0, 6.0, 6.0, 5.0, 4.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-8.9375, -8.66796875, -8.3984375, -8.12890625, -7.859375, -7.58984375, -7.3203125, -7.05078125, -6.78125, -6.51171875, -6.2421875, -5.97265625, -5.703125, -5.43359375, -5.1640625, -4.89453125, -4.625, -4.35546875, -4.0859375, -3.81640625, -3.546875, -3.27734375, -3.0078125, -2.73828125, -2.46875, -2.19921875, -1.9296875, -1.66015625, -1.390625, -1.12109375, -0.8515625, -0.58203125, -0.3125, -0.04296875, 0.2265625, 0.49609375, 0.765625, 1.03515625, 1.3046875, 1.57421875, 1.84375, 2.11328125, 2.3828125, 2.65234375, 2.921875, 3.19140625, 3.4609375, 3.73046875, 4.0, 4.26953125, 4.5390625, 4.80859375, 5.078125, 5.34765625, 5.6171875, 5.88671875, 6.15625, 6.42578125, 6.6953125, 6.96484375, 7.234375, 7.50390625, 7.7734375, 8.04296875, 8.3125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 7.0, 6.0, 4.0, 13.0, 19.0, 18.0, 13.0, 16.0, 35.0, 30.0, 40.0, 36.0, 71.0, 74.0, 105.0, 165.0, 163.0, 300.0, 528.0, 1841.0, 11717.0, 136702.0, 2772118.0, 202294.0, 15721.0, 2064.0, 548.0, 297.0, 165.0, 120.0, 107.0, 75.0, 69.0, 52.0, 39.0, 24.0, 22.0, 21.0, 11.0, 7.0, 9.0, 9.0, 5.0, 7.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.5078125, -11.1431884765625, -10.778564453125, -10.4139404296875, -10.04931640625, -9.6846923828125, -9.320068359375, -8.9554443359375, -8.5908203125, -8.2261962890625, -7.861572265625, -7.4969482421875, -7.13232421875, -6.7677001953125, -6.403076171875, -6.0384521484375, -5.673828125, -5.3092041015625, -4.944580078125, -4.5799560546875, -4.21533203125, -3.8507080078125, -3.486083984375, -3.1214599609375, -2.7568359375, -2.3922119140625, -2.027587890625, -1.6629638671875, -1.29833984375, -0.9337158203125, -0.569091796875, -0.2044677734375, 0.16015625, 0.5247802734375, 0.889404296875, 1.2540283203125, 1.61865234375, 1.9832763671875, 2.347900390625, 2.7125244140625, 3.0771484375, 3.4417724609375, 3.806396484375, 4.1710205078125, 4.53564453125, 4.9002685546875, 5.264892578125, 5.6295166015625, 5.994140625, 6.3587646484375, 6.723388671875, 7.0880126953125, 7.45263671875, 7.8172607421875, 8.181884765625, 8.5465087890625, 8.9111328125, 9.2757568359375, 9.640380859375, 10.0050048828125, 10.36962890625, 10.7342529296875, 11.098876953125, 11.4635009765625, 11.828125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [197.0, 780.0, 40.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.472397327423096, -1.4493160247802734, 2.573765277862549, 6.596847057342529, 10.619928359985352, 14.643009185791016, 18.666091918945312, 22.689172744750977, 26.71225357055664, 30.735334396362305, 34.75841522216797, 38.781497955322266, 42.80458068847656, 46.827659606933594, 50.85074234008789, 54.87382507324219, 58.89690399169922, 62.919986724853516, 66.94306945800781, 70.96614837646484, 74.98922729492188, 79.01231384277344, 83.03539276123047, 87.0584716796875, 91.08155059814453, 95.10462951660156, 99.12771606445312, 103.15079498291016, 107.17387390136719, 111.19696044921875, 115.22003936767578, 119.24311828613281, 123.26618957519531, 127.28926849365234, 131.31234741210938, 135.33543395996094, 139.3585205078125, 143.381591796875, 147.40467834472656, 151.42776489257812, 155.45083618164062, 159.4739227294922, 163.4969940185547, 167.52008056640625, 171.5431671142578, 175.5662384033203, 179.58932495117188, 183.61241149902344, 187.635498046875, 191.65858459472656, 195.68165588378906, 199.70474243164062, 203.7278289794922, 207.7509002685547, 211.77398681640625, 215.7970733642578, 219.8201446533203, 223.84323120117188, 227.86630249023438, 231.88938903808594, 235.9124755859375, 239.935546875, 243.95863342285156, 247.98171997070312, 252.00479125976562]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 4.0, 7.0, 6.0, 4.0, 6.0, 6.0, 8.0, 8.0, 11.0, 12.0, 13.0, 14.0, 13.0, 24.0, 13.0, 15.0, 29.0, 26.0, 26.0, 25.0, 24.0, 28.0, 29.0, 35.0, 35.0, 26.0, 34.0, 54.0, 42.0, 35.0, 40.0, 24.0, 32.0, 22.0, 36.0, 29.0, 17.0, 21.0, 27.0, 21.0, 19.0, 18.0, 11.0, 16.0, 14.0, 10.0, 7.0, 4.0, 4.0, 8.0, 3.0, 6.0, 2.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-21.229881286621094, -20.539918899536133, -19.84995460510254, -19.159992218017578, -18.470027923583984, -17.780065536499023, -17.090103149414062, -16.40013885498047, -15.710175514221191, -15.020212173461914, -14.330248832702637, -13.64028549194336, -12.950323104858398, -12.260358810424805, -11.570396423339844, -10.880433082580566, -10.190469741821289, -9.500506401062012, -8.810543060302734, -8.120580673217773, -7.430616855621338, -6.7406535148620605, -6.050690650939941, -5.360727310180664, -4.670763969421387, -3.9808006286621094, -3.290837526321411, -2.600874423980713, -1.9109110832214355, -1.2209477424621582, -0.5309848785400391, 0.15897846221923828, 0.8489437103271484, 1.5389069318771362, 2.228870153427124, 2.9188332557678223, 3.6087965965270996, 4.298759937286377, 4.988722801208496, 5.678686141967773, 6.368649482727051, 7.058612823486328, 7.7485761642456055, 8.438539505004883, 9.128501892089844, 9.818466186523438, 10.508428573608398, 11.198391914367676, 11.888355255126953, 12.57831859588623, 13.268281936645508, 13.958244323730469, 14.648208618164062, 15.338171005249023, 16.028133392333984, 16.718097686767578, 17.408061981201172, 18.098024368286133, 18.787988662719727, 19.477951049804688, 20.16791534423828, 20.857877731323242, 21.547840118408203, 22.237804412841797, 22.927766799926758]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 7.0, 2.0, 10.0, 15.0, 14.0, 13.0, 28.0, 26.0, 34.0, 42.0, 27.0, 31.0, 42.0, 34.0, 45.0, 54.0, 46.0, 43.0, 62.0, 39.0, 42.0, 41.0, 43.0, 39.0, 38.0, 24.0, 22.0, 29.0, 21.0, 18.0, 18.0, 11.0, 9.0, 13.0, 6.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.140625, -4.024261474609375, -3.90789794921875, -3.791534423828125, -3.6751708984375, -3.558807373046875, -3.44244384765625, -3.326080322265625, -3.209716796875, -3.093353271484375, -2.97698974609375, -2.860626220703125, -2.7442626953125, -2.627899169921875, -2.51153564453125, -2.395172119140625, -2.27880859375, -2.162445068359375, -2.04608154296875, -1.929718017578125, -1.8133544921875, -1.696990966796875, -1.58062744140625, -1.464263916015625, -1.347900390625, -1.231536865234375, -1.11517333984375, -0.998809814453125, -0.8824462890625, -0.766082763671875, -0.64971923828125, -0.533355712890625, -0.4169921875, -0.300628662109375, -0.18426513671875, -0.067901611328125, 0.0484619140625, 0.164825439453125, 0.28118896484375, 0.397552490234375, 0.513916015625, 0.630279541015625, 0.74664306640625, 0.863006591796875, 0.9793701171875, 1.095733642578125, 1.21209716796875, 1.328460693359375, 1.44482421875, 1.561187744140625, 1.67755126953125, 1.793914794921875, 1.9102783203125, 2.026641845703125, 2.14300537109375, 2.259368896484375, 2.375732421875, 2.492095947265625, 2.60845947265625, 2.724822998046875, 2.8411865234375, 2.957550048828125, 3.07391357421875, 3.190277099609375, 3.306640625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 5.0, 3.0, 1.0, 9.0, 7.0, 9.0, 13.0, 21.0, 20.0, 18.0, 23.0, 33.0, 36.0, 51.0, 96.0, 279.0, 823.0, 3291.0, 15294.0, 99169.0, 1134971.0, 2634752.0, 263464.0, 32956.0, 6483.0, 1566.0, 453.0, 152.0, 69.0, 56.0, 33.0, 20.0, 22.0, 14.0, 13.0, 12.0, 15.0, 13.0, 3.0, 7.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.125, -7.846923828125, -7.56884765625, -7.290771484375, -7.0126953125, -6.734619140625, -6.45654296875, -6.178466796875, -5.900390625, -5.622314453125, -5.34423828125, -5.066162109375, -4.7880859375, -4.510009765625, -4.23193359375, -3.953857421875, -3.67578125, -3.397705078125, -3.11962890625, -2.841552734375, -2.5634765625, -2.285400390625, -2.00732421875, -1.729248046875, -1.451171875, -1.173095703125, -0.89501953125, -0.616943359375, -0.3388671875, -0.060791015625, 0.21728515625, 0.495361328125, 0.7734375, 1.051513671875, 1.32958984375, 1.607666015625, 1.8857421875, 2.163818359375, 2.44189453125, 2.719970703125, 2.998046875, 3.276123046875, 3.55419921875, 3.832275390625, 4.1103515625, 4.388427734375, 4.66650390625, 4.944580078125, 5.22265625, 5.500732421875, 5.77880859375, 6.056884765625, 6.3349609375, 6.613037109375, 6.89111328125, 7.169189453125, 7.447265625, 7.725341796875, 8.00341796875, 8.281494140625, 8.5595703125, 8.837646484375, 9.11572265625, 9.393798828125, 9.671875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 6.0, 13.0, 13.0, 27.0, 32.0, 47.0, 64.0, 94.0, 116.0, 137.0, 235.0, 318.0, 437.0, 540.0, 510.0, 408.0, 306.0, 212.0, 145.0, 110.0, 84.0, 59.0, 37.0, 27.0, 28.0, 25.0, 5.0, 7.0, 13.0, 2.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.0078125, -6.8123779296875, -6.616943359375, -6.4215087890625, -6.22607421875, -6.0306396484375, -5.835205078125, -5.6397705078125, -5.4443359375, -5.2489013671875, -5.053466796875, -4.8580322265625, -4.66259765625, -4.4671630859375, -4.271728515625, -4.0762939453125, -3.880859375, -3.6854248046875, -3.489990234375, -3.2945556640625, -3.09912109375, -2.9036865234375, -2.708251953125, -2.5128173828125, -2.3173828125, -2.1219482421875, -1.926513671875, -1.7310791015625, -1.53564453125, -1.3402099609375, -1.144775390625, -0.9493408203125, -0.75390625, -0.5584716796875, -0.363037109375, -0.1676025390625, 0.02783203125, 0.2232666015625, 0.418701171875, 0.6141357421875, 0.8095703125, 1.0050048828125, 1.200439453125, 1.3958740234375, 1.59130859375, 1.7867431640625, 1.982177734375, 2.1776123046875, 2.373046875, 2.5684814453125, 2.763916015625, 2.9593505859375, 3.15478515625, 3.3502197265625, 3.545654296875, 3.7410888671875, 3.9365234375, 4.1319580078125, 4.327392578125, 4.5228271484375, 4.71826171875, 4.9136962890625, 5.109130859375, 5.3045654296875, 5.5]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 2.0, 5.0, 6.0, 7.0, 8.0, 21.0, 10.0, 25.0, 35.0, 42.0, 51.0, 65.0, 86.0, 127.0, 191.0, 199.0, 357.0, 740.0, 4168.0, 86896.0, 3520138.0, 564348.0, 13923.0, 1397.0, 468.0, 265.0, 181.0, 125.0, 105.0, 98.0, 55.0, 39.0, 38.0, 14.0, 20.0, 9.0, 11.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.875, -18.218017578125, -17.56103515625, -16.904052734375, -16.2470703125, -15.590087890625, -14.93310546875, -14.276123046875, -13.619140625, -12.962158203125, -12.30517578125, -11.648193359375, -10.9912109375, -10.334228515625, -9.67724609375, -9.020263671875, -8.36328125, -7.706298828125, -7.04931640625, -6.392333984375, -5.7353515625, -5.078369140625, -4.42138671875, -3.764404296875, -3.107421875, -2.450439453125, -1.79345703125, -1.136474609375, -0.4794921875, 0.177490234375, 0.83447265625, 1.491455078125, 2.1484375, 2.805419921875, 3.46240234375, 4.119384765625, 4.7763671875, 5.433349609375, 6.09033203125, 6.747314453125, 7.404296875, 8.061279296875, 8.71826171875, 9.375244140625, 10.0322265625, 10.689208984375, 11.34619140625, 12.003173828125, 12.66015625, 13.317138671875, 13.97412109375, 14.631103515625, 15.2880859375, 15.945068359375, 16.60205078125, 17.259033203125, 17.916015625, 18.572998046875, 19.22998046875, 19.886962890625, 20.5439453125, 21.200927734375, 21.85791015625, 22.514892578125, 23.171875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 19.0, 28.0, 59.0, 83.0, 116.0, 136.0, 144.0, 138.0, 110.0, 72.0, 49.0, 25.0, 12.0, 9.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.35489273071289, -45.3507080078125, -44.346527099609375, -43.342342376708984, -42.338157653808594, -41.3339729309082, -40.32978820800781, -39.32560729980469, -38.3214225769043, -37.317237854003906, -36.31305694580078, -35.30887222290039, -34.3046875, -33.30050277709961, -32.29631805419922, -31.292137145996094, -30.287952423095703, -29.283767700195312, -28.279584884643555, -27.275402069091797, -26.271217346191406, -25.267032623291016, -24.262849807739258, -23.2586669921875, -22.25448226928711, -21.25029754638672, -20.24611473083496, -19.241931915283203, -18.237747192382812, -17.233562469482422, -16.229379653930664, -15.22519588470459, -14.22100830078125, -13.216824531555176, -12.212640762329102, -11.208456993103027, -10.204273223876953, -9.200089454650879, -8.195905685424805, -7.1917219161987305, -6.187538146972656, -5.183354377746582, -4.179170608520508, -3.1749868392944336, -2.1708030700683594, -1.1666193008422852, -0.16243553161621094, 0.8417482376098633, 1.8459320068359375, 2.8501157760620117, 3.854299545288086, 4.85848331451416, 5.862667083740234, 6.866850852966309, 7.871034622192383, 8.875218391418457, 9.879402160644531, 10.883585929870605, 11.88776969909668, 12.891953468322754, 13.896137237548828, 14.900321006774902, 15.904504776000977, 16.908687591552734, 17.912872314453125]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 2.0, 3.0, 4.0, 6.0, 10.0, 9.0, 11.0, 15.0, 19.0, 24.0, 22.0, 29.0, 21.0, 38.0, 39.0, 26.0, 33.0, 44.0, 39.0, 42.0, 50.0, 43.0, 36.0, 41.0, 38.0, 35.0, 28.0, 35.0, 43.0, 19.0, 26.0, 27.0, 20.0, 22.0, 14.0, 21.0, 17.0, 16.0, 7.0, 10.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.529922485351562, -18.9344539642334, -18.338987350463867, -17.743518829345703, -17.148052215576172, -16.552583694458008, -15.957115173339844, -15.361647605895996, -14.766180038452148, -14.1707124710083, -13.575244903564453, -12.979776382446289, -12.384308815002441, -11.788841247558594, -11.19337272644043, -10.597905158996582, -10.002437591552734, -9.406970024108887, -8.811502456665039, -8.216033935546875, -7.620566368103027, -7.02509880065918, -6.429630756378174, -5.834162712097168, -5.23869514465332, -4.643227577209473, -4.047759532928467, -3.45229172706604, -2.8568239212036133, -2.2613561153411865, -1.6658883094787598, -1.070420265197754, -0.47495269775390625, 0.12051510810852051, 0.7159829139709473, 1.311450719833374, 1.9069185256958008, 2.5023863315582275, 3.0978541374206543, 3.69332218170166, 4.288789749145508, 4.8842573165893555, 5.479725360870361, 6.075193405151367, 6.670660972595215, 7.2661285400390625, 7.861596584320068, 8.457064628601074, 9.052532196044922, 9.64799976348877, 10.243467330932617, 10.838935852050781, 11.434403419494629, 12.029870986938477, 12.62533950805664, 13.220807075500488, 13.816274642944336, 14.411742210388184, 15.007209777832031, 15.602678298950195, 16.19814682006836, 16.79361343383789, 17.389081954956055, 17.98455047607422, 18.58001708984375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 10.0, 10.0, 15.0, 12.0, 17.0, 20.0, 29.0, 30.0, 29.0, 31.0, 41.0, 39.0, 42.0, 51.0, 51.0, 45.0, 43.0, 43.0, 40.0, 52.0, 45.0, 44.0, 34.0, 33.0, 31.0, 28.0, 18.0, 17.0, 18.0, 17.0, 14.0, 8.0, 12.0, 10.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.41796875, -4.300048828125, -4.18212890625, -4.064208984375, -3.9462890625, -3.828369140625, -3.71044921875, -3.592529296875, -3.474609375, -3.356689453125, -3.23876953125, -3.120849609375, -3.0029296875, -2.885009765625, -2.76708984375, -2.649169921875, -2.53125, -2.413330078125, -2.29541015625, -2.177490234375, -2.0595703125, -1.941650390625, -1.82373046875, -1.705810546875, -1.587890625, -1.469970703125, -1.35205078125, -1.234130859375, -1.1162109375, -0.998291015625, -0.88037109375, -0.762451171875, -0.64453125, -0.526611328125, -0.40869140625, -0.290771484375, -0.1728515625, -0.054931640625, 0.06298828125, 0.180908203125, 0.298828125, 0.416748046875, 0.53466796875, 0.652587890625, 0.7705078125, 0.888427734375, 1.00634765625, 1.124267578125, 1.2421875, 1.360107421875, 1.47802734375, 1.595947265625, 1.7138671875, 1.831787109375, 1.94970703125, 2.067626953125, 2.185546875, 2.303466796875, 2.42138671875, 2.539306640625, 2.6572265625, 2.775146484375, 2.89306640625, 3.010986328125, 3.12890625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 6.0, 10.0, 12.0, 23.0, 29.0, 56.0, 69.0, 90.0, 169.0, 248.0, 396.0, 578.0, 963.0, 1432.0, 2373.0, 3590.0, 5747.0, 9156.0, 14667.0, 24134.0, 39981.0, 69366.0, 134177.0, 312686.0, 202415.0, 93838.0, 51823.0, 30774.0, 18649.0, 11419.0, 7153.0, 4603.0, 2862.0, 1819.0, 1121.0, 756.0, 464.0, 330.0, 188.0, 135.0, 86.0, 55.0, 31.0, 30.0, 15.0, 13.0, 5.0, 8.0, 4.0, 1.0, 3.0, 0.0, 1.0, 4.0], "bins": [-0.020111083984375, -0.019515037536621094, -0.018918991088867188, -0.01832294464111328, -0.017726898193359375, -0.01713085174560547, -0.016534805297851562, -0.015938758850097656, -0.01534271240234375, -0.014746665954589844, -0.014150619506835938, -0.013554573059082031, -0.012958526611328125, -0.012362480163574219, -0.011766433715820312, -0.011170387268066406, -0.0105743408203125, -0.009978294372558594, -0.009382247924804688, -0.008786201477050781, -0.008190155029296875, -0.007594108581542969, -0.0069980621337890625, -0.006402015686035156, -0.00580596923828125, -0.005209922790527344, -0.0046138763427734375, -0.004017829895019531, -0.003421783447265625, -0.0028257369995117188, -0.0022296905517578125, -0.0016336441040039062, -0.00103759765625, -0.00044155120849609375, 0.0001544952392578125, 0.0007505416870117188, 0.001346588134765625, 0.0019426345825195312, 0.0025386810302734375, 0.0031347274780273438, 0.00373077392578125, 0.004326820373535156, 0.0049228668212890625, 0.005518913269042969, 0.006114959716796875, 0.006711006164550781, 0.0073070526123046875, 0.007903099060058594, 0.0084991455078125, 0.009095191955566406, 0.009691238403320312, 0.010287284851074219, 0.010883331298828125, 0.011479377746582031, 0.012075424194335938, 0.012671470642089844, 0.01326751708984375, 0.013863563537597656, 0.014459609985351562, 0.015055656433105469, 0.015651702880859375, 0.01624774932861328, 0.016843795776367188, 0.017439842224121094, 0.018035888671875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 11.0, 4.0, 9.0, 5.0, 2.0, 7.0, 11.0, 16.0, 24.0, 20.0, 31.0, 23.0, 26.0, 37.0, 33.0, 59.0, 41.0, 49.0, 40.0, 48.0, 1067.0, 45.0, 29.0, 48.0, 49.0, 34.0, 47.0, 30.0, 25.0, 32.0, 28.0, 18.0, 12.0, 13.0, 13.0, 14.0, 9.0, 8.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.23828125, -2.16455078125, -2.0908203125, -2.01708984375, -1.943359375, -1.86962890625, -1.7958984375, -1.72216796875, -1.6484375, -1.57470703125, -1.5009765625, -1.42724609375, -1.353515625, -1.27978515625, -1.2060546875, -1.13232421875, -1.05859375, -0.98486328125, -0.9111328125, -0.83740234375, -0.763671875, -0.68994140625, -0.6162109375, -0.54248046875, -0.46875, -0.39501953125, -0.3212890625, -0.24755859375, -0.173828125, -0.10009765625, -0.0263671875, 0.04736328125, 0.12109375, 0.19482421875, 0.2685546875, 0.34228515625, 0.416015625, 0.48974609375, 0.5634765625, 0.63720703125, 0.7109375, 0.78466796875, 0.8583984375, 0.93212890625, 1.005859375, 1.07958984375, 1.1533203125, 1.22705078125, 1.30078125, 1.37451171875, 1.4482421875, 1.52197265625, 1.595703125, 1.66943359375, 1.7431640625, 1.81689453125, 1.890625, 1.96435546875, 2.0380859375, 2.11181640625, 2.185546875, 2.25927734375, 2.3330078125, 2.40673828125, 2.48046875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 11.0, 15.0, 34.0, 49.0, 59.0, 98.0, 109.0, 191.0, 305.0, 456.0, 638.0, 1001.0, 1557.0, 2583.0, 3988.0, 6580.0, 10695.0, 18159.0, 31321.0, 55978.0, 106821.0, 251026.0, 1336967.0, 121379.0, 61876.0, 34422.0, 19891.0, 11864.0, 6995.0, 4352.0, 2743.0, 1705.0, 1141.0, 712.0, 483.0, 306.0, 181.0, 128.0, 79.0, 56.0, 46.0, 46.0, 29.0, 17.0, 11.0, 7.0, 7.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.0148773193359375, -0.014427661895751953, -0.013978004455566406, -0.01352834701538086, -0.013078689575195312, -0.012629032135009766, -0.012179374694824219, -0.011729717254638672, -0.011280059814453125, -0.010830402374267578, -0.010380744934082031, -0.009931087493896484, -0.009481430053710938, -0.00903177261352539, -0.008582115173339844, -0.008132457733154297, -0.00768280029296875, -0.007233142852783203, -0.006783485412597656, -0.006333827972412109, -0.0058841705322265625, -0.005434513092041016, -0.004984855651855469, -0.004535198211669922, -0.004085540771484375, -0.003635883331298828, -0.0031862258911132812, -0.0027365684509277344, -0.0022869110107421875, -0.0018372535705566406, -0.0013875961303710938, -0.0009379386901855469, -0.00048828125, -3.8623809814453125e-05, 0.00041103363037109375, 0.0008606910705566406, 0.0013103485107421875, 0.0017600059509277344, 0.0022096633911132812, 0.002659320831298828, 0.003108978271484375, 0.003558635711669922, 0.004008293151855469, 0.004457950592041016, 0.0049076080322265625, 0.005357265472412109, 0.005806922912597656, 0.006256580352783203, 0.00670623779296875, 0.007155895233154297, 0.007605552673339844, 0.00805521011352539, 0.008504867553710938, 0.008954524993896484, 0.009404182434082031, 0.009853839874267578, 0.010303497314453125, 0.010753154754638672, 0.011202812194824219, 0.011652469635009766, 0.012102127075195312, 0.01255178451538086, 0.013001441955566406, 0.013451099395751953, 0.0139007568359375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 109.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 776.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 105.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0], "bins": [-1.7881393432617188e-07, -1.7415732145309448e-07, -1.695007085800171e-07, -1.648440957069397e-07, -1.601874828338623e-07, -1.555308699607849e-07, -1.5087425708770752e-07, -1.4621764421463013e-07, -1.4156103134155273e-07, -1.3690441846847534e-07, -1.3224780559539795e-07, -1.2759119272232056e-07, -1.2293457984924316e-07, -1.1827796697616577e-07, -1.1362135410308838e-07, -1.0896474123001099e-07, -1.043081283569336e-07, -9.96515154838562e-08, -9.499490261077881e-08, -9.033828973770142e-08, -8.568167686462402e-08, -8.102506399154663e-08, -7.636845111846924e-08, -7.171183824539185e-08, -6.705522537231445e-08, -6.239861249923706e-08, -5.774199962615967e-08, -5.3085386753082275e-08, -4.842877388000488e-08, -4.377216100692749e-08, -3.91155481338501e-08, -3.4458935260772705e-08, -2.9802322387695312e-08, -2.514570951461792e-08, -2.0489096641540527e-08, -1.5832483768463135e-08, -1.1175870895385742e-08, -6.51925802230835e-09, -1.862645149230957e-09, 2.7939677238464355e-09, 7.450580596923828e-09, 1.210719347000122e-08, 1.6763806343078613e-08, 2.1420419216156006e-08, 2.60770320892334e-08, 3.073364496231079e-08, 3.5390257835388184e-08, 4.0046870708465576e-08, 4.470348358154297e-08, 4.936009645462036e-08, 5.4016709327697754e-08, 5.8673322200775146e-08, 6.332993507385254e-08, 6.798654794692993e-08, 7.264316082000732e-08, 7.729977369308472e-08, 8.195638656616211e-08, 8.66129994392395e-08, 9.12696123123169e-08, 9.592622518539429e-08, 1.0058283805847168e-07, 1.0523945093154907e-07, 1.0989606380462646e-07, 1.1455267667770386e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 35.0, 44.0, 27.0, 6.0, 2.0, 0.0, 1.0, 85.0, 51.0, 89.0, 307.0, 4777.0, 986377.0, 55593.0, 464.0, 312.0, 93.0, 54.0, 82.0, 7.0, 0.0, 1.0, 21.0, 14.0, 31.0, 47.0, 11.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9206275939941406e-06, -2.8079375624656677e-06, -2.695247530937195e-06, -2.582557499408722e-06, -2.469867467880249e-06, -2.357177436351776e-06, -2.2444874048233032e-06, -2.1317973732948303e-06, -2.0191073417663574e-06, -1.9064173102378845e-06, -1.7937272787094116e-06, -1.6810372471809387e-06, -1.5683472156524658e-06, -1.455657184123993e-06, -1.34296715259552e-06, -1.2302771210670471e-06, -1.1175870895385742e-06, -1.0048970580101013e-06, -8.922070264816284e-07, -7.795169949531555e-07, -6.668269634246826e-07, -5.541369318962097e-07, -4.414469003677368e-07, -3.287568688392639e-07, -2.1606683731079102e-07, -1.0337680578231812e-07, 9.313225746154785e-09, 1.2200325727462769e-07, 2.3469328880310059e-07, 3.473833203315735e-07, 4.600733518600464e-07, 5.727633833885193e-07, 6.854534149169922e-07, 7.981434464454651e-07, 9.10833477973938e-07, 1.0235235095024109e-06, 1.1362135410308838e-06, 1.2489035725593567e-06, 1.3615936040878296e-06, 1.4742836356163025e-06, 1.5869736671447754e-06, 1.6996636986732483e-06, 1.8123537302017212e-06, 1.925043761730194e-06, 2.037733793258667e-06, 2.15042382478714e-06, 2.263113856315613e-06, 2.3758038878440857e-06, 2.4884939193725586e-06, 2.6011839509010315e-06, 2.7138739824295044e-06, 2.8265640139579773e-06, 2.93925404548645e-06, 3.051944077014923e-06, 3.164634108543396e-06, 3.277324140071869e-06, 3.390014171600342e-06, 3.5027042031288147e-06, 3.6153942346572876e-06, 3.7280842661857605e-06, 3.840774297714233e-06, 3.953464329242706e-06, 4.066154360771179e-06, 4.178844392299652e-06, 4.291534423828125e-06]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 10.0, 10.0, 15.0, 12.0, 17.0, 20.0, 29.0, 30.0, 29.0, 31.0, 41.0, 39.0, 42.0, 51.0, 51.0, 45.0, 43.0, 43.0, 40.0, 52.0, 45.0, 44.0, 34.0, 33.0, 31.0, 28.0, 18.0, 17.0, 18.0, 17.0, 14.0, 8.0, 12.0, 10.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.41796875, -4.300048828125, -4.18212890625, -4.064208984375, -3.9462890625, -3.828369140625, -3.71044921875, -3.592529296875, -3.474609375, -3.356689453125, -3.23876953125, -3.120849609375, -3.0029296875, -2.885009765625, -2.76708984375, -2.649169921875, -2.53125, -2.413330078125, -2.29541015625, -2.177490234375, -2.0595703125, -1.941650390625, -1.82373046875, -1.705810546875, -1.587890625, -1.469970703125, -1.35205078125, -1.234130859375, -1.1162109375, -0.998291015625, -0.88037109375, -0.762451171875, -0.64453125, -0.526611328125, -0.40869140625, -0.290771484375, -0.1728515625, -0.054931640625, 0.06298828125, 0.180908203125, 0.298828125, 0.416748046875, 0.53466796875, 0.652587890625, 0.7705078125, 0.888427734375, 1.00634765625, 1.124267578125, 1.2421875, 1.360107421875, 1.47802734375, 1.595947265625, 1.7138671875, 1.831787109375, 1.94970703125, 2.067626953125, 2.185546875, 2.303466796875, 2.42138671875, 2.539306640625, 2.6572265625, 2.775146484375, 2.89306640625, 3.010986328125, 3.12890625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 10.0, 17.0, 15.0, 21.0, 22.0, 48.0, 56.0, 95.0, 139.0, 248.0, 498.0, 1304.0, 3274.0, 8835.0, 25915.0, 96336.0, 645350.0, 203489.0, 41143.0, 13318.0, 4959.0, 1918.0, 724.0, 334.0, 172.0, 86.0, 61.0, 35.0, 28.0, 23.0, 20.0, 9.0, 18.0, 9.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-7.484375, -7.28582763671875, -7.0872802734375, -6.88873291015625, -6.690185546875, -6.49163818359375, -6.2930908203125, -6.09454345703125, -5.89599609375, -5.69744873046875, -5.4989013671875, -5.30035400390625, -5.101806640625, -4.90325927734375, -4.7047119140625, -4.50616455078125, -4.3076171875, -4.10906982421875, -3.9105224609375, -3.71197509765625, -3.513427734375, -3.31488037109375, -3.1163330078125, -2.91778564453125, -2.71923828125, -2.52069091796875, -2.3221435546875, -2.12359619140625, -1.925048828125, -1.72650146484375, -1.5279541015625, -1.32940673828125, -1.130859375, -0.93231201171875, -0.7337646484375, -0.53521728515625, -0.336669921875, -0.13812255859375, 0.0604248046875, 0.25897216796875, 0.45751953125, 0.65606689453125, 0.8546142578125, 1.05316162109375, 1.251708984375, 1.45025634765625, 1.6488037109375, 1.84735107421875, 2.0458984375, 2.24444580078125, 2.4429931640625, 2.64154052734375, 2.840087890625, 3.03863525390625, 3.2371826171875, 3.43572998046875, 3.63427734375, 3.83282470703125, 4.0313720703125, 4.22991943359375, 4.428466796875, 4.62701416015625, 4.8255615234375, 5.02410888671875, 5.22265625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 2.0, 4.0, 5.0, 12.0, 11.0, 19.0, 17.0, 19.0, 30.0, 28.0, 37.0, 32.0, 36.0, 51.0, 52.0, 52.0, 108.0, 453.0, 1536.0, 119.0, 60.0, 69.0, 33.0, 31.0, 39.0, 34.0, 23.0, 21.0, 22.0, 21.0, 9.0, 15.0, 8.0, 16.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.7734375, -11.3946533203125, -11.015869140625, -10.6370849609375, -10.25830078125, -9.8795166015625, -9.500732421875, -9.1219482421875, -8.7431640625, -8.3643798828125, -7.985595703125, -7.6068115234375, -7.22802734375, -6.8492431640625, -6.470458984375, -6.0916748046875, -5.712890625, -5.3341064453125, -4.955322265625, -4.5765380859375, -4.19775390625, -3.8189697265625, -3.440185546875, -3.0614013671875, -2.6826171875, -2.3038330078125, -1.925048828125, -1.5462646484375, -1.16748046875, -0.7886962890625, -0.409912109375, -0.0311279296875, 0.34765625, 0.7264404296875, 1.105224609375, 1.4840087890625, 1.86279296875, 2.2415771484375, 2.620361328125, 2.9991455078125, 3.3779296875, 3.7567138671875, 4.135498046875, 4.5142822265625, 4.89306640625, 5.2718505859375, 5.650634765625, 6.0294189453125, 6.408203125, 6.7869873046875, 7.165771484375, 7.5445556640625, 7.92333984375, 8.3021240234375, 8.680908203125, 9.0596923828125, 9.4384765625, 9.8172607421875, 10.196044921875, 10.5748291015625, 10.95361328125, 11.3323974609375, 11.711181640625, 12.0899658203125, 12.46875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 7.0, 15.0, 7.0, 15.0, 10.0, 20.0, 27.0, 27.0, 44.0, 52.0, 60.0, 89.0, 124.0, 282.0, 830.0, 5757.0, 227039.0, 2892944.0, 15800.0, 1564.0, 358.0, 180.0, 104.0, 91.0, 60.0, 41.0, 28.0, 31.0, 25.0, 16.0, 17.0, 11.0, 9.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-22.875, -22.185791015625, -21.49658203125, -20.807373046875, -20.1181640625, -19.428955078125, -18.73974609375, -18.050537109375, -17.361328125, -16.672119140625, -15.98291015625, -15.293701171875, -14.6044921875, -13.915283203125, -13.22607421875, -12.536865234375, -11.84765625, -11.158447265625, -10.46923828125, -9.780029296875, -9.0908203125, -8.401611328125, -7.71240234375, -7.023193359375, -6.333984375, -5.644775390625, -4.95556640625, -4.266357421875, -3.5771484375, -2.887939453125, -2.19873046875, -1.509521484375, -0.8203125, -0.131103515625, 0.55810546875, 1.247314453125, 1.9365234375, 2.625732421875, 3.31494140625, 4.004150390625, 4.693359375, 5.382568359375, 6.07177734375, 6.760986328125, 7.4501953125, 8.139404296875, 8.82861328125, 9.517822265625, 10.20703125, 10.896240234375, 11.58544921875, 12.274658203125, 12.9638671875, 13.653076171875, 14.34228515625, 15.031494140625, 15.720703125, 16.409912109375, 17.09912109375, 17.788330078125, 18.4775390625, 19.166748046875, 19.85595703125, 20.545166015625, 21.234375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [28.0, 143.0, 432.0, 319.0, 81.0, 14.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.330500602722168, -2.7925734519958496, -1.2546460628509521, 0.2832813262939453, 1.8212084770202637, 3.359135627746582, 4.897063255310059, 6.434989929199219, 7.972917556762695, 9.510845184326172, 11.048771858215332, 12.586699485778809, 14.124626159667969, 15.662553787231445, 17.200481414794922, 18.738407135009766, 20.276336669921875, 21.81426429748535, 23.352191925048828, 24.890117645263672, 26.42804527282715, 27.965972900390625, 29.5039005279541, 31.041828155517578, 32.57975387573242, 34.117679595947266, 35.655609130859375, 37.19353485107422, 38.73146438598633, 40.26939010620117, 41.80731964111328, 43.345245361328125, 44.883174896240234, 46.42110061645508, 47.95903015136719, 49.49695587158203, 51.03488540649414, 52.572811126708984, 54.110740661621094, 55.64866638183594, 57.18659210205078, 58.724517822265625, 60.262447357177734, 61.80037307739258, 63.33830261230469, 64.87622833251953, 66.41415405273438, 67.95207977294922, 69.4900131225586, 71.02793884277344, 72.56586456298828, 74.10379791259766, 75.6417236328125, 77.17964935302734, 78.71757507324219, 80.25550079345703, 81.79342651367188, 83.33135223388672, 84.86927795410156, 86.40721130371094, 87.94513702392578, 89.48306274414062, 91.02098846435547, 92.55891418457031, 94.09684753417969]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 5.0, 16.0, 7.0, 12.0, 13.0, 13.0, 30.0, 34.0, 31.0, 46.0, 43.0, 51.0, 51.0, 46.0, 49.0, 54.0, 49.0, 46.0, 51.0, 45.0, 54.0, 45.0, 34.0, 37.0, 35.0, 26.0, 22.0, 8.0, 12.0, 6.0, 14.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.21537399291992, -39.067710876464844, -37.920047760009766, -36.77238082885742, -35.624717712402344, -34.477054595947266, -33.32939147949219, -32.181724548339844, -31.034061431884766, -29.886398315429688, -28.738733291625977, -27.5910701751709, -26.443405151367188, -25.29574203491211, -24.14807891845703, -23.00041389465332, -21.852750778198242, -20.705087661743164, -19.557422637939453, -18.409759521484375, -17.262094497680664, -16.114431381225586, -14.966767311096191, -13.819103240966797, -12.671439170837402, -11.523775100708008, -10.376111030578613, -9.228446960449219, -8.08078384399414, -6.933119297027588, -5.785455703735352, -4.637791633605957, -3.4901275634765625, -2.342463493347168, -1.1947996616363525, -0.04713582992553711, 1.1005282402038574, 2.248192310333252, 3.3958559036254883, 4.543519973754883, 5.691184043884277, 6.838848114013672, 7.986512184143066, 9.134176254272461, 10.281839370727539, 11.42950439453125, 12.577167510986328, 13.724831581115723, 14.872495651245117, 16.020158767700195, 17.167823791503906, 18.315486907958984, 19.463151931762695, 20.610815048217773, 21.758480072021484, 22.906143188476562, 24.05380630493164, 25.20146942138672, 26.34913444519043, 27.496797561645508, 28.64446258544922, 29.792125701904297, 30.939788818359375, 32.08745574951172, 33.2351188659668]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 8.0, 7.0, 5.0, 11.0, 20.0, 22.0, 16.0, 19.0, 28.0, 23.0, 32.0, 34.0, 39.0, 46.0, 41.0, 48.0, 40.0, 44.0, 50.0, 40.0, 51.0, 48.0, 34.0, 34.0, 41.0, 36.0, 35.0, 19.0, 16.0, 15.0, 25.0, 17.0, 15.0, 10.0, 9.0, 12.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-4.48828125, -4.3675537109375, -4.246826171875, -4.1260986328125, -4.00537109375, -3.8846435546875, -3.763916015625, -3.6431884765625, -3.5224609375, -3.4017333984375, -3.281005859375, -3.1602783203125, -3.03955078125, -2.9188232421875, -2.798095703125, -2.6773681640625, -2.556640625, -2.4359130859375, -2.315185546875, -2.1944580078125, -2.07373046875, -1.9530029296875, -1.832275390625, -1.7115478515625, -1.5908203125, -1.4700927734375, -1.349365234375, -1.2286376953125, -1.10791015625, -0.9871826171875, -0.866455078125, -0.7457275390625, -0.625, -0.5042724609375, -0.383544921875, -0.2628173828125, -0.14208984375, -0.0213623046875, 0.099365234375, 0.2200927734375, 0.3408203125, 0.4615478515625, 0.582275390625, 0.7030029296875, 0.82373046875, 0.9444580078125, 1.065185546875, 1.1859130859375, 1.306640625, 1.4273681640625, 1.548095703125, 1.6688232421875, 1.78955078125, 1.9102783203125, 2.031005859375, 2.1517333984375, 2.2724609375, 2.3931884765625, 2.513916015625, 2.6346435546875, 2.75537109375, 2.8760986328125, 2.996826171875, 3.1175537109375, 3.23828125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 2.0, 4.0, 11.0, 16.0, 12.0, 18.0, 24.0, 22.0, 40.0, 37.0, 89.0, 152.0, 273.0, 722.0, 2000.0, 6019.0, 22149.0, 104480.0, 726278.0, 2583257.0, 623733.0, 94328.0, 21291.0, 5958.0, 1926.0, 708.0, 316.0, 146.0, 78.0, 37.0, 43.0, 28.0, 17.0, 11.0, 13.0, 12.0, 10.0, 6.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.59765625, -7.3636474609375, -7.129638671875, -6.8956298828125, -6.66162109375, -6.4276123046875, -6.193603515625, -5.9595947265625, -5.7255859375, -5.4915771484375, -5.257568359375, -5.0235595703125, -4.78955078125, -4.5555419921875, -4.321533203125, -4.0875244140625, -3.853515625, -3.6195068359375, -3.385498046875, -3.1514892578125, -2.91748046875, -2.6834716796875, -2.449462890625, -2.2154541015625, -1.9814453125, -1.7474365234375, -1.513427734375, -1.2794189453125, -1.04541015625, -0.8114013671875, -0.577392578125, -0.3433837890625, -0.109375, 0.1246337890625, 0.358642578125, 0.5926513671875, 0.82666015625, 1.0606689453125, 1.294677734375, 1.5286865234375, 1.7626953125, 1.9967041015625, 2.230712890625, 2.4647216796875, 2.69873046875, 2.9327392578125, 3.166748046875, 3.4007568359375, 3.634765625, 3.8687744140625, 4.102783203125, 4.3367919921875, 4.57080078125, 4.8048095703125, 5.038818359375, 5.2728271484375, 5.5068359375, 5.7408447265625, 5.974853515625, 6.2088623046875, 6.44287109375, 6.6768798828125, 6.910888671875, 7.1448974609375, 7.37890625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 6.0, 4.0, 10.0, 15.0, 14.0, 14.0, 35.0, 39.0, 37.0, 48.0, 58.0, 102.0, 124.0, 147.0, 203.0, 265.0, 318.0, 420.0, 391.0, 399.0, 327.0, 247.0, 184.0, 160.0, 125.0, 78.0, 68.0, 61.0, 46.0, 32.0, 26.0, 18.0, 12.0, 9.0, 5.0, 8.0, 7.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.3671875, -5.21148681640625, -5.0557861328125, -4.90008544921875, -4.744384765625, -4.58868408203125, -4.4329833984375, -4.27728271484375, -4.12158203125, -3.96588134765625, -3.8101806640625, -3.65447998046875, -3.498779296875, -3.34307861328125, -3.1873779296875, -3.03167724609375, -2.8759765625, -2.72027587890625, -2.5645751953125, -2.40887451171875, -2.253173828125, -2.09747314453125, -1.9417724609375, -1.78607177734375, -1.63037109375, -1.47467041015625, -1.3189697265625, -1.16326904296875, -1.007568359375, -0.85186767578125, -0.6961669921875, -0.54046630859375, -0.384765625, -0.22906494140625, -0.0733642578125, 0.08233642578125, 0.238037109375, 0.39373779296875, 0.5494384765625, 0.70513916015625, 0.86083984375, 1.01654052734375, 1.1722412109375, 1.32794189453125, 1.483642578125, 1.63934326171875, 1.7950439453125, 1.95074462890625, 2.1064453125, 2.26214599609375, 2.4178466796875, 2.57354736328125, 2.729248046875, 2.88494873046875, 3.0406494140625, 3.19635009765625, 3.35205078125, 3.50775146484375, 3.6634521484375, 3.81915283203125, 3.974853515625, 4.13055419921875, 4.2862548828125, 4.44195556640625, 4.59765625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 7.0, 7.0, 13.0, 16.0, 20.0, 23.0, 34.0, 41.0, 67.0, 68.0, 103.0, 129.0, 184.0, 244.0, 477.0, 1327.0, 6561.0, 62774.0, 1332953.0, 2658710.0, 116775.0, 10319.0, 1814.0, 594.0, 281.0, 191.0, 132.0, 93.0, 90.0, 67.0, 36.0, 35.0, 25.0, 19.0, 9.0, 8.0, 8.0, 6.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.953125, -13.473876953125, -12.99462890625, -12.515380859375, -12.0361328125, -11.556884765625, -11.07763671875, -10.598388671875, -10.119140625, -9.639892578125, -9.16064453125, -8.681396484375, -8.2021484375, -7.722900390625, -7.24365234375, -6.764404296875, -6.28515625, -5.805908203125, -5.32666015625, -4.847412109375, -4.3681640625, -3.888916015625, -3.40966796875, -2.930419921875, -2.451171875, -1.971923828125, -1.49267578125, -1.013427734375, -0.5341796875, -0.054931640625, 0.42431640625, 0.903564453125, 1.3828125, 1.862060546875, 2.34130859375, 2.820556640625, 3.2998046875, 3.779052734375, 4.25830078125, 4.737548828125, 5.216796875, 5.696044921875, 6.17529296875, 6.654541015625, 7.1337890625, 7.613037109375, 8.09228515625, 8.571533203125, 9.05078125, 9.530029296875, 10.00927734375, 10.488525390625, 10.9677734375, 11.447021484375, 11.92626953125, 12.405517578125, 12.884765625, 13.364013671875, 13.84326171875, 14.322509765625, 14.8017578125, 15.281005859375, 15.76025390625, 16.239501953125, 16.71875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 12.0, 28.0, 41.0, 83.0, 146.0, 188.0, 187.0, 143.0, 92.0, 53.0, 16.0, 13.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.303102493286133, -10.067081451416016, -8.831060409545898, -7.595038890838623, -6.359017848968506, -5.122996807098389, -3.8869752883911133, -2.650954246520996, -1.414933204650879, -0.17891204357147217, 1.0571091175079346, 2.293130397796631, 3.529151439666748, 4.765172481536865, 6.001194000244141, 7.237215042114258, 8.473236083984375, 9.709257125854492, 10.94527816772461, 12.181299209594727, 13.417320251464844, 14.653341293334961, 15.889363288879395, 17.125385284423828, 18.361404418945312, 19.59742546081543, 20.833446502685547, 22.069467544555664, 23.30548858642578, 24.5415096282959, 25.777530670166016, 27.013553619384766, 28.249576568603516, 29.485597610473633, 30.72161865234375, 31.957639694213867, 33.193660736083984, 34.429683685302734, 35.66570281982422, 36.90172576904297, 38.13774490356445, 39.3737678527832, 40.60978698730469, 41.84580993652344, 43.08182907104492, 44.31785202026367, 45.553871154785156, 46.789894104003906, 48.025917053222656, 49.261940002441406, 50.49795913696289, 51.73398208618164, 52.970001220703125, 54.206024169921875, 55.44204330444336, 56.67806625366211, 57.914085388183594, 59.150108337402344, 60.38612747192383, 61.62215042114258, 62.85816955566406, 64.09419250488281, 65.33021545410156, 66.56623077392578, 67.80225372314453]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 4.0, 3.0, 11.0, 16.0, 10.0, 13.0, 20.0, 12.0, 23.0, 19.0, 25.0, 24.0, 32.0, 31.0, 27.0, 35.0, 42.0, 37.0, 45.0, 50.0, 33.0, 40.0, 46.0, 38.0, 50.0, 38.0, 30.0, 33.0, 21.0, 35.0, 31.0, 21.0, 14.0, 11.0, 12.0, 12.0, 14.0, 6.0, 8.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.468196868896484, -15.89360237121582, -15.319007873535156, -14.744413375854492, -14.169818878173828, -13.595224380493164, -13.0206298828125, -12.446035385131836, -11.871440887451172, -11.296846389770508, -10.722251892089844, -10.14765739440918, -9.573062896728516, -8.998468399047852, -8.423873901367188, -7.849279880523682, -7.274685859680176, -6.700091361999512, -6.125496864318848, -5.550902366638184, -4.9763078689575195, -4.4017133712768555, -3.8271193504333496, -3.2525248527526855, -2.6779303550720215, -2.1033358573913574, -1.528741478919983, -0.9541471004486084, -0.37955260276794434, 0.19504189491271973, 0.7696361541748047, 1.3442306518554688, 1.9188251495361328, 2.493419647216797, 3.068014144897461, 3.642608404159546, 4.217203140258789, 4.791797637939453, 5.366391658782959, 5.940986156463623, 6.515580654144287, 7.090175151824951, 7.664769649505615, 8.239363670349121, 8.813958168029785, 9.38855266571045, 9.963147163391113, 10.537741661071777, 11.112336158752441, 11.686930656433105, 12.26152515411377, 12.836119651794434, 13.410714149475098, 13.985308647155762, 14.55990219116211, 15.134496688842773, 15.709091186523438, 16.2836856842041, 16.858280181884766, 17.43287467956543, 18.007469177246094, 18.582063674926758, 19.156658172607422, 19.731252670288086, 20.30584716796875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 0.0, 2.0, 2.0, 4.0, 15.0, 10.0, 16.0, 20.0, 12.0, 17.0, 23.0, 22.0, 23.0, 31.0, 29.0, 40.0, 41.0, 25.0, 45.0, 55.0, 42.0, 39.0, 40.0, 39.0, 34.0, 48.0, 28.0, 45.0, 33.0, 33.0, 25.0, 22.0, 24.0, 16.0, 18.0, 16.0, 20.0, 15.0, 3.0, 6.0, 4.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.625, -3.514434814453125, -3.40386962890625, -3.293304443359375, -3.1827392578125, -3.072174072265625, -2.96160888671875, -2.851043701171875, -2.740478515625, -2.629913330078125, -2.51934814453125, -2.408782958984375, -2.2982177734375, -2.187652587890625, -2.07708740234375, -1.966522216796875, -1.85595703125, -1.745391845703125, -1.63482666015625, -1.524261474609375, -1.4136962890625, -1.303131103515625, -1.19256591796875, -1.082000732421875, -0.971435546875, -0.860870361328125, -0.75030517578125, -0.639739990234375, -0.5291748046875, -0.418609619140625, -0.30804443359375, -0.197479248046875, -0.0869140625, 0.023651123046875, 0.13421630859375, 0.244781494140625, 0.3553466796875, 0.465911865234375, 0.57647705078125, 0.687042236328125, 0.797607421875, 0.908172607421875, 1.01873779296875, 1.129302978515625, 1.2398681640625, 1.350433349609375, 1.46099853515625, 1.571563720703125, 1.68212890625, 1.792694091796875, 1.90325927734375, 2.013824462890625, 2.1243896484375, 2.234954833984375, 2.34552001953125, 2.456085205078125, 2.566650390625, 2.677215576171875, 2.78778076171875, 2.898345947265625, 3.0089111328125, 3.119476318359375, 3.23004150390625, 3.340606689453125, 3.451171875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 7.0, 6.0, 8.0, 9.0, 12.0, 30.0, 35.0, 50.0, 74.0, 103.0, 161.0, 181.0, 296.0, 383.0, 606.0, 758.0, 1221.0, 1636.0, 2405.0, 3604.0, 5046.0, 7224.0, 10639.0, 15811.0, 24064.0, 35783.0, 56084.0, 92623.0, 181005.0, 264275.0, 131486.0, 73998.0, 45826.0, 30291.0, 20135.0, 13322.0, 9001.0, 6068.0, 4445.0, 3001.0, 2176.0, 1327.0, 981.0, 693.0, 528.0, 332.0, 242.0, 171.0, 108.0, 102.0, 61.0, 47.0, 32.0, 21.0, 12.0, 10.0, 4.0, 4.0, 5.0, 2.0, 2.0], "bins": [-0.016387939453125, -0.015880346298217773, -0.015372753143310547, -0.01486515998840332, -0.014357566833496094, -0.013849973678588867, -0.01334238052368164, -0.012834787368774414, -0.012327194213867188, -0.011819601058959961, -0.011312007904052734, -0.010804414749145508, -0.010296821594238281, -0.009789228439331055, -0.009281635284423828, -0.008774042129516602, -0.008266448974609375, -0.0077588558197021484, -0.007251262664794922, -0.006743669509887695, -0.006236076354980469, -0.005728483200073242, -0.005220890045166016, -0.004713296890258789, -0.0042057037353515625, -0.003698110580444336, -0.0031905174255371094, -0.002682924270629883, -0.0021753311157226562, -0.0016677379608154297, -0.0011601448059082031, -0.0006525516510009766, -0.00014495849609375, 0.00036263465881347656, 0.0008702278137207031, 0.0013778209686279297, 0.0018854141235351562, 0.002393007278442383, 0.0029006004333496094, 0.003408193588256836, 0.0039157867431640625, 0.004423379898071289, 0.004930973052978516, 0.005438566207885742, 0.005946159362792969, 0.006453752517700195, 0.006961345672607422, 0.0074689388275146484, 0.007976531982421875, 0.008484125137329102, 0.008991718292236328, 0.009499311447143555, 0.010006904602050781, 0.010514497756958008, 0.011022090911865234, 0.011529684066772461, 0.012037277221679688, 0.012544870376586914, 0.01305246353149414, 0.013560056686401367, 0.014067649841308594, 0.01457524299621582, 0.015082836151123047, 0.015590429306030273, 0.0160980224609375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 4.0, 6.0, 3.0, 3.0, 6.0, 8.0, 8.0, 16.0, 16.0, 18.0, 17.0, 22.0, 22.0, 25.0, 34.0, 42.0, 39.0, 42.0, 38.0, 58.0, 50.0, 1073.0, 40.0, 57.0, 47.0, 43.0, 56.0, 38.0, 29.0, 27.0, 18.0, 31.0, 19.0, 13.0, 16.0, 11.0, 8.0, 6.0, 7.0, 2.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4296875, -2.351715087890625, -2.27374267578125, -2.195770263671875, -2.1177978515625, -2.039825439453125, -1.96185302734375, -1.883880615234375, -1.805908203125, -1.727935791015625, -1.64996337890625, -1.571990966796875, -1.4940185546875, -1.416046142578125, -1.33807373046875, -1.260101318359375, -1.18212890625, -1.104156494140625, -1.02618408203125, -0.948211669921875, -0.8702392578125, -0.792266845703125, -0.71429443359375, -0.636322021484375, -0.558349609375, -0.480377197265625, -0.40240478515625, -0.324432373046875, -0.2464599609375, -0.168487548828125, -0.09051513671875, -0.012542724609375, 0.0654296875, 0.143402099609375, 0.22137451171875, 0.299346923828125, 0.3773193359375, 0.455291748046875, 0.53326416015625, 0.611236572265625, 0.689208984375, 0.767181396484375, 0.84515380859375, 0.923126220703125, 1.0010986328125, 1.079071044921875, 1.15704345703125, 1.235015869140625, 1.31298828125, 1.390960693359375, 1.46893310546875, 1.546905517578125, 1.6248779296875, 1.702850341796875, 1.78082275390625, 1.858795166015625, 1.936767578125, 2.014739990234375, 2.09271240234375, 2.170684814453125, 2.2486572265625, 2.326629638671875, 2.40460205078125, 2.482574462890625, 2.560546875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 9.0, 16.0, 14.0, 24.0, 30.0, 52.0, 77.0, 109.0, 156.0, 270.0, 338.0, 542.0, 858.0, 1196.0, 2023.0, 3131.0, 4907.0, 7938.0, 12719.0, 21932.0, 37702.0, 70248.0, 147672.0, 1389621.0, 197703.0, 86475.0, 45386.0, 25706.0, 15262.0, 9143.0, 5855.0, 3469.0, 2287.0, 1481.0, 919.0, 597.0, 440.0, 292.0, 197.0, 111.0, 78.0, 51.0, 34.0, 24.0, 15.0, 10.0, 6.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.01522064208984375, -0.014754533767700195, -0.01428842544555664, -0.013822317123413086, -0.013356208801269531, -0.012890100479125977, -0.012423992156982422, -0.011957883834838867, -0.011491775512695312, -0.011025667190551758, -0.010559558868408203, -0.010093450546264648, -0.009627342224121094, -0.009161233901977539, -0.008695125579833984, -0.00822901725769043, -0.007762908935546875, -0.00729680061340332, -0.006830692291259766, -0.006364583969116211, -0.005898475646972656, -0.0054323673248291016, -0.004966259002685547, -0.004500150680541992, -0.0040340423583984375, -0.003567934036254883, -0.003101825714111328, -0.0026357173919677734, -0.0021696090698242188, -0.001703500747680664, -0.0012373924255371094, -0.0007712841033935547, -0.00030517578125, 0.0001609325408935547, 0.0006270408630371094, 0.001093149185180664, 0.0015592575073242188, 0.0020253658294677734, 0.002491474151611328, 0.002957582473754883, 0.0034236907958984375, 0.003889799118041992, 0.004355907440185547, 0.0048220157623291016, 0.005288124084472656, 0.005754232406616211, 0.006220340728759766, 0.00668644905090332, 0.007152557373046875, 0.00761866569519043, 0.008084774017333984, 0.008550882339477539, 0.009016990661621094, 0.009483098983764648, 0.009949207305908203, 0.010415315628051758, 0.010881423950195312, 0.011347532272338867, 0.011813640594482422, 0.012279748916625977, 0.012745857238769531, 0.013211965560913086, 0.01367807388305664, 0.014144182205200195, 0.01461029052734375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 119.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 717.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 134.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-07, -2.300366759300232e-07, -2.2165477275848389e-07, -2.1327286958694458e-07, -2.0489096641540527e-07, -1.9650906324386597e-07, -1.8812716007232666e-07, -1.7974525690078735e-07, -1.7136335372924805e-07, -1.6298145055770874e-07, -1.5459954738616943e-07, -1.4621764421463013e-07, -1.3783574104309082e-07, -1.2945383787155151e-07, -1.210719347000122e-07, -1.126900315284729e-07, -1.043081283569336e-07, -9.592622518539429e-08, -8.754432201385498e-08, -7.916241884231567e-08, -7.078051567077637e-08, -6.239861249923706e-08, -5.4016709327697754e-08, -4.563480615615845e-08, -3.725290298461914e-08, -2.8870999813079834e-08, -2.0489096641540527e-08, -1.210719347000122e-08, -3.725290298461914e-09, 4.6566128730773926e-09, 1.30385160446167e-08, 2.1420419216156006e-08, 2.9802322387695312e-08, 3.818422555923462e-08, 4.6566128730773926e-08, 5.494803190231323e-08, 6.332993507385254e-08, 7.171183824539185e-08, 8.009374141693115e-08, 8.847564458847046e-08, 9.685754776000977e-08, 1.0523945093154907e-07, 1.1362135410308838e-07, 1.2200325727462769e-07, 1.30385160446167e-07, 1.387670636177063e-07, 1.471489667892456e-07, 1.555308699607849e-07, 1.6391277313232422e-07, 1.7229467630386353e-07, 1.8067657947540283e-07, 1.8905848264694214e-07, 1.9744038581848145e-07, 2.0582228899002075e-07, 2.1420419216156006e-07, 2.2258609533309937e-07, 2.3096799850463867e-07, 2.39349901676178e-07, 2.477318048477173e-07, 2.561137080192566e-07, 2.644956111907959e-07, 2.728775143623352e-07, 2.812594175338745e-07, 2.896413207054138e-07, 2.980232238769531e-07]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 10.0, 5.0, 2.0, 0.0, 4.0, 1.0, 17.0, 60.0, 77.0, 6.0, 6.0, 91.0, 113.0, 273.0, 8753.0, 1029750.0, 8736.0, 284.0, 103.0, 91.0, 5.0, 36.0, 88.0, 16.0, 2.0, 7.0, 1.0, 0.0, 3.0, 7.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.258487701416016e-06, -6.081536412239075e-06, -5.904585123062134e-06, -5.727633833885193e-06, -5.550682544708252e-06, -5.373731255531311e-06, -5.19677996635437e-06, -5.019828677177429e-06, -4.842877388000488e-06, -4.665926098823547e-06, -4.4889748096466064e-06, -4.3120235204696655e-06, -4.135072231292725e-06, -3.958120942115784e-06, -3.7811696529388428e-06, -3.604218363761902e-06, -3.427267074584961e-06, -3.25031578540802e-06, -3.073364496231079e-06, -2.896413207054138e-06, -2.7194619178771973e-06, -2.5425106287002563e-06, -2.3655593395233154e-06, -2.1886080503463745e-06, -2.0116567611694336e-06, -1.8347054719924927e-06, -1.6577541828155518e-06, -1.4808028936386108e-06, -1.30385160446167e-06, -1.126900315284729e-06, -9.499490261077881e-07, -7.729977369308472e-07, -5.960464477539062e-07, -4.1909515857696533e-07, -2.421438694000244e-07, -6.51925802230835e-08, 1.1175870895385742e-07, 2.8870999813079834e-07, 4.6566128730773926e-07, 6.426125764846802e-07, 8.195638656616211e-07, 9.96515154838562e-07, 1.173466444015503e-06, 1.3504177331924438e-06, 1.5273690223693848e-06, 1.7043203115463257e-06, 1.8812716007232666e-06, 2.0582228899002075e-06, 2.2351741790771484e-06, 2.4121254682540894e-06, 2.5890767574310303e-06, 2.766028046607971e-06, 2.942979335784912e-06, 3.119930624961853e-06, 3.296881914138794e-06, 3.473833203315735e-06, 3.6507844924926758e-06, 3.827735781669617e-06, 4.004687070846558e-06, 4.1816383600234985e-06, 4.3585896492004395e-06, 4.53554093837738e-06, 4.712492227554321e-06, 4.889443516731262e-06, 5.066394805908203e-06]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1004.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.492702908644787e-08, -5.963182303503345e-08, -5.4336616983619024e-08, -4.90414109322046e-08, -4.3746204880790174e-08, -3.845099882937575e-08, -3.3155792777961324e-08, -2.78605867265469e-08, -2.2565380675132474e-08, -1.727017462371805e-08, -1.1974968572303624e-08, -6.679762520889199e-09, -1.3845564694747736e-09, 3.910649581939651e-09, 9.205855633354076e-09, 1.4501061684768501e-08, 1.9796267736182926e-08, 2.509147378759735e-08, 3.0386679839011776e-08, 3.56818858904262e-08, 4.0977091941840627e-08, 4.627229799325505e-08, 5.1567504044669477e-08, 5.68627100960839e-08, 6.215791614749833e-08, 6.745312219891275e-08, 7.274832825032718e-08, 7.80435343017416e-08, 8.333874035315603e-08, 8.863394640457045e-08, 9.392915245598488e-08, 9.92243585073993e-08, 1.0451955745338637e-07, 1.098147635048008e-07, 1.1510996955621522e-07, 1.2040517560762964e-07, 1.2570038165904407e-07, 1.309955877104585e-07, 1.3629079376187292e-07, 1.4158599981328734e-07, 1.4688120586470177e-07, 1.521764119161162e-07, 1.5747161796753062e-07, 1.6276682401894504e-07, 1.6806203007035947e-07, 1.733572361217739e-07, 1.7865244217318832e-07, 1.8394764822460274e-07, 1.8924285427601717e-07, 1.945380603274316e-07, 1.9983326637884602e-07, 2.0512847243026044e-07, 2.1042367848167487e-07, 2.157188845330893e-07, 2.2101409058450372e-07, 2.2630929663591814e-07, 2.3160450268733257e-07, 2.36899708738747e-07, 2.421949147901614e-07, 2.4749010663072113e-07, 2.5278532689299027e-07, 2.580805471552594e-07, 2.633757389958191e-07, 2.6867093083637883e-07, 2.7396615109864797e-07]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1005.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 0.0, 2.0, 2.0, 4.0, 15.0, 10.0, 16.0, 20.0, 12.0, 17.0, 23.0, 22.0, 23.0, 31.0, 29.0, 40.0, 41.0, 25.0, 45.0, 55.0, 42.0, 39.0, 40.0, 39.0, 34.0, 48.0, 28.0, 45.0, 33.0, 33.0, 25.0, 22.0, 24.0, 16.0, 18.0, 16.0, 20.0, 15.0, 3.0, 6.0, 4.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.625, -3.514434814453125, -3.40386962890625, -3.293304443359375, -3.1827392578125, -3.072174072265625, -2.96160888671875, -2.851043701171875, -2.740478515625, -2.629913330078125, -2.51934814453125, -2.408782958984375, -2.2982177734375, -2.187652587890625, -2.07708740234375, -1.966522216796875, -1.85595703125, -1.745391845703125, -1.63482666015625, -1.524261474609375, -1.4136962890625, -1.303131103515625, -1.19256591796875, -1.082000732421875, -0.971435546875, -0.860870361328125, -0.75030517578125, -0.639739990234375, -0.5291748046875, -0.418609619140625, -0.30804443359375, -0.197479248046875, -0.0869140625, 0.023651123046875, 0.13421630859375, 0.244781494140625, 0.3553466796875, 0.465911865234375, 0.57647705078125, 0.687042236328125, 0.797607421875, 0.908172607421875, 1.01873779296875, 1.129302978515625, 1.2398681640625, 1.350433349609375, 1.46099853515625, 1.571563720703125, 1.68212890625, 1.792694091796875, 1.90325927734375, 2.013824462890625, 2.1243896484375, 2.234954833984375, 2.34552001953125, 2.456085205078125, 2.566650390625, 2.677215576171875, 2.78778076171875, 2.898345947265625, 3.0089111328125, 3.119476318359375, 3.23004150390625, 3.340606689453125, 3.451171875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 11.0, 0.0, 7.0, 8.0, 6.0, 24.0, 25.0, 38.0, 36.0, 50.0, 73.0, 92.0, 140.0, 188.0, 275.0, 521.0, 1042.0, 2021.0, 4326.0, 10607.0, 26822.0, 83991.0, 682849.0, 168543.0, 39908.0, 15031.0, 5978.0, 2722.0, 1330.0, 705.0, 401.0, 197.0, 136.0, 111.0, 72.0, 59.0, 44.0, 50.0, 34.0, 16.0, 17.0, 9.0, 9.0, 9.0, 7.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.890625, -6.67987060546875, -6.4691162109375, -6.25836181640625, -6.047607421875, -5.83685302734375, -5.6260986328125, -5.41534423828125, -5.20458984375, -4.99383544921875, -4.7830810546875, -4.57232666015625, -4.361572265625, -4.15081787109375, -3.9400634765625, -3.72930908203125, -3.5185546875, -3.30780029296875, -3.0970458984375, -2.88629150390625, -2.675537109375, -2.46478271484375, -2.2540283203125, -2.04327392578125, -1.83251953125, -1.62176513671875, -1.4110107421875, -1.20025634765625, -0.989501953125, -0.77874755859375, -0.5679931640625, -0.35723876953125, -0.146484375, 0.06427001953125, 0.2750244140625, 0.48577880859375, 0.696533203125, 0.90728759765625, 1.1180419921875, 1.32879638671875, 1.53955078125, 1.75030517578125, 1.9610595703125, 2.17181396484375, 2.382568359375, 2.59332275390625, 2.8040771484375, 3.01483154296875, 3.2255859375, 3.43634033203125, 3.6470947265625, 3.85784912109375, 4.068603515625, 4.27935791015625, 4.4901123046875, 4.70086669921875, 4.91162109375, 5.12237548828125, 5.3331298828125, 5.54388427734375, 5.754638671875, 5.96539306640625, 6.1761474609375, 6.38690185546875, 6.59765625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 9.0, 2.0, 2.0, 13.0, 11.0, 10.0, 24.0, 16.0, 30.0, 20.0, 30.0, 30.0, 45.0, 40.0, 49.0, 58.0, 61.0, 114.0, 1542.0, 401.0, 97.0, 52.0, 52.0, 47.0, 33.0, 43.0, 27.0, 30.0, 37.0, 25.0, 17.0, 25.0, 10.0, 6.0, 12.0, 9.0, 6.0, 7.0, 3.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.9609375, -11.6185302734375, -11.276123046875, -10.9337158203125, -10.59130859375, -10.2489013671875, -9.906494140625, -9.5640869140625, -9.2216796875, -8.8792724609375, -8.536865234375, -8.1944580078125, -7.85205078125, -7.5096435546875, -7.167236328125, -6.8248291015625, -6.482421875, -6.1400146484375, -5.797607421875, -5.4552001953125, -5.11279296875, -4.7703857421875, -4.427978515625, -4.0855712890625, -3.7431640625, -3.4007568359375, -3.058349609375, -2.7159423828125, -2.37353515625, -2.0311279296875, -1.688720703125, -1.3463134765625, -1.00390625, -0.6614990234375, -0.319091796875, 0.0233154296875, 0.36572265625, 0.7081298828125, 1.050537109375, 1.3929443359375, 1.7353515625, 2.0777587890625, 2.420166015625, 2.7625732421875, 3.10498046875, 3.4473876953125, 3.789794921875, 4.1322021484375, 4.474609375, 4.8170166015625, 5.159423828125, 5.5018310546875, 5.84423828125, 6.1866455078125, 6.529052734375, 6.8714599609375, 7.2138671875, 7.5562744140625, 7.898681640625, 8.2410888671875, 8.58349609375, 8.9259033203125, 9.268310546875, 9.6107177734375, 9.953125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 9.0, 4.0, 7.0, 14.0, 11.0, 17.0, 29.0, 15.0, 30.0, 40.0, 46.0, 56.0, 91.0, 113.0, 188.0, 343.0, 1026.0, 10175.0, 713567.0, 2404028.0, 13559.0, 1296.0, 363.0, 214.0, 120.0, 79.0, 53.0, 42.0, 35.0, 34.0, 28.0, 14.0, 18.0, 10.0, 12.0, 3.0, 3.0, 10.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.859375, -19.17578125, -18.4921875, -17.80859375, -17.125, -16.44140625, -15.7578125, -15.07421875, -14.390625, -13.70703125, -13.0234375, -12.33984375, -11.65625, -10.97265625, -10.2890625, -9.60546875, -8.921875, -8.23828125, -7.5546875, -6.87109375, -6.1875, -5.50390625, -4.8203125, -4.13671875, -3.453125, -2.76953125, -2.0859375, -1.40234375, -0.71875, -0.03515625, 0.6484375, 1.33203125, 2.015625, 2.69921875, 3.3828125, 4.06640625, 4.75, 5.43359375, 6.1171875, 6.80078125, 7.484375, 8.16796875, 8.8515625, 9.53515625, 10.21875, 10.90234375, 11.5859375, 12.26953125, 12.953125, 13.63671875, 14.3203125, 15.00390625, 15.6875, 16.37109375, 17.0546875, 17.73828125, 18.421875, 19.10546875, 19.7890625, 20.47265625, 21.15625, 21.83984375, 22.5234375, 23.20703125, 23.890625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 14.0, 31.0, 63.0, 181.0, 247.0, 248.0, 142.0, 61.0, 18.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.3286018371582, -34.506431579589844, -33.684261322021484, -32.862091064453125, -32.039920806884766, -31.21775245666504, -30.39558219909668, -29.573413848876953, -28.751243591308594, -27.929073333740234, -27.106903076171875, -26.28473472595215, -25.46256446838379, -24.64039421081543, -23.81822395324707, -22.996055603027344, -22.173885345458984, -21.351715087890625, -20.529544830322266, -19.70737648010254, -18.88520622253418, -18.06303596496582, -17.24086570739746, -16.418697357177734, -15.596525192260742, -14.774354934692383, -13.95218563079834, -13.13001537322998, -12.307846069335938, -11.485675811767578, -10.663505554199219, -9.841336250305176, -9.019166946411133, -8.196996688842773, -7.3748273849487305, -6.552657127380371, -5.730487823486328, -4.908317565917969, -4.086147785186768, -3.2639780044555664, -2.4418082237243652, -1.619638442993164, -0.7974685430526733, 0.024701356887817383, 0.8468711376190186, 1.6690411567687988, 2.4912109375, 3.313380718231201, 4.135550498962402, 4.9577202796936035, 5.779890060424805, 6.602060317993164, 7.424229621887207, 8.246399879455566, 9.06856918334961, 9.890739440917969, 10.712909698486328, 11.535079956054688, 12.35724925994873, 13.17941951751709, 14.001588821411133, 14.823759078979492, 15.645929336547852, 16.468097686767578, 17.290267944335938]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 3.0, 8.0, 10.0, 17.0, 11.0, 23.0, 28.0, 20.0, 37.0, 25.0, 38.0, 34.0, 35.0, 53.0, 52.0, 38.0, 48.0, 42.0, 39.0, 45.0, 38.0, 48.0, 35.0, 35.0, 41.0, 29.0, 30.0, 21.0, 14.0, 15.0, 14.0, 14.0, 11.0, 13.0, 6.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.01033592224121, -29.10943031311035, -28.208524703979492, -27.3076171875, -26.40671157836914, -25.50580596923828, -24.604900360107422, -23.703994750976562, -22.803089141845703, -21.902183532714844, -21.001277923583984, -20.100372314453125, -19.199464797973633, -18.298559188842773, -17.397653579711914, -16.496747970581055, -15.595840454101562, -14.694934844970703, -13.794028282165527, -12.893122673034668, -11.992216110229492, -11.091310501098633, -10.190404891967773, -9.289499282836914, -8.388592720031738, -7.487686634063721, -6.586780548095703, -5.685874938964844, -4.784968852996826, -3.8840627670288086, -2.983157157897949, -2.0822510719299316, -1.1813430786132812, -0.2804371118545532, 0.6204688549041748, 1.5213747024536133, 2.422280788421631, 3.3231868743896484, 4.224092483520508, 5.124998569488525, 6.025904655456543, 6.9268107414245605, 7.827716827392578, 8.728622436523438, 9.629528045654297, 10.530434608459473, 11.431340217590332, 12.332246780395508, 13.233152389526367, 14.134057998657227, 15.034964561462402, 15.935870170593262, 16.836776733398438, 17.737682342529297, 18.638587951660156, 19.539493560791016, 20.440399169921875, 21.341304779052734, 22.242210388183594, 23.143115997314453, 24.044023513793945, 24.944929122924805, 25.845834732055664, 26.746740341186523, 27.647647857666016]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 6.0, 11.0, 7.0, 15.0, 19.0, 10.0, 22.0, 18.0, 19.0, 24.0, 29.0, 27.0, 30.0, 35.0, 37.0, 37.0, 34.0, 43.0, 41.0, 49.0, 37.0, 42.0, 39.0, 39.0, 36.0, 36.0, 27.0, 31.0, 30.0, 27.0, 24.0, 17.0, 14.0, 16.0, 14.0, 9.0, 11.0, 7.0, 8.0, 4.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.50390625, -3.393096923828125, -3.28228759765625, -3.171478271484375, -3.0606689453125, -2.949859619140625, -2.83905029296875, -2.728240966796875, -2.617431640625, -2.506622314453125, -2.39581298828125, -2.285003662109375, -2.1741943359375, -2.063385009765625, -1.95257568359375, -1.841766357421875, -1.73095703125, -1.620147705078125, -1.50933837890625, -1.398529052734375, -1.2877197265625, -1.176910400390625, -1.06610107421875, -0.955291748046875, -0.844482421875, -0.733673095703125, -0.62286376953125, -0.512054443359375, -0.4012451171875, -0.290435791015625, -0.17962646484375, -0.068817138671875, 0.0419921875, 0.152801513671875, 0.26361083984375, 0.374420166015625, 0.4852294921875, 0.596038818359375, 0.70684814453125, 0.817657470703125, 0.928466796875, 1.039276123046875, 1.15008544921875, 1.260894775390625, 1.3717041015625, 1.482513427734375, 1.59332275390625, 1.704132080078125, 1.81494140625, 1.925750732421875, 2.03656005859375, 2.147369384765625, 2.2581787109375, 2.368988037109375, 2.47979736328125, 2.590606689453125, 2.701416015625, 2.812225341796875, 2.92303466796875, 3.033843994140625, 3.1446533203125, 3.255462646484375, 3.36627197265625, 3.477081298828125, 3.587890625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 4.0, 8.0, 7.0, 9.0, 15.0, 18.0, 24.0, 40.0, 50.0, 98.0, 181.0, 317.0, 595.0, 1354.0, 3054.0, 7793.0, 22460.0, 76467.0, 364329.0, 2091854.0, 1338226.0, 209682.0, 50908.0, 16085.0, 5997.0, 2393.0, 1069.0, 571.0, 275.0, 135.0, 87.0, 37.0, 50.0, 17.0, 24.0, 13.0, 13.0, 6.0, 5.0, 8.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.0703125, -7.84515380859375, -7.6199951171875, -7.39483642578125, -7.169677734375, -6.94451904296875, -6.7193603515625, -6.49420166015625, -6.26904296875, -6.04388427734375, -5.8187255859375, -5.59356689453125, -5.368408203125, -5.14324951171875, -4.9180908203125, -4.69293212890625, -4.4677734375, -4.24261474609375, -4.0174560546875, -3.79229736328125, -3.567138671875, -3.34197998046875, -3.1168212890625, -2.89166259765625, -2.66650390625, -2.44134521484375, -2.2161865234375, -1.99102783203125, -1.765869140625, -1.54071044921875, -1.3155517578125, -1.09039306640625, -0.865234375, -0.64007568359375, -0.4149169921875, -0.18975830078125, 0.035400390625, 0.26055908203125, 0.4857177734375, 0.71087646484375, 0.93603515625, 1.16119384765625, 1.3863525390625, 1.61151123046875, 1.836669921875, 2.06182861328125, 2.2869873046875, 2.51214599609375, 2.7373046875, 2.96246337890625, 3.1876220703125, 3.41278076171875, 3.637939453125, 3.86309814453125, 4.0882568359375, 4.31341552734375, 4.53857421875, 4.76373291015625, 4.9888916015625, 5.21405029296875, 5.439208984375, 5.66436767578125, 5.8895263671875, 6.11468505859375, 6.33984375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 6.0, 7.0, 8.0, 18.0, 22.0, 20.0, 21.0, 43.0, 55.0, 70.0, 88.0, 117.0, 129.0, 218.0, 268.0, 299.0, 386.0, 452.0, 397.0, 310.0, 261.0, 202.0, 144.0, 112.0, 88.0, 70.0, 67.0, 40.0, 31.0, 33.0, 19.0, 13.0, 17.0, 10.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.87109375, -4.71136474609375, -4.5516357421875, -4.39190673828125, -4.232177734375, -4.07244873046875, -3.9127197265625, -3.75299072265625, -3.59326171875, -3.43353271484375, -3.2738037109375, -3.11407470703125, -2.954345703125, -2.79461669921875, -2.6348876953125, -2.47515869140625, -2.3154296875, -2.15570068359375, -1.9959716796875, -1.83624267578125, -1.676513671875, -1.51678466796875, -1.3570556640625, -1.19732666015625, -1.03759765625, -0.87786865234375, -0.7181396484375, -0.55841064453125, -0.398681640625, -0.23895263671875, -0.0792236328125, 0.08050537109375, 0.240234375, 0.39996337890625, 0.5596923828125, 0.71942138671875, 0.879150390625, 1.03887939453125, 1.1986083984375, 1.35833740234375, 1.51806640625, 1.67779541015625, 1.8375244140625, 1.99725341796875, 2.156982421875, 2.31671142578125, 2.4764404296875, 2.63616943359375, 2.7958984375, 2.95562744140625, 3.1153564453125, 3.27508544921875, 3.434814453125, 3.59454345703125, 3.7542724609375, 3.91400146484375, 4.07373046875, 4.23345947265625, 4.3931884765625, 4.55291748046875, 4.712646484375, 4.87237548828125, 5.0321044921875, 5.19183349609375, 5.3515625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 10.0, 9.0, 8.0, 18.0, 18.0, 21.0, 22.0, 37.0, 60.0, 51.0, 76.0, 113.0, 153.0, 179.0, 295.0, 647.0, 2187.0, 10393.0, 77808.0, 1108773.0, 2788851.0, 178739.0, 19953.0, 3698.0, 930.0, 413.0, 208.0, 154.0, 108.0, 92.0, 57.0, 41.0, 35.0, 33.0, 26.0, 10.0, 10.0, 12.0, 11.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.140625, -13.68701171875, -13.2333984375, -12.77978515625, -12.326171875, -11.87255859375, -11.4189453125, -10.96533203125, -10.51171875, -10.05810546875, -9.6044921875, -9.15087890625, -8.697265625, -8.24365234375, -7.7900390625, -7.33642578125, -6.8828125, -6.42919921875, -5.9755859375, -5.52197265625, -5.068359375, -4.61474609375, -4.1611328125, -3.70751953125, -3.25390625, -2.80029296875, -2.3466796875, -1.89306640625, -1.439453125, -0.98583984375, -0.5322265625, -0.07861328125, 0.375, 0.82861328125, 1.2822265625, 1.73583984375, 2.189453125, 2.64306640625, 3.0966796875, 3.55029296875, 4.00390625, 4.45751953125, 4.9111328125, 5.36474609375, 5.818359375, 6.27197265625, 6.7255859375, 7.17919921875, 7.6328125, 8.08642578125, 8.5400390625, 8.99365234375, 9.447265625, 9.90087890625, 10.3544921875, 10.80810546875, 11.26171875, 11.71533203125, 12.1689453125, 12.62255859375, 13.076171875, 13.52978515625, 13.9833984375, 14.43701171875, 14.890625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 13.0, 22.0, 30.0, 41.0, 52.0, 71.0, 82.0, 86.0, 86.0, 115.0, 89.0, 79.0, 76.0, 42.0, 31.0, 31.0, 20.0, 16.0, 5.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.477941513061523, -24.74338150024414, -24.00882339477539, -23.274263381958008, -22.539703369140625, -21.805143356323242, -21.070585250854492, -20.33602523803711, -19.601465225219727, -18.866905212402344, -18.132347106933594, -17.39778709411621, -16.663227081298828, -15.928668022155762, -15.194108963012695, -14.459548950195312, -13.724989891052246, -12.99043083190918, -12.255870819091797, -11.52131175994873, -10.786751747131348, -10.052192687988281, -9.317632675170898, -8.583073616027832, -7.848514080047607, -7.113954544067383, -6.379395008087158, -5.644835472106934, -4.910276412963867, -4.175716400146484, -3.441157341003418, -2.7065978050231934, -1.9720382690429688, -1.2374787330627441, -0.5029193162918091, 0.23164010047912598, 0.9661996364593506, 1.7007591724395752, 2.4353184700012207, 3.1698780059814453, 3.90443754196167, 4.6389970779418945, 5.373556613922119, 6.108116149902344, 6.84267520904541, 7.577235221862793, 8.31179428100586, 9.046354293823242, 9.780913352966309, 10.515472412109375, 11.250032424926758, 11.984591484069824, 12.719151496887207, 13.453710556030273, 14.188270568847656, 14.922829627990723, 15.657388687133789, 16.391948699951172, 17.126506805419922, 17.861066818237305, 18.595626831054688, 19.33018684387207, 20.06474494934082, 20.799304962158203, 21.533864974975586]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 0.0, 3.0, 5.0, 10.0, 16.0, 11.0, 12.0, 12.0, 16.0, 16.0, 23.0, 22.0, 22.0, 37.0, 24.0, 35.0, 40.0, 35.0, 36.0, 50.0, 44.0, 37.0, 48.0, 45.0, 32.0, 35.0, 36.0, 46.0, 28.0, 34.0, 35.0, 28.0, 17.0, 11.0, 16.0, 20.0, 12.0, 14.0, 7.0, 10.0, 8.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-21.35034942626953, -20.72182846069336, -20.093305587768555, -19.464784622192383, -18.836261749267578, -18.207740783691406, -17.5792179107666, -16.95069694519043, -16.322174072265625, -15.693652153015137, -15.065130233764648, -14.43660831451416, -13.808086395263672, -13.1795654296875, -12.551043510437012, -11.922521591186523, -11.294000625610352, -10.665478706359863, -10.036956787109375, -9.408434867858887, -8.779912948608398, -8.151391983032227, -7.522870063781738, -6.89434814453125, -6.265826225280762, -5.637304306030273, -5.008782386779785, -4.380260944366455, -3.751739025115967, -3.1232171058654785, -2.4946954250335693, -1.8661737442016602, -1.2376518249511719, -0.6091300249099731, 0.019391775131225586, 0.6479135751724243, 1.276435375213623, 1.9049572944641113, 2.5334789752960205, 3.1620006561279297, 3.790522575378418, 4.419044494628906, 5.0475664138793945, 5.676087856292725, 6.304609775543213, 6.933131694793701, 7.561653137207031, 8.19017505645752, 8.818696975708008, 9.447218894958496, 10.075740814208984, 10.704262733459473, 11.332784652709961, 11.961305618286133, 12.589827537536621, 13.21834945678711, 13.846871376037598, 14.475393295288086, 15.103915214538574, 15.732437133789062, 16.360958099365234, 16.98948097229004, 17.61800193786621, 18.246524810791016, 18.875045776367188]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 8.0, 8.0, 9.0, 19.0, 16.0, 21.0, 22.0, 16.0, 34.0, 23.0, 39.0, 37.0, 48.0, 41.0, 43.0, 36.0, 49.0, 43.0, 50.0, 47.0, 50.0, 39.0, 41.0, 32.0, 26.0, 34.0, 28.0, 19.0, 15.0, 20.0, 11.0, 13.0, 14.0, 11.0, 11.0, 5.0, 11.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.9375, -3.81298828125, -3.6884765625, -3.56396484375, -3.439453125, -3.31494140625, -3.1904296875, -3.06591796875, -2.94140625, -2.81689453125, -2.6923828125, -2.56787109375, -2.443359375, -2.31884765625, -2.1943359375, -2.06982421875, -1.9453125, -1.82080078125, -1.6962890625, -1.57177734375, -1.447265625, -1.32275390625, -1.1982421875, -1.07373046875, -0.94921875, -0.82470703125, -0.7001953125, -0.57568359375, -0.451171875, -0.32666015625, -0.2021484375, -0.07763671875, 0.046875, 0.17138671875, 0.2958984375, 0.42041015625, 0.544921875, 0.66943359375, 0.7939453125, 0.91845703125, 1.04296875, 1.16748046875, 1.2919921875, 1.41650390625, 1.541015625, 1.66552734375, 1.7900390625, 1.91455078125, 2.0390625, 2.16357421875, 2.2880859375, 2.41259765625, 2.537109375, 2.66162109375, 2.7861328125, 2.91064453125, 3.03515625, 3.15966796875, 3.2841796875, 3.40869140625, 3.533203125, 3.65771484375, 3.7822265625, 3.90673828125, 4.03125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 9.0, 15.0, 14.0, 27.0, 42.0, 50.0, 70.0, 110.0, 183.0, 293.0, 544.0, 949.0, 1673.0, 2784.0, 5041.0, 9262.0, 17215.0, 32718.0, 67378.0, 166938.0, 427891.0, 172627.0, 69866.0, 33304.0, 17802.0, 9638.0, 5358.0, 2895.0, 1554.0, 908.0, 500.0, 336.0, 226.0, 110.0, 90.0, 49.0, 28.0, 20.0, 17.0, 8.0, 1.0, 8.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0296630859375, -0.028750896453857422, -0.027838706970214844, -0.026926517486572266, -0.026014328002929688, -0.02510213851928711, -0.02418994903564453, -0.023277759552001953, -0.022365570068359375, -0.021453380584716797, -0.02054119110107422, -0.01962900161743164, -0.018716812133789062, -0.017804622650146484, -0.016892433166503906, -0.015980243682861328, -0.01506805419921875, -0.014155864715576172, -0.013243675231933594, -0.012331485748291016, -0.011419296264648438, -0.01050710678100586, -0.009594917297363281, -0.008682727813720703, -0.007770538330078125, -0.006858348846435547, -0.005946159362792969, -0.005033969879150391, -0.0041217803955078125, -0.0032095909118652344, -0.0022974014282226562, -0.0013852119445800781, -0.0004730224609375, 0.0004391670227050781, 0.0013513565063476562, 0.0022635459899902344, 0.0031757354736328125, 0.004087924957275391, 0.005000114440917969, 0.005912303924560547, 0.006824493408203125, 0.007736682891845703, 0.008648872375488281, 0.00956106185913086, 0.010473251342773438, 0.011385440826416016, 0.012297630310058594, 0.013209819793701172, 0.01412200927734375, 0.015034198760986328, 0.015946388244628906, 0.016858577728271484, 0.017770767211914062, 0.01868295669555664, 0.01959514617919922, 0.020507335662841797, 0.021419525146484375, 0.022331714630126953, 0.02324390411376953, 0.02415609359741211, 0.025068283081054688, 0.025980472564697266, 0.026892662048339844, 0.027804851531982422, 0.028717041015625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 7.0, 10.0, 10.0, 17.0, 11.0, 14.0, 17.0, 14.0, 25.0, 26.0, 23.0, 27.0, 38.0, 37.0, 33.0, 36.0, 38.0, 33.0, 46.0, 1064.0, 40.0, 38.0, 49.0, 40.0, 37.0, 34.0, 32.0, 22.0, 24.0, 23.0, 24.0, 17.0, 21.0, 16.0, 15.0, 12.0, 12.0, 6.0, 4.0, 6.0, 4.0, 2.0, 7.0, 2.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.16015625, -2.087646484375, -2.01513671875, -1.942626953125, -1.8701171875, -1.797607421875, -1.72509765625, -1.652587890625, -1.580078125, -1.507568359375, -1.43505859375, -1.362548828125, -1.2900390625, -1.217529296875, -1.14501953125, -1.072509765625, -1.0, -0.927490234375, -0.85498046875, -0.782470703125, -0.7099609375, -0.637451171875, -0.56494140625, -0.492431640625, -0.419921875, -0.347412109375, -0.27490234375, -0.202392578125, -0.1298828125, -0.057373046875, 0.01513671875, 0.087646484375, 0.16015625, 0.232666015625, 0.30517578125, 0.377685546875, 0.4501953125, 0.522705078125, 0.59521484375, 0.667724609375, 0.740234375, 0.812744140625, 0.88525390625, 0.957763671875, 1.0302734375, 1.102783203125, 1.17529296875, 1.247802734375, 1.3203125, 1.392822265625, 1.46533203125, 1.537841796875, 1.6103515625, 1.682861328125, 1.75537109375, 1.827880859375, 1.900390625, 1.972900390625, 2.04541015625, 2.117919921875, 2.1904296875, 2.262939453125, 2.33544921875, 2.407958984375, 2.48046875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 9.0, 14.0, 13.0, 15.0, 47.0, 45.0, 118.0, 107.0, 196.0, 262.0, 427.0, 650.0, 840.0, 1362.0, 2033.0, 2897.0, 4468.0, 6875.0, 10571.0, 16489.0, 26264.0, 41700.0, 70555.0, 134304.0, 1342258.0, 199441.0, 92175.0, 52988.0, 32344.0, 20256.0, 12847.0, 8248.0, 5457.0, 3564.0, 2393.0, 1606.0, 1006.0, 704.0, 474.0, 337.0, 250.0, 160.0, 105.0, 73.0, 55.0, 47.0, 32.0, 20.0, 10.0, 6.0, 6.0, 3.0, 4.0, 3.0, 2.0], "bins": [-0.01480865478515625, -0.014369606971740723, -0.013930559158325195, -0.013491511344909668, -0.01305246353149414, -0.012613415718078613, -0.012174367904663086, -0.011735320091247559, -0.011296272277832031, -0.010857224464416504, -0.010418176651000977, -0.00997912883758545, -0.009540081024169922, -0.009101033210754395, -0.008661985397338867, -0.00822293758392334, -0.0077838897705078125, -0.007344841957092285, -0.006905794143676758, -0.0064667463302612305, -0.006027698516845703, -0.005588650703430176, -0.0051496028900146484, -0.004710555076599121, -0.004271507263183594, -0.0038324594497680664, -0.003393411636352539, -0.0029543638229370117, -0.0025153160095214844, -0.002076268196105957, -0.0016372203826904297, -0.0011981725692749023, -0.000759124755859375, -0.00032007694244384766, 0.00011897087097167969, 0.000558018684387207, 0.0009970664978027344, 0.0014361143112182617, 0.001875162124633789, 0.0023142099380493164, 0.0027532577514648438, 0.003192305564880371, 0.0036313533782958984, 0.004070401191711426, 0.004509449005126953, 0.0049484968185424805, 0.005387544631958008, 0.005826592445373535, 0.0062656402587890625, 0.00670468807220459, 0.007143735885620117, 0.0075827836990356445, 0.008021831512451172, 0.0084608793258667, 0.008899927139282227, 0.009338974952697754, 0.009778022766113281, 0.010217070579528809, 0.010656118392944336, 0.011095166206359863, 0.01153421401977539, 0.011973261833190918, 0.012412309646606445, 0.012851357460021973, 0.0132904052734375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 146.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 631.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 165.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0], "bins": [-2.980232238769531e-07, -2.905726432800293e-07, -2.8312206268310547e-07, -2.7567148208618164e-07, -2.682209014892578e-07, -2.60770320892334e-07, -2.5331974029541016e-07, -2.4586915969848633e-07, -2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 9.0, 11.0, 10.0, 5.0, 4.0, 0.0, 2.0, 14.0, 52.0, 68.0, 55.0, 11.0, 122.0, 115.0, 104.0, 409.0, 11468.0, 933672.0, 101177.0, 560.0, 213.0, 63.0, 174.0, 16.0, 8.0, 73.0, 54.0, 40.0, 8.0, 0.0, 0.0, 8.0, 4.0, 8.0, 8.0, 14.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.814697265625e-06, -3.666616976261139e-06, -3.518536686897278e-06, -3.3704563975334167e-06, -3.2223761081695557e-06, -3.0742958188056946e-06, -2.9262155294418335e-06, -2.7781352400779724e-06, -2.6300549507141113e-06, -2.4819746613502502e-06, -2.333894371986389e-06, -2.185814082622528e-06, -2.037733793258667e-06, -1.889653503894806e-06, -1.7415732145309448e-06, -1.5934929251670837e-06, -1.4454126358032227e-06, -1.2973323464393616e-06, -1.1492520570755005e-06, -1.0011717677116394e-06, -8.530914783477783e-07, -7.050111889839172e-07, -5.569308996200562e-07, -4.0885061025619507e-07, -2.60770320892334e-07, -1.126900315284729e-07, 3.5390257835388184e-08, 1.8347054719924927e-07, 3.3155083656311035e-07, 4.796311259269714e-07, 6.277114152908325e-07, 7.757917046546936e-07, 9.238719940185547e-07, 1.0719522833824158e-06, 1.2200325727462769e-06, 1.368112862110138e-06, 1.516193151473999e-06, 1.6642734408378601e-06, 1.8123537302017212e-06, 1.9604340195655823e-06, 2.1085143089294434e-06, 2.2565945982933044e-06, 2.4046748876571655e-06, 2.5527551770210266e-06, 2.7008354663848877e-06, 2.8489157557487488e-06, 2.99699604511261e-06, 3.145076334476471e-06, 3.293156623840332e-06, 3.441236913204193e-06, 3.589317202568054e-06, 3.7373974919319153e-06, 3.885477781295776e-06, 4.0335580706596375e-06, 4.1816383600234985e-06, 4.32971864938736e-06, 4.477798938751221e-06, 4.625879228115082e-06, 4.773959517478943e-06, 4.922039806842804e-06, 5.070120096206665e-06, 5.218200385570526e-06, 5.366280674934387e-06, 5.514360964298248e-06, 5.662441253662109e-06]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 978.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.877844320271834e-08, -9.563981251403675e-08, -9.25011747199278e-08, -8.936254403124622e-08, -8.622390623713727e-08, -8.308527554845568e-08, -7.99466448597741e-08, -7.680800706566515e-08, -7.36693692715562e-08, -7.053073858287462e-08, -6.739210078876567e-08, -6.425347010008409e-08, -6.111483230597514e-08, -5.7976201617293555e-08, -5.483756737589829e-08, -5.169893313450302e-08, -4.8560302445821435e-08, -4.542166820442617e-08, -4.22830339630309e-08, -3.9144403274349315e-08, -3.600576548024037e-08, -3.286713479155878e-08, -2.9728500550163517e-08, -2.658986630876825e-08, -2.3451232067372985e-08, -2.031259782597772e-08, -1.7173963584582452e-08, -1.4035331119544026e-08, -1.089669687814876e-08, -7.758062636753493e-09, -4.6194301717150665e-09, -1.4807959303198004e-09, 1.6578312056481082e-09, 4.7964650029541644e-09, 7.93509880026022e-09, 1.1073732153477067e-08, 1.4212366394872333e-08, 1.73510006362676e-08, 2.0489633101306026e-08, 2.3628267342701292e-08, 2.676690158409656e-08, 2.9905535825491825e-08, 3.304417006688709e-08, 3.618280430828236e-08, 3.9321434996963944e-08, 4.246007279107289e-08, 4.5598703479754477e-08, 4.873733772114974e-08, 5.187597196254501e-08, 5.5014606203940275e-08, 5.815324044533554e-08, 6.129187113401713e-08, 6.443050892812607e-08, 6.756913961680766e-08, 7.070777030548925e-08, 7.384640809959819e-08, 7.698504589370714e-08, 8.012367658238873e-08, 8.326231437649767e-08, 8.640094506517926e-08, 8.95395828592882e-08, 9.267821354796979e-08, 9.581684423665138e-08, 9.895548203076032e-08, 1.0209411271944191e-07]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [25.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 977.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.960464477539063e-08, -5.681067705154419e-08, -5.4016709327697754e-08, -5.122274160385132e-08, -4.842877388000488e-08, -4.563480615615845e-08, -4.284083843231201e-08, -4.0046870708465576e-08, -3.725290298461914e-08, -3.4458935260772705e-08, -3.166496753692627e-08, -2.8870999813079834e-08, -2.60770320892334e-08, -2.3283064365386963e-08, -2.0489096641540527e-08, -1.7695128917694092e-08, -1.4901161193847656e-08, -1.210719347000122e-08, -9.313225746154785e-09, -6.51925802230835e-09, -3.725290298461914e-09, -9.313225746154785e-10, 1.862645149230957e-09, 4.6566128730773926e-09, 7.450580596923828e-09, 1.0244548320770264e-08, 1.30385160446167e-08, 1.5832483768463135e-08, 1.862645149230957e-08, 2.1420419216156006e-08, 2.421438694000244e-08, 2.7008354663848877e-08, 2.9802322387695312e-08, 3.259629011154175e-08, 3.5390257835388184e-08, 3.818422555923462e-08, 4.0978193283081055e-08, 4.377216100692749e-08, 4.6566128730773926e-08, 4.936009645462036e-08, 5.21540641784668e-08, 5.494803190231323e-08, 5.774199962615967e-08, 6.05359673500061e-08, 6.332993507385254e-08, 6.612390279769897e-08, 6.891787052154541e-08, 7.171183824539185e-08, 7.450580596923828e-08, 7.729977369308472e-08, 8.009374141693115e-08, 8.288770914077759e-08, 8.568167686462402e-08, 8.847564458847046e-08, 9.12696123123169e-08, 9.406358003616333e-08, 9.685754776000977e-08, 9.96515154838562e-08, 1.0244548320770264e-07, 1.0523945093154907e-07, 1.0803341865539551e-07, 1.1082738637924194e-07, 1.1362135410308838e-07, 1.1641532182693481e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 8.0, 8.0, 9.0, 19.0, 16.0, 21.0, 22.0, 16.0, 34.0, 23.0, 39.0, 37.0, 48.0, 41.0, 43.0, 36.0, 49.0, 43.0, 50.0, 47.0, 50.0, 39.0, 41.0, 32.0, 26.0, 34.0, 28.0, 19.0, 15.0, 20.0, 11.0, 13.0, 14.0, 11.0, 11.0, 5.0, 11.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.9375, -3.81298828125, -3.6884765625, -3.56396484375, -3.439453125, -3.31494140625, -3.1904296875, -3.06591796875, -2.94140625, -2.81689453125, -2.6923828125, -2.56787109375, -2.443359375, -2.31884765625, -2.1943359375, -2.06982421875, -1.9453125, -1.82080078125, -1.6962890625, -1.57177734375, -1.447265625, -1.32275390625, -1.1982421875, -1.07373046875, -0.94921875, -0.82470703125, -0.7001953125, -0.57568359375, -0.451171875, -0.32666015625, -0.2021484375, -0.07763671875, 0.046875, 0.17138671875, 0.2958984375, 0.42041015625, 0.544921875, 0.66943359375, 0.7939453125, 0.91845703125, 1.04296875, 1.16748046875, 1.2919921875, 1.41650390625, 1.541015625, 1.66552734375, 1.7900390625, 1.91455078125, 2.0390625, 2.16357421875, 2.2880859375, 2.41259765625, 2.537109375, 2.66162109375, 2.7861328125, 2.91064453125, 3.03515625, 3.15966796875, 3.2841796875, 3.40869140625, 3.533203125, 3.65771484375, 3.7822265625, 3.90673828125, 4.03125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 0.0, 9.0, 8.0, 14.0, 29.0, 33.0, 62.0, 82.0, 106.0, 181.0, 306.0, 530.0, 844.0, 1457.0, 2428.0, 4069.0, 6887.0, 12559.0, 22621.0, 42413.0, 81115.0, 173816.0, 334426.0, 182509.0, 84458.0, 43596.0, 23404.0, 12897.0, 7334.0, 4106.0, 2456.0, 1492.0, 823.0, 544.0, 356.0, 208.0, 123.0, 92.0, 57.0, 37.0, 27.0, 11.0, 12.0, 5.0, 9.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0390625, -3.91094970703125, -3.7828369140625, -3.65472412109375, -3.526611328125, -3.39849853515625, -3.2703857421875, -3.14227294921875, -3.01416015625, -2.88604736328125, -2.7579345703125, -2.62982177734375, -2.501708984375, -2.37359619140625, -2.2454833984375, -2.11737060546875, -1.9892578125, -1.86114501953125, -1.7330322265625, -1.60491943359375, -1.476806640625, -1.34869384765625, -1.2205810546875, -1.09246826171875, -0.96435546875, -0.83624267578125, -0.7081298828125, -0.58001708984375, -0.451904296875, -0.32379150390625, -0.1956787109375, -0.06756591796875, 0.060546875, 0.18865966796875, 0.3167724609375, 0.44488525390625, 0.572998046875, 0.70111083984375, 0.8292236328125, 0.95733642578125, 1.08544921875, 1.21356201171875, 1.3416748046875, 1.46978759765625, 1.597900390625, 1.72601318359375, 1.8541259765625, 1.98223876953125, 2.1103515625, 2.23846435546875, 2.3665771484375, 2.49468994140625, 2.622802734375, 2.75091552734375, 2.8790283203125, 3.00714111328125, 3.13525390625, 3.26336669921875, 3.3914794921875, 3.51959228515625, 3.647705078125, 3.77581787109375, 3.9039306640625, 4.03204345703125, 4.16015625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 4.0, 11.0, 7.0, 7.0, 12.0, 17.0, 29.0, 13.0, 18.0, 30.0, 38.0, 30.0, 32.0, 57.0, 80.0, 94.0, 166.0, 1384.0, 406.0, 157.0, 102.0, 62.0, 48.0, 46.0, 30.0, 39.0, 29.0, 28.0, 21.0, 13.0, 13.0, 9.0, 11.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9296875, -11.518310546875, -11.10693359375, -10.695556640625, -10.2841796875, -9.872802734375, -9.46142578125, -9.050048828125, -8.638671875, -8.227294921875, -7.81591796875, -7.404541015625, -6.9931640625, -6.581787109375, -6.17041015625, -5.759033203125, -5.34765625, -4.936279296875, -4.52490234375, -4.113525390625, -3.7021484375, -3.290771484375, -2.87939453125, -2.468017578125, -2.056640625, -1.645263671875, -1.23388671875, -0.822509765625, -0.4111328125, 0.000244140625, 0.41162109375, 0.822998046875, 1.234375, 1.645751953125, 2.05712890625, 2.468505859375, 2.8798828125, 3.291259765625, 3.70263671875, 4.114013671875, 4.525390625, 4.936767578125, 5.34814453125, 5.759521484375, 6.1708984375, 6.582275390625, 6.99365234375, 7.405029296875, 7.81640625, 8.227783203125, 8.63916015625, 9.050537109375, 9.4619140625, 9.873291015625, 10.28466796875, 10.696044921875, 11.107421875, 11.518798828125, 11.93017578125, 12.341552734375, 12.7529296875, 13.164306640625, 13.57568359375, 13.987060546875, 14.3984375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 5.0, 6.0, 8.0, 10.0, 24.0, 29.0, 57.0, 103.0, 135.0, 293.0, 629.0, 2098.0, 14035.0, 217587.0, 2790941.0, 108166.0, 8829.0, 1554.0, 511.0, 261.0, 143.0, 96.0, 58.0, 41.0, 32.0, 13.0, 16.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6484375, -15.1160888671875, -14.583740234375, -14.0513916015625, -13.51904296875, -12.9866943359375, -12.454345703125, -11.9219970703125, -11.3896484375, -10.8572998046875, -10.324951171875, -9.7926025390625, -9.26025390625, -8.7279052734375, -8.195556640625, -7.6632080078125, -7.130859375, -6.5985107421875, -6.066162109375, -5.5338134765625, -5.00146484375, -4.4691162109375, -3.936767578125, -3.4044189453125, -2.8720703125, -2.3397216796875, -1.807373046875, -1.2750244140625, -0.74267578125, -0.2103271484375, 0.322021484375, 0.8543701171875, 1.38671875, 1.9190673828125, 2.451416015625, 2.9837646484375, 3.51611328125, 4.0484619140625, 4.580810546875, 5.1131591796875, 5.6455078125, 6.1778564453125, 6.710205078125, 7.2425537109375, 7.77490234375, 8.3072509765625, 8.839599609375, 9.3719482421875, 9.904296875, 10.4366455078125, 10.968994140625, 11.5013427734375, 12.03369140625, 12.5660400390625, 13.098388671875, 13.6307373046875, 14.1630859375, 14.6954345703125, 15.227783203125, 15.7601318359375, 16.29248046875, 16.8248291015625, 17.357177734375, 17.8895263671875, 18.421875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [2.0, 7.0, 214.0, 579.0, 207.0, 12.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.43085765838623, -8.188886642456055, -4.946916580200195, -1.7049455642700195, 1.5370244979858398, 4.778994560241699, 8.020966529846191, 11.26293659210205, 14.50490665435791, 17.746877670288086, 20.988847732543945, 24.230819702148438, 27.472789764404297, 30.714759826660156, 33.956729888916016, 37.198699951171875, 40.440670013427734, 43.682640075683594, 46.92461013793945, 50.16658020019531, 53.40855407714844, 56.65052032470703, 59.892494201660156, 63.134464263916016, 66.37643432617188, 69.618408203125, 72.8603744506836, 76.10234832763672, 79.34431457519531, 82.58628845214844, 85.82826232910156, 89.07022857666016, 92.31219482421875, 95.55416870117188, 98.79613494873047, 102.0381088256836, 105.28007507324219, 108.52204895019531, 111.76402282714844, 115.00598907470703, 118.24795532226562, 121.48992919921875, 124.73189544677734, 127.97386932373047, 131.21583557128906, 134.4578094482422, 137.6997833251953, 140.94174194335938, 144.1837158203125, 147.42568969726562, 150.66766357421875, 153.9096221923828, 157.15159606933594, 160.39356994628906, 163.6355438232422, 166.87750244140625, 170.11949157714844, 173.36146545410156, 176.6034393310547, 179.84539794921875, 183.08737182617188, 186.329345703125, 189.57131958007812, 192.81329345703125, 196.0552520751953]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 15.0, 7.0, 10.0, 16.0, 8.0, 11.0, 14.0, 17.0, 22.0, 19.0, 30.0, 24.0, 29.0, 39.0, 35.0, 39.0, 47.0, 35.0, 35.0, 50.0, 33.0, 38.0, 52.0, 33.0, 39.0, 21.0, 25.0, 32.0, 34.0, 22.0, 26.0, 24.0, 24.0, 21.0, 10.0, 8.0, 15.0, 3.0, 13.0, 4.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-24.566593170166016, -23.82815170288086, -23.08970832824707, -22.351266860961914, -21.612823486328125, -20.87438201904297, -20.135940551757812, -19.397499084472656, -18.659055709838867, -17.92061424255371, -17.182170867919922, -16.443729400634766, -15.705286979675293, -14.96684455871582, -14.228403091430664, -13.489960670471191, -12.751518249511719, -12.013075828552246, -11.274633407592773, -10.536191940307617, -9.797749519348145, -9.059307098388672, -8.320865631103516, -7.582423210144043, -6.84398078918457, -6.105538368225098, -5.367096424102783, -4.628654479980469, -3.890212059020996, -3.1517698764801025, -2.413327693939209, -1.6748857498168945, -0.9364452362060547, -0.19800305366516113, 0.5404391288757324, 1.278881311416626, 2.0173234939575195, 2.755765676498413, 3.4942078590393066, 4.232649803161621, 4.971092224121094, 5.709534645080566, 6.447976589202881, 7.186418533325195, 7.924860954284668, 8.66330337524414, 9.401744842529297, 10.14018726348877, 10.878629684448242, 11.617072105407715, 12.355514526367188, 13.093955993652344, 13.832398414611816, 14.570840835571289, 15.309282302856445, 16.047725677490234, 16.78616714477539, 17.524608612060547, 18.263051986694336, 19.001493453979492, 19.73993682861328, 20.478378295898438, 21.216819763183594, 21.95526123046875, 22.69370460510254]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 4.0, 7.0, 6.0, 8.0, 9.0, 9.0, 17.0, 18.0, 29.0, 22.0, 25.0, 22.0, 25.0, 45.0, 43.0, 40.0, 31.0, 47.0, 42.0, 38.0, 42.0, 44.0, 41.0, 55.0, 49.0, 32.0, 41.0, 22.0, 25.0, 28.0, 24.0, 20.0, 10.0, 20.0, 9.0, 11.0, 12.0, 6.0, 7.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.78125, -3.65606689453125, -3.5308837890625, -3.40570068359375, -3.280517578125, -3.15533447265625, -3.0301513671875, -2.90496826171875, -2.77978515625, -2.65460205078125, -2.5294189453125, -2.40423583984375, -2.279052734375, -2.15386962890625, -2.0286865234375, -1.90350341796875, -1.7783203125, -1.65313720703125, -1.5279541015625, -1.40277099609375, -1.277587890625, -1.15240478515625, -1.0272216796875, -0.90203857421875, -0.77685546875, -0.65167236328125, -0.5264892578125, -0.40130615234375, -0.276123046875, -0.15093994140625, -0.0257568359375, 0.09942626953125, 0.224609375, 0.34979248046875, 0.4749755859375, 0.60015869140625, 0.725341796875, 0.85052490234375, 0.9757080078125, 1.10089111328125, 1.22607421875, 1.35125732421875, 1.4764404296875, 1.60162353515625, 1.726806640625, 1.85198974609375, 1.9771728515625, 2.10235595703125, 2.2275390625, 2.35272216796875, 2.4779052734375, 2.60308837890625, 2.728271484375, 2.85345458984375, 2.9786376953125, 3.10382080078125, 3.22900390625, 3.35418701171875, 3.4793701171875, 3.60455322265625, 3.729736328125, 3.85491943359375, 3.9801025390625, 4.10528564453125, 4.23046875]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 8.0, 16.0, 22.0, 39.0, 66.0, 80.0, 153.0, 247.0, 420.0, 908.0, 2038.0, 5166.0, 14582.0, 49167.0, 250323.0, 2231264.0, 1431181.0, 153894.0, 35599.0, 11375.0, 4174.0, 1794.0, 812.0, 412.0, 177.0, 132.0, 75.0, 42.0, 33.0, 22.0, 10.0, 9.0, 8.0, 2.0, 3.0, 2.0, 6.0, 0.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.69921875, -7.41278076171875, -7.1263427734375, -6.83990478515625, -6.553466796875, -6.26702880859375, -5.9805908203125, -5.69415283203125, -5.40771484375, -5.12127685546875, -4.8348388671875, -4.54840087890625, -4.261962890625, -3.97552490234375, -3.6890869140625, -3.40264892578125, -3.1162109375, -2.82977294921875, -2.5433349609375, -2.25689697265625, -1.970458984375, -1.68402099609375, -1.3975830078125, -1.11114501953125, -0.82470703125, -0.53826904296875, -0.2518310546875, 0.03460693359375, 0.321044921875, 0.60748291015625, 0.8939208984375, 1.18035888671875, 1.466796875, 1.75323486328125, 2.0396728515625, 2.32611083984375, 2.612548828125, 2.89898681640625, 3.1854248046875, 3.47186279296875, 3.75830078125, 4.04473876953125, 4.3311767578125, 4.61761474609375, 4.904052734375, 5.19049072265625, 5.4769287109375, 5.76336669921875, 6.0498046875, 6.33624267578125, 6.6226806640625, 6.90911865234375, 7.195556640625, 7.48199462890625, 7.7684326171875, 8.05487060546875, 8.34130859375, 8.62774658203125, 8.9141845703125, 9.20062255859375, 9.487060546875, 9.77349853515625, 10.0599365234375, 10.34637451171875, 10.6328125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 4.0, 11.0, 9.0, 17.0, 26.0, 44.0, 62.0, 73.0, 79.0, 121.0, 207.0, 291.0, 420.0, 599.0, 584.0, 476.0, 291.0, 216.0, 180.0, 95.0, 82.0, 63.0, 38.0, 31.0, 16.0, 12.0, 10.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.03125, -4.8131103515625, -4.594970703125, -4.3768310546875, -4.15869140625, -3.9405517578125, -3.722412109375, -3.5042724609375, -3.2861328125, -3.0679931640625, -2.849853515625, -2.6317138671875, -2.41357421875, -2.1954345703125, -1.977294921875, -1.7591552734375, -1.541015625, -1.3228759765625, -1.104736328125, -0.8865966796875, -0.66845703125, -0.4503173828125, -0.232177734375, -0.0140380859375, 0.2041015625, 0.4222412109375, 0.640380859375, 0.8585205078125, 1.07666015625, 1.2947998046875, 1.512939453125, 1.7310791015625, 1.94921875, 2.1673583984375, 2.385498046875, 2.6036376953125, 2.82177734375, 3.0399169921875, 3.258056640625, 3.4761962890625, 3.6943359375, 3.9124755859375, 4.130615234375, 4.3487548828125, 4.56689453125, 4.7850341796875, 5.003173828125, 5.2213134765625, 5.439453125, 5.6575927734375, 5.875732421875, 6.0938720703125, 6.31201171875, 6.5301513671875, 6.748291015625, 6.9664306640625, 7.1845703125, 7.4027099609375, 7.620849609375, 7.8389892578125, 8.05712890625, 8.2752685546875, 8.493408203125, 8.7115478515625, 8.9296875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 4.0, 6.0, 10.0, 2.0, 11.0, 24.0, 22.0, 32.0, 41.0, 74.0, 104.0, 189.0, 362.0, 735.0, 1680.0, 4177.0, 12526.0, 44357.0, 187567.0, 1187573.0, 2318209.0, 334875.0, 72128.0, 19293.0, 6031.0, 2229.0, 972.0, 438.0, 243.0, 139.0, 63.0, 48.0, 34.0, 34.0, 19.0, 11.0, 10.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.875, -9.5860595703125, -9.297119140625, -9.0081787109375, -8.71923828125, -8.4302978515625, -8.141357421875, -7.8524169921875, -7.5634765625, -7.2745361328125, -6.985595703125, -6.6966552734375, -6.40771484375, -6.1187744140625, -5.829833984375, -5.5408935546875, -5.251953125, -4.9630126953125, -4.674072265625, -4.3851318359375, -4.09619140625, -3.8072509765625, -3.518310546875, -3.2293701171875, -2.9404296875, -2.6514892578125, -2.362548828125, -2.0736083984375, -1.78466796875, -1.4957275390625, -1.206787109375, -0.9178466796875, -0.62890625, -0.3399658203125, -0.051025390625, 0.2379150390625, 0.52685546875, 0.8157958984375, 1.104736328125, 1.3936767578125, 1.6826171875, 1.9715576171875, 2.260498046875, 2.5494384765625, 2.83837890625, 3.1273193359375, 3.416259765625, 3.7052001953125, 3.994140625, 4.2830810546875, 4.572021484375, 4.8609619140625, 5.14990234375, 5.4388427734375, 5.727783203125, 6.0167236328125, 6.3056640625, 6.5946044921875, 6.883544921875, 7.1724853515625, 7.46142578125, 7.7503662109375, 8.039306640625, 8.3282470703125, 8.6171875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 11.0, 22.0, 29.0, 30.0, 63.0, 90.0, 121.0, 115.0, 114.0, 118.0, 103.0, 66.0, 57.0, 25.0, 18.0, 11.0, 6.0, 4.0, 4.0], "bins": [-48.4801139831543, -47.56629180908203, -46.65247344970703, -45.738651275634766, -44.8248291015625, -43.9110107421875, -42.997188568115234, -42.08336639404297, -41.16954803466797, -40.2557258605957, -39.3419075012207, -38.42808532714844, -37.51426315307617, -36.60044479370117, -35.686622619628906, -34.772804260253906, -33.85898208618164, -32.945159912109375, -32.031341552734375, -31.11751937866211, -30.203699111938477, -29.289878845214844, -28.376056671142578, -27.462236404418945, -26.54841423034668, -25.634593963623047, -24.72077178955078, -23.80695152282715, -22.893131256103516, -21.97930908203125, -21.065488815307617, -20.151668548583984, -19.23784637451172, -18.324026107788086, -17.41020393371582, -16.496383666992188, -15.582563400268555, -14.668742179870605, -13.754920959472656, -12.841100692749023, -11.92728042602539, -11.013459205627441, -10.099638938903809, -9.18581771850586, -8.271997451782227, -7.358176231384277, -6.444355487823486, -5.530534744262695, -4.6167144775390625, -3.7028937339782715, -2.7890729904174805, -1.8752520084381104, -0.9614312648773193, -0.04761028289794922, 0.8662104606628418, 1.7800312042236328, 2.693851947784424, 3.607672691345215, 4.521493434906006, 5.435314178466797, 6.349135398864746, 7.262956142425537, 8.176776885986328, 9.090597152709961, 10.00441837310791]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 11.0, 10.0, 9.0, 14.0, 11.0, 25.0, 22.0, 24.0, 27.0, 15.0, 23.0, 32.0, 30.0, 40.0, 44.0, 37.0, 32.0, 26.0, 40.0, 34.0, 48.0, 37.0, 35.0, 32.0, 31.0, 34.0, 44.0, 30.0, 18.0, 32.0, 18.0, 18.0, 23.0, 17.0, 15.0, 6.0, 10.0, 14.0, 4.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-19.134492874145508, -18.515792846679688, -17.897090911865234, -17.278390884399414, -16.659690856933594, -16.04098892211914, -15.42228889465332, -14.803587913513184, -14.184886932373047, -13.56618595123291, -12.947484970092773, -12.328784942626953, -11.710083961486816, -11.09138298034668, -10.47268295288086, -9.853981971740723, -9.235280990600586, -8.61658000946045, -7.997879505157471, -7.379179000854492, -6.7604780197143555, -6.141777038574219, -5.52307653427124, -4.904376029968262, -4.285675048828125, -3.6669743061065674, -3.0482735633850098, -2.429572820663452, -1.8108720779418945, -1.192171335220337, -0.5734705924987793, 0.04522991180419922, 0.6639328002929688, 1.2826335430145264, 1.901334285736084, 2.5200350284576416, 3.138735771179199, 3.757436513900757, 4.3761372566223145, 4.994837760925293, 5.61353874206543, 6.232239723205566, 6.850940227508545, 7.469640731811523, 8.08834171295166, 8.707042694091797, 9.325742721557617, 9.944443702697754, 10.56314468383789, 11.181845664978027, 11.800546646118164, 12.419246673583984, 13.037947654724121, 13.656648635864258, 14.275348663330078, 14.894049644470215, 15.512750625610352, 16.131450653076172, 16.750152587890625, 17.368852615356445, 17.987552642822266, 18.60625457763672, 19.22495460510254, 19.84365463256836, 20.462356567382812]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 9.0, 5.0, 5.0, 6.0, 12.0, 14.0, 12.0, 17.0, 29.0, 29.0, 25.0, 31.0, 31.0, 35.0, 41.0, 48.0, 48.0, 59.0, 39.0, 50.0, 33.0, 52.0, 29.0, 48.0, 28.0, 41.0, 37.0, 35.0, 29.0, 26.0, 19.0, 20.0, 26.0, 9.0, 10.0, 4.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1484375, -4.0076904296875, -3.866943359375, -3.7261962890625, -3.58544921875, -3.4447021484375, -3.303955078125, -3.1632080078125, -3.0224609375, -2.8817138671875, -2.740966796875, -2.6002197265625, -2.45947265625, -2.3187255859375, -2.177978515625, -2.0372314453125, -1.896484375, -1.7557373046875, -1.614990234375, -1.4742431640625, -1.33349609375, -1.1927490234375, -1.052001953125, -0.9112548828125, -0.7705078125, -0.6297607421875, -0.489013671875, -0.3482666015625, -0.20751953125, -0.0667724609375, 0.073974609375, 0.2147216796875, 0.35546875, 0.4962158203125, 0.636962890625, 0.7777099609375, 0.91845703125, 1.0592041015625, 1.199951171875, 1.3406982421875, 1.4814453125, 1.6221923828125, 1.762939453125, 1.9036865234375, 2.04443359375, 2.1851806640625, 2.325927734375, 2.4666748046875, 2.607421875, 2.7481689453125, 2.888916015625, 3.0296630859375, 3.17041015625, 3.3111572265625, 3.451904296875, 3.5926513671875, 3.7333984375, 3.8741455078125, 4.014892578125, 4.1556396484375, 4.29638671875, 4.4371337890625, 4.577880859375, 4.7186279296875, 4.859375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 4.0, 8.0, 10.0, 14.0, 21.0, 16.0, 39.0, 50.0, 70.0, 152.0, 172.0, 262.0, 473.0, 599.0, 1060.0, 1778.0, 2842.0, 4826.0, 8435.0, 14362.0, 24287.0, 42488.0, 75915.0, 154407.0, 334118.0, 182851.0, 85963.0, 47185.0, 27227.0, 15897.0, 9260.0, 5363.0, 3289.0, 1889.0, 1154.0, 737.0, 432.0, 298.0, 192.0, 148.0, 71.0, 49.0, 53.0, 33.0, 22.0, 10.0, 13.0, 6.0, 4.0, 0.0, 2.0, 1.0, 4.0, 3.0], "bins": [-0.02764892578125, -0.026849746704101562, -0.026050567626953125, -0.025251388549804688, -0.02445220947265625, -0.023653030395507812, -0.022853851318359375, -0.022054672241210938, -0.0212554931640625, -0.020456314086914062, -0.019657135009765625, -0.018857955932617188, -0.01805877685546875, -0.017259597778320312, -0.016460418701171875, -0.015661239624023438, -0.014862060546875, -0.014062881469726562, -0.013263702392578125, -0.012464523315429688, -0.01166534423828125, -0.010866165161132812, -0.010066986083984375, -0.009267807006835938, -0.0084686279296875, -0.0076694488525390625, -0.006870269775390625, -0.0060710906982421875, -0.00527191162109375, -0.0044727325439453125, -0.003673553466796875, -0.0028743743896484375, -0.0020751953125, -0.0012760162353515625, -0.000476837158203125, 0.0003223419189453125, 0.00112152099609375, 0.0019207000732421875, 0.002719879150390625, 0.0035190582275390625, 0.0043182373046875, 0.0051174163818359375, 0.005916595458984375, 0.0067157745361328125, 0.00751495361328125, 0.008314132690429688, 0.009113311767578125, 0.009912490844726562, 0.010711669921875, 0.011510848999023438, 0.012310028076171875, 0.013109207153320312, 0.01390838623046875, 0.014707565307617188, 0.015506744384765625, 0.016305923461914062, 0.0171051025390625, 0.017904281616210938, 0.018703460693359375, 0.019502639770507812, 0.02030181884765625, 0.021100997924804688, 0.021900177001953125, 0.022699356079101562, 0.02349853515625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 4.0, 5.0, 5.0, 5.0, 7.0, 14.0, 11.0, 11.0, 11.0, 12.0, 15.0, 31.0, 28.0, 21.0, 29.0, 33.0, 42.0, 47.0, 37.0, 42.0, 37.0, 39.0, 1069.0, 51.0, 54.0, 31.0, 31.0, 38.0, 35.0, 35.0, 23.0, 17.0, 22.0, 16.0, 22.0, 12.0, 9.0, 17.0, 14.0, 14.0, 7.0, 6.0, 1.0, 2.0, 7.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0], "bins": [-2.681640625, -2.601837158203125, -2.52203369140625, -2.442230224609375, -2.3624267578125, -2.282623291015625, -2.20281982421875, -2.123016357421875, -2.043212890625, -1.963409423828125, -1.88360595703125, -1.803802490234375, -1.7239990234375, -1.644195556640625, -1.56439208984375, -1.484588623046875, -1.40478515625, -1.324981689453125, -1.24517822265625, -1.165374755859375, -1.0855712890625, -1.005767822265625, -0.92596435546875, -0.846160888671875, -0.766357421875, -0.686553955078125, -0.60675048828125, -0.526947021484375, -0.4471435546875, -0.367340087890625, -0.28753662109375, -0.207733154296875, -0.1279296875, -0.048126220703125, 0.03167724609375, 0.111480712890625, 0.1912841796875, 0.271087646484375, 0.35089111328125, 0.430694580078125, 0.510498046875, 0.590301513671875, 0.67010498046875, 0.749908447265625, 0.8297119140625, 0.909515380859375, 0.98931884765625, 1.069122314453125, 1.14892578125, 1.228729248046875, 1.30853271484375, 1.388336181640625, 1.4681396484375, 1.547943115234375, 1.62774658203125, 1.707550048828125, 1.787353515625, 1.867156982421875, 1.94696044921875, 2.026763916015625, 2.1065673828125, 2.186370849609375, 2.26617431640625, 2.345977783203125, 2.42578125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 10.0, 5.0, 5.0, 4.0, 9.0, 21.0, 28.0, 51.0, 51.0, 85.0, 96.0, 178.0, 284.0, 369.0, 497.0, 729.0, 1137.0, 1607.0, 2429.0, 3687.0, 5499.0, 8515.0, 12992.0, 21024.0, 33881.0, 58086.0, 106366.0, 254792.0, 1316904.0, 111910.0, 60256.0, 34955.0, 21572.0, 13339.0, 8514.0, 5816.0, 3608.0, 2456.0, 1806.0, 1100.0, 748.0, 523.0, 397.0, 220.0, 152.0, 139.0, 119.0, 64.0, 33.0, 26.0, 11.0, 14.0, 11.0, 8.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.01471710205078125, -0.014227032661437988, -0.013736963272094727, -0.013246893882751465, -0.012756824493408203, -0.012266755104064941, -0.01177668571472168, -0.011286616325378418, -0.010796546936035156, -0.010306477546691895, -0.009816408157348633, -0.009326338768005371, -0.00883626937866211, -0.008346199989318848, -0.007856130599975586, -0.007366061210632324, -0.0068759918212890625, -0.006385922431945801, -0.005895853042602539, -0.005405783653259277, -0.004915714263916016, -0.004425644874572754, -0.003935575485229492, -0.0034455060958862305, -0.0029554367065429688, -0.002465367317199707, -0.0019752979278564453, -0.0014852285385131836, -0.0009951591491699219, -0.0005050897598266602, -1.5020370483398438e-05, 0.0004750490188598633, 0.000965118408203125, 0.0014551877975463867, 0.0019452571868896484, 0.00243532657623291, 0.002925395965576172, 0.0034154653549194336, 0.0039055347442626953, 0.004395604133605957, 0.004885673522949219, 0.0053757429122924805, 0.005865812301635742, 0.006355881690979004, 0.006845951080322266, 0.007336020469665527, 0.007826089859008789, 0.00831615924835205, 0.008806228637695312, 0.009296298027038574, 0.009786367416381836, 0.010276436805725098, 0.01076650619506836, 0.011256575584411621, 0.011746644973754883, 0.012236714363098145, 0.012726783752441406, 0.013216853141784668, 0.01370692253112793, 0.014196991920471191, 0.014687061309814453, 0.015177130699157715, 0.015667200088500977, 0.01615726947784424, 0.0166473388671875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 49.0, 0.0, 0.0, 0.0, 0.0, 204.0, 0.0, 0.0, 0.0, 0.0, 0.0, 478.0, 0.0, 0.0, 0.0, 0.0, 188.0, 0.0, 0.0, 0.0, 0.0, 60.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.46451997756958e-07, -3.3527612686157227e-07, -3.241002559661865e-07, -3.129243850708008e-07, -3.0174851417541504e-07, -2.905726432800293e-07, -2.7939677238464355e-07, -2.682209014892578e-07, -2.5704503059387207e-07, -2.4586915969848633e-07, -2.3469328880310059e-07, -2.2351741790771484e-07, -2.123415470123291e-07, -2.0116567611694336e-07, -1.8998980522155762e-07, -1.7881393432617188e-07, -1.6763806343078613e-07, -1.564621925354004e-07, -1.4528632164001465e-07, -1.341104507446289e-07, -1.2293457984924316e-07, -1.1175870895385742e-07, -1.0058283805847168e-07, -8.940696716308594e-08, -7.82310962677002e-08, -6.705522537231445e-08, -5.587935447692871e-08, -4.470348358154297e-08, -3.3527612686157227e-08, -2.2351741790771484e-08, -1.1175870895385742e-08, 0.0, 1.1175870895385742e-08, 2.2351741790771484e-08, 3.3527612686157227e-08, 4.470348358154297e-08, 5.587935447692871e-08, 6.705522537231445e-08, 7.82310962677002e-08, 8.940696716308594e-08, 1.0058283805847168e-07, 1.1175870895385742e-07, 1.2293457984924316e-07, 1.341104507446289e-07, 1.4528632164001465e-07, 1.564621925354004e-07, 1.6763806343078613e-07, 1.7881393432617188e-07, 1.8998980522155762e-07, 2.0116567611694336e-07, 2.123415470123291e-07, 2.2351741790771484e-07, 2.3469328880310059e-07, 2.4586915969848633e-07, 2.5704503059387207e-07, 2.682209014892578e-07, 2.7939677238464355e-07, 2.905726432800293e-07, 3.0174851417541504e-07, 3.129243850708008e-07, 3.241002559661865e-07, 3.3527612686157227e-07, 3.46451997756958e-07, 3.5762786865234375e-07]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 8.0, 6.0, 2.0, 2.0, 35.0, 27.0, 14.0, 1.0, 53.0, 71.0, 50.0, 128.0, 302.0, 229.0, 1219.0, 895471.0, 149319.0, 765.0, 214.0, 273.0, 97.0, 96.0, 56.0, 30.0, 1.0, 16.0, 32.0, 13.0, 3.0, 2.0, 5.0, 3.0, 8.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.033348083496094e-06, -6.812624633312225e-06, -6.591901183128357e-06, -6.3711777329444885e-06, -6.15045428276062e-06, -5.929730832576752e-06, -5.709007382392883e-06, -5.488283932209015e-06, -5.2675604820251465e-06, -5.046837031841278e-06, -4.82611358165741e-06, -4.605390131473541e-06, -4.384666681289673e-06, -4.1639432311058044e-06, -3.943219780921936e-06, -3.7224963307380676e-06, -3.5017728805541992e-06, -3.281049430370331e-06, -3.0603259801864624e-06, -2.839602530002594e-06, -2.6188790798187256e-06, -2.398155629634857e-06, -2.1774321794509888e-06, -1.9567087292671204e-06, -1.735985279083252e-06, -1.5152618288993835e-06, -1.2945383787155151e-06, -1.0738149285316467e-06, -8.530914783477783e-07, -6.323680281639099e-07, -4.116445779800415e-07, -1.909211277961731e-07, 2.9802322387695312e-08, 2.505257725715637e-07, 4.7124922275543213e-07, 6.919726729393005e-07, 9.126961231231689e-07, 1.1334195733070374e-06, 1.3541430234909058e-06, 1.5748664736747742e-06, 1.7955899238586426e-06, 2.016313374042511e-06, 2.2370368242263794e-06, 2.457760274410248e-06, 2.678483724594116e-06, 2.8992071747779846e-06, 3.119930624961853e-06, 3.3406540751457214e-06, 3.56137752532959e-06, 3.7821009755134583e-06, 4.002824425697327e-06, 4.223547875881195e-06, 4.4442713260650635e-06, 4.664994776248932e-06, 4.8857182264328e-06, 5.106441676616669e-06, 5.327165126800537e-06, 5.5478885769844055e-06, 5.768612027168274e-06, 5.989335477352142e-06, 6.210058927536011e-06, 6.430782377719879e-06, 6.6515058279037476e-06, 6.872229278087616e-06, 7.092952728271484e-06]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 9.0, 40.0, 888.0, 65.0, 14.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3163825087758596e-06, -1.2823385304727708e-06, -1.248294552169682e-06, -1.2142505738665932e-06, -1.1802065955635044e-06, -1.1461626172604156e-06, -1.1121186389573268e-06, -1.0780745469674002e-06, -1.0440305686643114e-06, -1.0099865903612226e-06, -9.759426120581338e-07, -9.41898633755045e-07, -9.078546554519562e-07, -8.738106771488674e-07, -8.397666420023597e-07, -8.057226636992709e-07, -7.71678742239601e-07, -7.376347639365122e-07, -7.035907856334234e-07, -6.695468073303346e-07, -6.355028290272458e-07, -6.014588507241569e-07, -5.674148155776493e-07, -5.333708372745605e-07, -4.993268589714717e-07, -4.6528288066838286e-07, -4.3123890236529405e-07, -3.971948956404958e-07, -3.63150917337407e-07, -3.291069390343182e-07, -2.9506293230951997e-07, -2.6101895400643116e-07, -2.2697508939018007e-07, -1.9293111108709127e-07, -1.5888711857314775e-07, -1.2484312605920422e-07, -9.079914775611542e-08, -5.675516945302661e-08, -2.271117693908309e-08, 1.1332815574860433e-08, 4.537679387794924e-08, 7.94207792864654e-08, 1.1346476469498157e-07, 1.475087572089251e-07, 1.815527355120139e-07, 2.155967138151027e-07, 2.4964072053990094e-07, 2.8368469884298975e-07, 3.1772867714607855e-07, 3.5177265544916736e-07, 3.8581663375225617e-07, 4.198606404770544e-07, 4.539046187801432e-07, 4.879485686615226e-07, 5.219926038080303e-07, 5.560365821111191e-07, 5.900805604142079e-07, 6.241245387172967e-07, 6.581685170203855e-07, 6.922124953234743e-07, 7.26256530469982e-07, 7.603005087730708e-07, 7.943444870761596e-07, 8.283884653792484e-07, 8.624324436823372e-07]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 101.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 813.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 9.0, 5.0, 5.0, 6.0, 12.0, 14.0, 12.0, 17.0, 29.0, 29.0, 25.0, 31.0, 31.0, 35.0, 41.0, 48.0, 48.0, 59.0, 39.0, 50.0, 33.0, 52.0, 29.0, 48.0, 28.0, 41.0, 37.0, 35.0, 29.0, 26.0, 19.0, 20.0, 26.0, 9.0, 10.0, 4.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1484375, -4.0076904296875, -3.866943359375, -3.7261962890625, -3.58544921875, -3.4447021484375, -3.303955078125, -3.1632080078125, -3.0224609375, -2.8817138671875, -2.740966796875, -2.6002197265625, -2.45947265625, -2.3187255859375, -2.177978515625, -2.0372314453125, -1.896484375, -1.7557373046875, -1.614990234375, -1.4742431640625, -1.33349609375, -1.1927490234375, -1.052001953125, -0.9112548828125, -0.7705078125, -0.6297607421875, -0.489013671875, -0.3482666015625, -0.20751953125, -0.0667724609375, 0.073974609375, 0.2147216796875, 0.35546875, 0.4962158203125, 0.636962890625, 0.7777099609375, 0.91845703125, 1.0592041015625, 1.199951171875, 1.3406982421875, 1.4814453125, 1.6221923828125, 1.762939453125, 1.9036865234375, 2.04443359375, 2.1851806640625, 2.325927734375, 2.4666748046875, 2.607421875, 2.7481689453125, 2.888916015625, 3.0296630859375, 3.17041015625, 3.3111572265625, 3.451904296875, 3.5926513671875, 3.7333984375, 3.8741455078125, 4.014892578125, 4.1556396484375, 4.29638671875, 4.4371337890625, 4.577880859375, 4.7186279296875, 4.859375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 7.0, 10.0, 13.0, 9.0, 22.0, 24.0, 43.0, 67.0, 99.0, 155.0, 230.0, 371.0, 670.0, 1113.0, 1836.0, 3270.0, 5642.0, 10505.0, 19370.0, 35581.0, 65358.0, 126624.0, 306979.0, 242079.0, 104726.0, 56128.0, 30368.0, 16526.0, 8890.0, 4939.0, 2865.0, 1568.0, 939.0, 554.0, 335.0, 223.0, 145.0, 77.0, 66.0, 34.0, 30.0, 17.0, 17.0, 12.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.32421875, -4.18853759765625, -4.0528564453125, -3.91717529296875, -3.781494140625, -3.64581298828125, -3.5101318359375, -3.37445068359375, -3.23876953125, -3.10308837890625, -2.9674072265625, -2.83172607421875, -2.696044921875, -2.56036376953125, -2.4246826171875, -2.28900146484375, -2.1533203125, -2.01763916015625, -1.8819580078125, -1.74627685546875, -1.610595703125, -1.47491455078125, -1.3392333984375, -1.20355224609375, -1.06787109375, -0.93218994140625, -0.7965087890625, -0.66082763671875, -0.525146484375, -0.38946533203125, -0.2537841796875, -0.11810302734375, 0.017578125, 0.15325927734375, 0.2889404296875, 0.42462158203125, 0.560302734375, 0.69598388671875, 0.8316650390625, 0.96734619140625, 1.10302734375, 1.23870849609375, 1.3743896484375, 1.51007080078125, 1.645751953125, 1.78143310546875, 1.9171142578125, 2.05279541015625, 2.1884765625, 2.32415771484375, 2.4598388671875, 2.59552001953125, 2.731201171875, 2.86688232421875, 3.0025634765625, 3.13824462890625, 3.27392578125, 3.40960693359375, 3.5452880859375, 3.68096923828125, 3.816650390625, 3.95233154296875, 4.0880126953125, 4.22369384765625, 4.359375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 2.0, 7.0, 4.0, 8.0, 5.0, 18.0, 16.0, 16.0, 17.0, 22.0, 16.0, 38.0, 27.0, 45.0, 41.0, 44.0, 77.0, 114.0, 197.0, 1497.0, 262.0, 158.0, 74.0, 65.0, 40.0, 41.0, 45.0, 26.0, 17.0, 18.0, 18.0, 12.0, 15.0, 17.0, 7.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.03125, -11.6842041015625, -11.337158203125, -10.9901123046875, -10.64306640625, -10.2960205078125, -9.948974609375, -9.6019287109375, -9.2548828125, -8.9078369140625, -8.560791015625, -8.2137451171875, -7.86669921875, -7.5196533203125, -7.172607421875, -6.8255615234375, -6.478515625, -6.1314697265625, -5.784423828125, -5.4373779296875, -5.09033203125, -4.7432861328125, -4.396240234375, -4.0491943359375, -3.7021484375, -3.3551025390625, -3.008056640625, -2.6610107421875, -2.31396484375, -1.9669189453125, -1.619873046875, -1.2728271484375, -0.92578125, -0.5787353515625, -0.231689453125, 0.1153564453125, 0.46240234375, 0.8094482421875, 1.156494140625, 1.5035400390625, 1.8505859375, 2.1976318359375, 2.544677734375, 2.8917236328125, 3.23876953125, 3.5858154296875, 3.932861328125, 4.2799072265625, 4.626953125, 4.9739990234375, 5.321044921875, 5.6680908203125, 6.01513671875, 6.3621826171875, 6.709228515625, 7.0562744140625, 7.4033203125, 7.7503662109375, 8.097412109375, 8.4444580078125, 8.79150390625, 9.1385498046875, 9.485595703125, 9.8326416015625, 10.1796875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 7.0, 8.0, 8.0, 11.0, 8.0, 18.0, 21.0, 38.0, 39.0, 64.0, 67.0, 93.0, 135.0, 203.0, 372.0, 866.0, 3503.0, 24868.0, 307248.0, 2647200.0, 142961.0, 14082.0, 2219.0, 666.0, 298.0, 193.0, 116.0, 96.0, 78.0, 48.0, 33.0, 31.0, 25.0, 22.0, 19.0, 17.0, 8.0, 8.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-14.03125, -13.5977783203125, -13.164306640625, -12.7308349609375, -12.29736328125, -11.8638916015625, -11.430419921875, -10.9969482421875, -10.5634765625, -10.1300048828125, -9.696533203125, -9.2630615234375, -8.82958984375, -8.3961181640625, -7.962646484375, -7.5291748046875, -7.095703125, -6.6622314453125, -6.228759765625, -5.7952880859375, -5.36181640625, -4.9283447265625, -4.494873046875, -4.0614013671875, -3.6279296875, -3.1944580078125, -2.760986328125, -2.3275146484375, -1.89404296875, -1.4605712890625, -1.027099609375, -0.5936279296875, -0.16015625, 0.2733154296875, 0.706787109375, 1.1402587890625, 1.57373046875, 2.0072021484375, 2.440673828125, 2.8741455078125, 3.3076171875, 3.7410888671875, 4.174560546875, 4.6080322265625, 5.04150390625, 5.4749755859375, 5.908447265625, 6.3419189453125, 6.775390625, 7.2088623046875, 7.642333984375, 8.0758056640625, 8.50927734375, 8.9427490234375, 9.376220703125, 9.8096923828125, 10.2431640625, 10.6766357421875, 11.110107421875, 11.5435791015625, 11.97705078125, 12.4105224609375, 12.843994140625, 13.2774658203125, 13.7109375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 7.0, 42.0, 319.0, 486.0, 151.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.276069641113281, -9.38602352142334, -6.495977401733398, -3.605931282043457, -0.7158851623535156, 2.174160957336426, 5.064207077026367, 7.954254150390625, 10.84429931640625, 13.734345436096191, 16.624391555786133, 19.51443862915039, 22.404483795166016, 25.29452896118164, 28.1845760345459, 31.074623107910156, 33.96466827392578, 36.854713439941406, 39.74475860595703, 42.63480758666992, 45.52485275268555, 48.41489791870117, 51.30494689941406, 54.19499206542969, 57.08503723144531, 59.97508239746094, 62.86512756347656, 65.75517272949219, 68.64521789550781, 71.53527069091797, 74.4253158569336, 77.31536102294922, 80.20539855957031, 83.09544372558594, 85.98548889160156, 88.87553405761719, 91.76557922363281, 94.65563201904297, 97.5456771850586, 100.43572235107422, 103.32576751708984, 106.21581268310547, 109.1058578491211, 111.99590301513672, 114.88595581054688, 117.7760009765625, 120.66604614257812, 123.55609130859375, 126.44613647460938, 129.336181640625, 132.22622680664062, 135.11627197265625, 138.00631713867188, 140.8963623046875, 143.78640747070312, 146.67645263671875, 149.56649780273438, 152.45654296875, 155.34658813476562, 158.23663330078125, 161.12667846679688, 164.0167236328125, 166.90676879882812, 169.79681396484375, 172.68687438964844]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 2.0, 4.0, 10.0, 6.0, 9.0, 15.0, 9.0, 12.0, 15.0, 17.0, 20.0, 26.0, 25.0, 30.0, 34.0, 24.0, 37.0, 33.0, 35.0, 39.0, 39.0, 48.0, 44.0, 40.0, 38.0, 39.0, 31.0, 27.0, 28.0, 40.0, 23.0, 36.0, 27.0, 28.0, 13.0, 22.0, 13.0, 13.0, 13.0, 8.0, 4.0, 8.0, 3.0, 1.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.122787475585938, -18.476417541503906, -17.830047607421875, -17.183677673339844, -16.537307739257812, -15.890938758850098, -15.244569778442383, -14.598199844360352, -13.95182991027832, -13.305459976196289, -12.659090042114258, -12.012721061706543, -11.366351127624512, -10.71998119354248, -10.073612213134766, -9.427242279052734, -8.780872344970703, -8.134502410888672, -7.488132953643799, -6.841763496398926, -6.1953935623168945, -5.549023628234863, -4.90265417098999, -4.256284713745117, -3.609914779663086, -2.963545083999634, -2.3171753883361816, -1.6708056926727295, -1.0244359970092773, -0.3780663013458252, 0.26830339431762695, 0.9146728515625, 1.5610427856445312, 2.2074124813079834, 2.8537821769714355, 3.5001518726348877, 4.14652156829834, 4.792891502380371, 5.439260959625244, 6.085630416870117, 6.732000350952148, 7.37837028503418, 8.024740219116211, 8.671109199523926, 9.317479133605957, 9.963849067687988, 10.610218048095703, 11.256587982177734, 11.902957916259766, 12.549327850341797, 13.195697784423828, 13.842066764831543, 14.488436698913574, 15.134806632995605, 15.78117561340332, 16.42754554748535, 17.073915481567383, 17.720285415649414, 18.366655349731445, 19.013025283813477, 19.659393310546875, 20.305763244628906, 20.952133178710938, 21.59850311279297, 22.244873046875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 8.0, 8.0, 9.0, 10.0, 14.0, 17.0, 27.0, 16.0, 20.0, 35.0, 27.0, 36.0, 59.0, 42.0, 45.0, 37.0, 52.0, 43.0, 48.0, 43.0, 44.0, 45.0, 47.0, 38.0, 27.0, 34.0, 33.0, 19.0, 23.0, 25.0, 13.0, 12.0, 15.0, 5.0, 9.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.171875, -4.02685546875, -3.8818359375, -3.73681640625, -3.591796875, -3.44677734375, -3.3017578125, -3.15673828125, -3.01171875, -2.86669921875, -2.7216796875, -2.57666015625, -2.431640625, -2.28662109375, -2.1416015625, -1.99658203125, -1.8515625, -1.70654296875, -1.5615234375, -1.41650390625, -1.271484375, -1.12646484375, -0.9814453125, -0.83642578125, -0.69140625, -0.54638671875, -0.4013671875, -0.25634765625, -0.111328125, 0.03369140625, 0.1787109375, 0.32373046875, 0.46875, 0.61376953125, 0.7587890625, 0.90380859375, 1.048828125, 1.19384765625, 1.3388671875, 1.48388671875, 1.62890625, 1.77392578125, 1.9189453125, 2.06396484375, 2.208984375, 2.35400390625, 2.4990234375, 2.64404296875, 2.7890625, 2.93408203125, 3.0791015625, 3.22412109375, 3.369140625, 3.51416015625, 3.6591796875, 3.80419921875, 3.94921875, 4.09423828125, 4.2392578125, 4.38427734375, 4.529296875, 4.67431640625, 4.8193359375, 4.96435546875, 5.109375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 8.0, 12.0, 12.0, 19.0, 21.0, 28.0, 41.0, 49.0, 79.0, 90.0, 131.0, 229.0, 361.0, 558.0, 6080.0, 4179324.0, 5643.0, 534.0, 328.0, 219.0, 126.0, 93.0, 80.0, 51.0, 42.0, 32.0, 18.0, 20.0, 10.0, 14.0, 8.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.3125, -64.8642578125, -62.416015625, -59.9677734375, -57.51953125, -55.0712890625, -52.623046875, -50.1748046875, -47.7265625, -45.2783203125, -42.830078125, -40.3818359375, -37.93359375, -35.4853515625, -33.037109375, -30.5888671875, -28.140625, -25.6923828125, -23.244140625, -20.7958984375, -18.34765625, -15.8994140625, -13.451171875, -11.0029296875, -8.5546875, -6.1064453125, -3.658203125, -1.2099609375, 1.23828125, 3.6865234375, 6.134765625, 8.5830078125, 11.03125, 13.4794921875, 15.927734375, 18.3759765625, 20.82421875, 23.2724609375, 25.720703125, 28.1689453125, 30.6171875, 33.0654296875, 35.513671875, 37.9619140625, 40.41015625, 42.8583984375, 45.306640625, 47.7548828125, 50.203125, 52.6513671875, 55.099609375, 57.5478515625, 59.99609375, 62.4443359375, 64.892578125, 67.3408203125, 69.7890625, 72.2373046875, 74.685546875, 77.1337890625, 79.58203125, 82.0302734375, 84.478515625, 86.9267578125, 89.375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 4.0, 5.0, 9.0, 13.0, 17.0, 19.0, 22.0, 34.0, 37.0, 50.0, 77.0, 87.0, 105.0, 159.0, 245.0, 330.0, 473.0, 607.0, 553.0, 352.0, 214.0, 162.0, 126.0, 90.0, 57.0, 54.0, 34.0, 24.0, 24.0, 19.0, 11.0, 14.0, 11.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.26953125, -5.08502197265625, -4.9005126953125, -4.71600341796875, -4.531494140625, -4.34698486328125, -4.1624755859375, -3.97796630859375, -3.79345703125, -3.60894775390625, -3.4244384765625, -3.23992919921875, -3.055419921875, -2.87091064453125, -2.6864013671875, -2.50189208984375, -2.3173828125, -2.13287353515625, -1.9483642578125, -1.76385498046875, -1.579345703125, -1.39483642578125, -1.2103271484375, -1.02581787109375, -0.84130859375, -0.65679931640625, -0.4722900390625, -0.28778076171875, -0.103271484375, 0.08123779296875, 0.2657470703125, 0.45025634765625, 0.634765625, 0.81927490234375, 1.0037841796875, 1.18829345703125, 1.372802734375, 1.55731201171875, 1.7418212890625, 1.92633056640625, 2.11083984375, 2.29534912109375, 2.4798583984375, 2.66436767578125, 2.848876953125, 3.03338623046875, 3.2178955078125, 3.40240478515625, 3.5869140625, 3.77142333984375, 3.9559326171875, 4.14044189453125, 4.324951171875, 4.50946044921875, 4.6939697265625, 4.87847900390625, 5.06298828125, 5.24749755859375, 5.4320068359375, 5.61651611328125, 5.801025390625, 5.98553466796875, 6.1700439453125, 6.35455322265625, 6.5390625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 5.0, 5.0, 11.0, 7.0, 12.0, 13.0, 8.0, 15.0, 24.0, 27.0, 26.0, 44.0, 39.0, 55.0, 117.0, 258.0, 925.0, 11272.0, 487914.0, 3638439.0, 51561.0, 2545.0, 451.0, 162.0, 73.0, 62.0, 44.0, 36.0, 30.0, 17.0, 15.0, 14.0, 14.0, 11.0, 8.0, 12.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.421875, -29.604736328125, -28.78759765625, -27.970458984375, -27.1533203125, -26.336181640625, -25.51904296875, -24.701904296875, -23.884765625, -23.067626953125, -22.25048828125, -21.433349609375, -20.6162109375, -19.799072265625, -18.98193359375, -18.164794921875, -17.34765625, -16.530517578125, -15.71337890625, -14.896240234375, -14.0791015625, -13.261962890625, -12.44482421875, -11.627685546875, -10.810546875, -9.993408203125, -9.17626953125, -8.359130859375, -7.5419921875, -6.724853515625, -5.90771484375, -5.090576171875, -4.2734375, -3.456298828125, -2.63916015625, -1.822021484375, -1.0048828125, -0.187744140625, 0.62939453125, 1.446533203125, 2.263671875, 3.080810546875, 3.89794921875, 4.715087890625, 5.5322265625, 6.349365234375, 7.16650390625, 7.983642578125, 8.80078125, 9.617919921875, 10.43505859375, 11.252197265625, 12.0693359375, 12.886474609375, 13.70361328125, 14.520751953125, 15.337890625, 16.155029296875, 16.97216796875, 17.789306640625, 18.6064453125, 19.423583984375, 20.24072265625, 21.057861328125, 21.875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 11.0, 114.0, 447.0, 343.0, 94.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.72113037109375, -27.287437438964844, -23.853742599487305, -20.420047760009766, -16.98635482788086, -13.552661895751953, -10.118967056274414, -6.685272216796875, -3.2515792846679688, 0.1821146011352539, 3.6158084869384766, 7.049502372741699, 10.483196258544922, 13.916889190673828, 17.350584030151367, 20.784278869628906, 24.217971801757812, 27.65166473388672, 31.085359573364258, 34.5190544128418, 37.9527473449707, 41.38644027709961, 44.82013702392578, 48.25382995605469, 51.687522888183594, 55.1212158203125, 58.554908752441406, 61.98860549926758, 65.42230224609375, 68.85598754882812, 72.28968811035156, 75.72338104248047, 79.15707397460938, 82.59076690673828, 86.02445983886719, 89.4581527709961, 92.891845703125, 96.32554626464844, 99.75923919677734, 103.19293212890625, 106.62662506103516, 110.06031799316406, 113.49401092529297, 116.92770385742188, 120.36140441894531, 123.79508972167969, 127.22879028320312, 130.6624755859375, 134.09617614746094, 137.52987670898438, 140.96356201171875, 144.3972625732422, 147.83094787597656, 151.2646484375, 154.69833374023438, 158.1320343017578, 161.56573486328125, 164.9994354248047, 168.43312072753906, 171.8668212890625, 175.30050659179688, 178.7342071533203, 182.1678924560547, 185.60159301757812, 189.0352783203125]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 2.0, 3.0, 7.0, 13.0, 11.0, 15.0, 19.0, 17.0, 20.0, 17.0, 32.0, 40.0, 29.0, 48.0, 35.0, 45.0, 41.0, 32.0, 38.0, 56.0, 43.0, 36.0, 49.0, 48.0, 32.0, 35.0, 23.0, 27.0, 32.0, 29.0, 22.0, 21.0, 16.0, 16.0, 6.0, 16.0, 8.0, 5.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.727737426757812, -20.0755615234375, -19.423385620117188, -18.771209716796875, -18.119033813476562, -17.46685791015625, -16.814682006835938, -16.162506103515625, -15.510330200195312, -14.858154296875, -14.205978393554688, -13.553802490234375, -12.901626586914062, -12.24945068359375, -11.597274780273438, -10.945098876953125, -10.292922973632812, -9.6407470703125, -8.988571166992188, -8.336395263671875, -7.6842193603515625, -7.03204345703125, -6.3798675537109375, -5.727691650390625, -5.0755157470703125, -4.42333984375, -3.7711639404296875, -3.118988037109375, -2.4668121337890625, -1.81463623046875, -1.1624603271484375, -0.510284423828125, 0.1418895721435547, 0.7940654754638672, 1.4462413787841797, 2.098417282104492, 2.7505931854248047, 3.402769088745117, 4.05494499206543, 4.707120895385742, 5.359296798706055, 6.011472702026367, 6.66364860534668, 7.315824508666992, 7.968000411987305, 8.620176315307617, 9.27235221862793, 9.924528121948242, 10.576704025268555, 11.228879928588867, 11.88105583190918, 12.533231735229492, 13.185407638549805, 13.837583541870117, 14.48975944519043, 15.141935348510742, 15.794111251831055, 16.446287155151367, 17.09846305847168, 17.750638961791992, 18.402814865112305, 19.054990768432617, 19.70716667175293, 20.359342575073242, 21.011518478393555]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 7.0, 4.0, 7.0, 9.0, 15.0, 13.0, 11.0, 24.0, 20.0, 25.0, 32.0, 29.0, 24.0, 30.0, 43.0, 40.0, 56.0, 51.0, 58.0, 41.0, 49.0, 56.0, 35.0, 47.0, 33.0, 37.0, 29.0, 31.0, 25.0, 28.0, 20.0, 17.0, 25.0, 10.0, 6.0, 6.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.30596923828125, -4.1627197265625, -4.01947021484375, -3.876220703125, -3.73297119140625, -3.5897216796875, -3.44647216796875, -3.30322265625, -3.15997314453125, -3.0167236328125, -2.87347412109375, -2.730224609375, -2.58697509765625, -2.4437255859375, -2.30047607421875, -2.1572265625, -2.01397705078125, -1.8707275390625, -1.72747802734375, -1.584228515625, -1.44097900390625, -1.2977294921875, -1.15447998046875, -1.01123046875, -0.86798095703125, -0.7247314453125, -0.58148193359375, -0.438232421875, -0.29498291015625, -0.1517333984375, -0.00848388671875, 0.134765625, 0.27801513671875, 0.4212646484375, 0.56451416015625, 0.707763671875, 0.85101318359375, 0.9942626953125, 1.13751220703125, 1.28076171875, 1.42401123046875, 1.5672607421875, 1.71051025390625, 1.853759765625, 1.99700927734375, 2.1402587890625, 2.28350830078125, 2.4267578125, 2.57000732421875, 2.7132568359375, 2.85650634765625, 2.999755859375, 3.14300537109375, 3.2862548828125, 3.42950439453125, 3.57275390625, 3.71600341796875, 3.8592529296875, 4.00250244140625, 4.145751953125, 4.28900146484375, 4.4322509765625, 4.57550048828125, 4.71875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 9.0, 2.0, 11.0, 13.0, 25.0, 42.0, 42.0, 70.0, 107.0, 176.0, 250.0, 425.0, 666.0, 1018.0, 1805.0, 3108.0, 5240.0, 8930.0, 15730.0, 27060.0, 47339.0, 92936.0, 244275.0, 344691.0, 120125.0, 57798.0, 32042.0, 18570.0, 10673.0, 6211.0, 3529.0, 2168.0, 1309.0, 783.0, 499.0, 321.0, 210.0, 116.0, 80.0, 48.0, 39.0, 20.0, 22.0, 7.0, 11.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029083251953125, -0.028149843215942383, -0.027216434478759766, -0.02628302574157715, -0.02534961700439453, -0.024416208267211914, -0.023482799530029297, -0.02254939079284668, -0.021615982055664062, -0.020682573318481445, -0.019749164581298828, -0.01881575584411621, -0.017882347106933594, -0.016948938369750977, -0.01601552963256836, -0.015082120895385742, -0.014148712158203125, -0.013215303421020508, -0.01228189468383789, -0.011348485946655273, -0.010415077209472656, -0.009481668472290039, -0.008548259735107422, -0.007614850997924805, -0.0066814422607421875, -0.00574803352355957, -0.004814624786376953, -0.003881216049194336, -0.0029478073120117188, -0.0020143985748291016, -0.0010809898376464844, -0.0001475811004638672, 0.00078582763671875, 0.0017192363739013672, 0.0026526451110839844, 0.0035860538482666016, 0.004519462585449219, 0.005452871322631836, 0.006386280059814453, 0.00731968879699707, 0.008253097534179688, 0.009186506271362305, 0.010119915008544922, 0.011053323745727539, 0.011986732482910156, 0.012920141220092773, 0.01385354995727539, 0.014786958694458008, 0.015720367431640625, 0.016653776168823242, 0.01758718490600586, 0.018520593643188477, 0.019454002380371094, 0.02038741111755371, 0.021320819854736328, 0.022254228591918945, 0.023187637329101562, 0.02412104606628418, 0.025054454803466797, 0.025987863540649414, 0.02692127227783203, 0.02785468101501465, 0.028788089752197266, 0.029721498489379883, 0.0306549072265625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 13.0, 14.0, 11.0, 12.0, 12.0, 15.0, 15.0, 15.0, 14.0, 24.0, 31.0, 16.0, 30.0, 28.0, 36.0, 22.0, 42.0, 41.0, 34.0, 28.0, 1075.0, 29.0, 35.0, 45.0, 42.0, 38.0, 29.0, 25.0, 33.0, 29.0, 20.0, 18.0, 25.0, 17.0, 13.0, 18.0, 15.0, 8.0, 12.0, 7.0, 9.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.453125, -2.375396728515625, -2.29766845703125, -2.219940185546875, -2.1422119140625, -2.064483642578125, -1.98675537109375, -1.909027099609375, -1.831298828125, -1.753570556640625, -1.67584228515625, -1.598114013671875, -1.5203857421875, -1.442657470703125, -1.36492919921875, -1.287200927734375, -1.20947265625, -1.131744384765625, -1.05401611328125, -0.976287841796875, -0.8985595703125, -0.820831298828125, -0.74310302734375, -0.665374755859375, -0.587646484375, -0.509918212890625, -0.43218994140625, -0.354461669921875, -0.2767333984375, -0.199005126953125, -0.12127685546875, -0.043548583984375, 0.0341796875, 0.111907958984375, 0.18963623046875, 0.267364501953125, 0.3450927734375, 0.422821044921875, 0.50054931640625, 0.578277587890625, 0.656005859375, 0.733734130859375, 0.81146240234375, 0.889190673828125, 0.9669189453125, 1.044647216796875, 1.12237548828125, 1.200103759765625, 1.27783203125, 1.355560302734375, 1.43328857421875, 1.511016845703125, 1.5887451171875, 1.666473388671875, 1.74420166015625, 1.821929931640625, 1.899658203125, 1.977386474609375, 2.05511474609375, 2.132843017578125, 2.2105712890625, 2.288299560546875, 2.36602783203125, 2.443756103515625, 2.521484375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 7.0, 9.0, 24.0, 44.0, 43.0, 78.0, 126.0, 166.0, 249.0, 350.0, 542.0, 864.0, 1233.0, 1739.0, 2597.0, 3975.0, 5844.0, 8817.0, 13572.0, 20499.0, 31746.0, 50160.0, 85867.0, 173841.0, 1339521.0, 147214.0, 76879.0, 45936.0, 29106.0, 18932.0, 12415.0, 8157.0, 5528.0, 3621.0, 2484.0, 1632.0, 1116.0, 767.0, 495.0, 291.0, 190.0, 134.0, 109.0, 77.0, 47.0, 34.0, 14.0, 15.0, 9.0, 5.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.0153961181640625, -0.014920949935913086, -0.014445781707763672, -0.013970613479614258, -0.013495445251464844, -0.01302027702331543, -0.012545108795166016, -0.012069940567016602, -0.011594772338867188, -0.011119604110717773, -0.01064443588256836, -0.010169267654418945, -0.009694099426269531, -0.009218931198120117, -0.008743762969970703, -0.008268594741821289, -0.007793426513671875, -0.007318258285522461, -0.006843090057373047, -0.006367921829223633, -0.005892753601074219, -0.005417585372924805, -0.004942417144775391, -0.0044672489166259766, -0.0039920806884765625, -0.0035169124603271484, -0.0030417442321777344, -0.0025665760040283203, -0.0020914077758789062, -0.0016162395477294922, -0.0011410713195800781, -0.0006659030914306641, -0.00019073486328125, 0.00028443336486816406, 0.0007596015930175781, 0.0012347698211669922, 0.0017099380493164062, 0.0021851062774658203, 0.0026602745056152344, 0.0031354427337646484, 0.0036106109619140625, 0.0040857791900634766, 0.004560947418212891, 0.005036115646362305, 0.005511283874511719, 0.005986452102661133, 0.006461620330810547, 0.006936788558959961, 0.007411956787109375, 0.007887125015258789, 0.008362293243408203, 0.008837461471557617, 0.009312629699707031, 0.009787797927856445, 0.01026296615600586, 0.010738134384155273, 0.011213302612304688, 0.011688470840454102, 0.012163639068603516, 0.01263880729675293, 0.013113975524902344, 0.013589143753051758, 0.014064311981201172, 0.014539480209350586, 0.0150146484375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 200.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 467.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 193.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-07, -2.300366759300232e-07, -2.2165477275848389e-07, -2.1327286958694458e-07, -2.0489096641540527e-07, -1.9650906324386597e-07, -1.8812716007232666e-07, -1.7974525690078735e-07, -1.7136335372924805e-07, -1.6298145055770874e-07, -1.5459954738616943e-07, -1.4621764421463013e-07, -1.3783574104309082e-07, -1.2945383787155151e-07, -1.210719347000122e-07, -1.126900315284729e-07, -1.043081283569336e-07, -9.592622518539429e-08, -8.754432201385498e-08, -7.916241884231567e-08, -7.078051567077637e-08, -6.239861249923706e-08, -5.4016709327697754e-08, -4.563480615615845e-08, -3.725290298461914e-08, -2.8870999813079834e-08, -2.0489096641540527e-08, -1.210719347000122e-08, -3.725290298461914e-09, 4.6566128730773926e-09, 1.30385160446167e-08, 2.1420419216156006e-08, 2.9802322387695312e-08, 3.818422555923462e-08, 4.6566128730773926e-08, 5.494803190231323e-08, 6.332993507385254e-08, 7.171183824539185e-08, 8.009374141693115e-08, 8.847564458847046e-08, 9.685754776000977e-08, 1.0523945093154907e-07, 1.1362135410308838e-07, 1.2200325727462769e-07, 1.30385160446167e-07, 1.387670636177063e-07, 1.471489667892456e-07, 1.555308699607849e-07, 1.6391277313232422e-07, 1.7229467630386353e-07, 1.8067657947540283e-07, 1.8905848264694214e-07, 1.9744038581848145e-07, 2.0582228899002075e-07, 2.1420419216156006e-07, 2.2258609533309937e-07, 2.3096799850463867e-07, 2.39349901676178e-07, 2.477318048477173e-07, 2.561137080192566e-07, 2.644956111907959e-07, 2.728775143623352e-07, 2.812594175338745e-07, 2.896413207054138e-07, 2.980232238769531e-07]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 3.0, 9.0, 5.0, 4.0, 0.0, 0.0, 6.0, 28.0, 28.0, 3.0, 12.0, 5.0, 33.0, 18.0, 58.0, 96.0, 32.0, 119.0, 212.0, 172.0, 459.0, 3369.0, 145920.0, 893308.0, 3341.0, 464.0, 123.0, 196.0, 167.0, 50.0, 78.0, 74.0, 30.0, 40.0, 7.0, 9.0, 6.0, 17.0, 35.0, 4.0, 6.0, 2.0, 0.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.781650543212891e-06, -5.616806447505951e-06, -5.451962351799011e-06, -5.2871182560920715e-06, -5.122274160385132e-06, -4.957430064678192e-06, -4.7925859689712524e-06, -4.627741873264313e-06, -4.462897777557373e-06, -4.298053681850433e-06, -4.133209586143494e-06, -3.968365490436554e-06, -3.8035213947296143e-06, -3.6386772990226746e-06, -3.473833203315735e-06, -3.308989107608795e-06, -3.1441450119018555e-06, -2.9793009161949158e-06, -2.814456820487976e-06, -2.6496127247810364e-06, -2.4847686290740967e-06, -2.319924533367157e-06, -2.1550804376602173e-06, -1.9902363419532776e-06, -1.8253922462463379e-06, -1.6605481505393982e-06, -1.4957040548324585e-06, -1.3308599591255188e-06, -1.166015863418579e-06, -1.0011717677116394e-06, -8.363276720046997e-07, -6.7148357629776e-07, -5.066394805908203e-07, -3.417953848838806e-07, -1.7695128917694092e-07, -1.210719347000122e-08, 1.5273690223693848e-07, 3.175809979438782e-07, 4.824250936508179e-07, 6.472691893577576e-07, 8.121132850646973e-07, 9.76957380771637e-07, 1.1418014764785767e-06, 1.3066455721855164e-06, 1.471489667892456e-06, 1.6363337635993958e-06, 1.8011778593063354e-06, 1.966021955013275e-06, 2.130866050720215e-06, 2.2957101464271545e-06, 2.4605542421340942e-06, 2.625398337841034e-06, 2.7902424335479736e-06, 2.9550865292549133e-06, 3.119930624961853e-06, 3.2847747206687927e-06, 3.4496188163757324e-06, 3.614462912082672e-06, 3.779307007789612e-06, 3.9441511034965515e-06, 4.108995199203491e-06, 4.273839294910431e-06, 4.438683390617371e-06, 4.60352748632431e-06, 4.76837158203125e-06]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 8.0, 10.0, 18.0, 15.0, 13.0, 26.0, 756.0, 25.0, 26.0, 22.0, 26.0, 13.0, 10.0, 6.0, 6.0, 3.0, 9.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6370029243262252e-07, -1.5685598953041335e-07, -1.500117008390589e-07, -1.4316739793684974e-07, -1.363231092454953e-07, -1.2947880634328612e-07, -1.2263450344107696e-07, -1.1579021474972251e-07, -1.089459189529407e-07, -1.021016231561589e-07, -9.525732735937709e-08, -8.841303156259528e-08, -8.156872866038611e-08, -7.472443996903166e-08, -6.78801370668225e-08, -6.103584127004069e-08, -5.4191545473258884e-08, -4.734724967647708e-08, -4.050295387969527e-08, -3.365865453019978e-08, -2.6814358733417976e-08, -1.9970062936636168e-08, -1.3125763587140682e-08, -6.2814677903588745e-09, 5.62828006422933e-10, 7.40712469138316e-09, 1.4251421376343387e-08, 2.1095718949482034e-08, 2.794001474626384e-08, 3.478431054304565e-08, 4.1628609892541135e-08, 4.847290568932294e-08, 5.531720148610475e-08, 6.216149728288656e-08, 6.900579307966836e-08, 7.585009598187753e-08, 8.269438467323198e-08, 8.953868757544114e-08, 9.638298337222295e-08, 1.0322727916900476e-07, 1.1007157496578657e-07, 1.1691587076256837e-07, 1.2376017366477754e-07, 1.30604462356132e-07, 1.3744876525834115e-07, 1.442930539496956e-07, 1.5113735685190477e-07, 1.5798164554325922e-07, 1.6482594844546838e-07, 1.7167025134767755e-07, 1.78514540039032e-07, 1.8535884294124116e-07, 1.9220313163259561e-07, 1.9904743453480478e-07, 2.0589172322615923e-07, 2.127360261283684e-07, 2.1958032903057756e-07, 2.2642463193278672e-07, 2.3326892062414117e-07, 2.4011322352635034e-07, 2.469575122177048e-07, 2.5380180090905924e-07, 2.606461180221231e-07, 2.6749040671347757e-07, 2.74334695404832e-07]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 127.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 736.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 129.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1920928955078125e-07, -1.1455267667770386e-07, -1.0989606380462646e-07, -1.0523945093154907e-07, -1.0058283805847168e-07, -9.592622518539429e-08, -9.12696123123169e-08, -8.66129994392395e-08, -8.195638656616211e-08, -7.729977369308472e-08, -7.264316082000732e-08, -6.798654794692993e-08, -6.332993507385254e-08, -5.8673322200775146e-08, -5.4016709327697754e-08, -4.936009645462036e-08, -4.470348358154297e-08, -4.0046870708465576e-08, -3.5390257835388184e-08, -3.073364496231079e-08, -2.60770320892334e-08, -2.1420419216156006e-08, -1.6763806343078613e-08, -1.210719347000122e-08, -7.450580596923828e-09, -2.7939677238464355e-09, 1.862645149230957e-09, 6.51925802230835e-09, 1.1175870895385742e-08, 1.5832483768463135e-08, 2.0489096641540527e-08, 2.514570951461792e-08, 2.9802322387695312e-08, 3.4458935260772705e-08, 3.91155481338501e-08, 4.377216100692749e-08, 4.842877388000488e-08, 5.3085386753082275e-08, 5.774199962615967e-08, 6.239861249923706e-08, 6.705522537231445e-08, 7.171183824539185e-08, 7.636845111846924e-08, 8.102506399154663e-08, 8.568167686462402e-08, 9.033828973770142e-08, 9.499490261077881e-08, 9.96515154838562e-08, 1.043081283569336e-07, 1.0896474123001099e-07, 1.1362135410308838e-07, 1.1827796697616577e-07, 1.2293457984924316e-07, 1.2759119272232056e-07, 1.3224780559539795e-07, 1.3690441846847534e-07, 1.4156103134155273e-07, 1.4621764421463013e-07, 1.5087425708770752e-07, 1.555308699607849e-07, 1.601874828338623e-07, 1.648440957069397e-07, 1.695007085800171e-07, 1.7415732145309448e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 7.0, 4.0, 7.0, 9.0, 15.0, 13.0, 11.0, 24.0, 20.0, 25.0, 32.0, 29.0, 24.0, 30.0, 43.0, 40.0, 56.0, 51.0, 58.0, 41.0, 49.0, 56.0, 35.0, 47.0, 33.0, 37.0, 29.0, 31.0, 25.0, 28.0, 20.0, 17.0, 25.0, 10.0, 6.0, 6.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.30596923828125, -4.1627197265625, -4.01947021484375, -3.876220703125, -3.73297119140625, -3.5897216796875, -3.44647216796875, -3.30322265625, -3.15997314453125, -3.0167236328125, -2.87347412109375, -2.730224609375, -2.58697509765625, -2.4437255859375, -2.30047607421875, -2.1572265625, -2.01397705078125, -1.8707275390625, -1.72747802734375, -1.584228515625, -1.44097900390625, -1.2977294921875, -1.15447998046875, -1.01123046875, -0.86798095703125, -0.7247314453125, -0.58148193359375, -0.438232421875, -0.29498291015625, -0.1517333984375, -0.00848388671875, 0.134765625, 0.27801513671875, 0.4212646484375, 0.56451416015625, 0.707763671875, 0.85101318359375, 0.9942626953125, 1.13751220703125, 1.28076171875, 1.42401123046875, 1.5672607421875, 1.71051025390625, 1.853759765625, 1.99700927734375, 2.1402587890625, 2.28350830078125, 2.4267578125, 2.57000732421875, 2.7132568359375, 2.85650634765625, 2.999755859375, 3.14300537109375, 3.2862548828125, 3.42950439453125, 3.57275390625, 3.71600341796875, 3.8592529296875, 4.00250244140625, 4.145751953125, 4.28900146484375, 4.4322509765625, 4.57550048828125, 4.71875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 13.0, 8.0, 15.0, 19.0, 25.0, 48.0, 57.0, 81.0, 129.0, 193.0, 289.0, 363.0, 564.0, 823.0, 1272.0, 2126.0, 3418.0, 6139.0, 11013.0, 21808.0, 45896.0, 110402.0, 324522.0, 318895.0, 107943.0, 44931.0, 21308.0, 10836.0, 5923.0, 3444.0, 2078.0, 1395.0, 802.0, 563.0, 411.0, 248.0, 188.0, 98.0, 85.0, 50.0, 40.0, 28.0, 16.0, 12.0, 8.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-5.22265625, -5.05938720703125, -4.8961181640625, -4.73284912109375, -4.569580078125, -4.40631103515625, -4.2430419921875, -4.07977294921875, -3.91650390625, -3.75323486328125, -3.5899658203125, -3.42669677734375, -3.263427734375, -3.10015869140625, -2.9368896484375, -2.77362060546875, -2.6103515625, -2.44708251953125, -2.2838134765625, -2.12054443359375, -1.957275390625, -1.79400634765625, -1.6307373046875, -1.46746826171875, -1.30419921875, -1.14093017578125, -0.9776611328125, -0.81439208984375, -0.651123046875, -0.48785400390625, -0.3245849609375, -0.16131591796875, 0.001953125, 0.16522216796875, 0.3284912109375, 0.49176025390625, 0.655029296875, 0.81829833984375, 0.9815673828125, 1.14483642578125, 1.30810546875, 1.47137451171875, 1.6346435546875, 1.79791259765625, 1.961181640625, 2.12445068359375, 2.2877197265625, 2.45098876953125, 2.6142578125, 2.77752685546875, 2.9407958984375, 3.10406494140625, 3.267333984375, 3.43060302734375, 3.5938720703125, 3.75714111328125, 3.92041015625, 4.08367919921875, 4.2469482421875, 4.41021728515625, 4.573486328125, 4.73675537109375, 4.9000244140625, 5.06329345703125, 5.2265625]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 5.0, 12.0, 14.0, 14.0, 21.0, 27.0, 26.0, 41.0, 40.0, 52.0, 69.0, 78.0, 130.0, 290.0, 1539.0, 207.0, 109.0, 69.0, 56.0, 44.0, 41.0, 31.0, 28.0, 22.0, 22.0, 16.0, 9.0, 13.0, 3.0, 3.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.8046875, -13.41357421875, -13.0224609375, -12.63134765625, -12.240234375, -11.84912109375, -11.4580078125, -11.06689453125, -10.67578125, -10.28466796875, -9.8935546875, -9.50244140625, -9.111328125, -8.72021484375, -8.3291015625, -7.93798828125, -7.546875, -7.15576171875, -6.7646484375, -6.37353515625, -5.982421875, -5.59130859375, -5.2001953125, -4.80908203125, -4.41796875, -4.02685546875, -3.6357421875, -3.24462890625, -2.853515625, -2.46240234375, -2.0712890625, -1.68017578125, -1.2890625, -0.89794921875, -0.5068359375, -0.11572265625, 0.275390625, 0.66650390625, 1.0576171875, 1.44873046875, 1.83984375, 2.23095703125, 2.6220703125, 3.01318359375, 3.404296875, 3.79541015625, 4.1865234375, 4.57763671875, 4.96875, 5.35986328125, 5.7509765625, 6.14208984375, 6.533203125, 6.92431640625, 7.3154296875, 7.70654296875, 8.09765625, 8.48876953125, 8.8798828125, 9.27099609375, 9.662109375, 10.05322265625, 10.4443359375, 10.83544921875, 11.2265625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 9.0, 7.0, 7.0, 18.0, 23.0, 35.0, 75.0, 110.0, 174.0, 333.0, 934.0, 12484.0, 3113947.0, 15693.0, 996.0, 386.0, 168.0, 104.0, 62.0, 38.0, 27.0, 12.0, 12.0, 9.0, 8.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.8125, -42.54345703125, -41.2744140625, -40.00537109375, -38.736328125, -37.46728515625, -36.1982421875, -34.92919921875, -33.66015625, -32.39111328125, -31.1220703125, -29.85302734375, -28.583984375, -27.31494140625, -26.0458984375, -24.77685546875, -23.5078125, -22.23876953125, -20.9697265625, -19.70068359375, -18.431640625, -17.16259765625, -15.8935546875, -14.62451171875, -13.35546875, -12.08642578125, -10.8173828125, -9.54833984375, -8.279296875, -7.01025390625, -5.7412109375, -4.47216796875, -3.203125, -1.93408203125, -0.6650390625, 0.60400390625, 1.873046875, 3.14208984375, 4.4111328125, 5.68017578125, 6.94921875, 8.21826171875, 9.4873046875, 10.75634765625, 12.025390625, 13.29443359375, 14.5634765625, 15.83251953125, 17.1015625, 18.37060546875, 19.6396484375, 20.90869140625, 22.177734375, 23.44677734375, 24.7158203125, 25.98486328125, 27.25390625, 28.52294921875, 29.7919921875, 31.06103515625, 32.330078125, 33.59912109375, 34.8681640625, 36.13720703125, 37.40625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 49.0, 281.0, 427.0, 204.0, 39.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.09678268432617, -43.83516311645508, -41.57353973388672, -39.311920166015625, -37.05030059814453, -34.78867721557617, -32.52705764770508, -30.26543617248535, -28.003814697265625, -25.7421932220459, -23.480571746826172, -21.218952178955078, -18.95733070373535, -16.695709228515625, -14.434088706970215, -12.172468185424805, -9.910846710205078, -7.64922571182251, -5.387604713439941, -3.125983715057373, -0.8643627166748047, 1.3972587585449219, 3.658879280090332, 5.920499801635742, 8.182121276855469, 10.443742752075195, 12.705363273620605, 14.966983795166016, 17.228605270385742, 19.49022674560547, 21.751846313476562, 24.01346778869629, 26.27508544921875, 28.536706924438477, 30.798328399658203, 33.0599479675293, 35.321571350097656, 37.58319091796875, 39.844810485839844, 42.10643005371094, 44.3680534362793, 46.62967300415039, 48.89129638671875, 51.152915954589844, 53.41453552246094, 55.6761589050293, 57.93777847290039, 60.19940185546875, 62.461021423339844, 64.72264099121094, 66.98426055908203, 69.24588775634766, 71.50750732421875, 73.76912689208984, 76.03074645996094, 78.29236602783203, 80.55398559570312, 82.81560516357422, 85.07722473144531, 87.33885192871094, 89.60047149658203, 91.86209106445312, 94.12371063232422, 96.38533020019531, 98.64695739746094]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 5.0, 13.0, 10.0, 6.0, 7.0, 11.0, 14.0, 21.0, 18.0, 21.0, 26.0, 30.0, 26.0, 33.0, 27.0, 33.0, 35.0, 33.0, 45.0, 44.0, 39.0, 40.0, 37.0, 49.0, 25.0, 42.0, 37.0, 28.0, 33.0, 31.0, 23.0, 25.0, 18.0, 26.0, 12.0, 11.0, 19.0, 12.0, 6.0, 8.0, 4.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.42755889892578, -23.595754623413086, -22.763952255249023, -21.932147979736328, -21.100343704223633, -20.268539428710938, -19.436737060546875, -18.60493278503418, -17.773128509521484, -16.94132423400879, -16.109521865844727, -15.277717590332031, -14.445913314819336, -13.614109992980957, -12.782306671142578, -11.950502395629883, -11.11870002746582, -10.286896705627441, -9.455092430114746, -8.623289108276367, -7.79148530960083, -6.959681510925293, -6.127878189086914, -5.296074390411377, -4.46427059173584, -3.6324667930603027, -2.8006632328033447, -1.9688596725463867, -1.1370558738708496, -0.3052520751953125, 0.5265512466430664, 1.3583550453186035, 2.1901588439941406, 3.0219626426696777, 3.8537662029266357, 4.685569763183594, 5.517373561859131, 6.349177360534668, 7.180980682373047, 8.012784957885742, 8.844588279724121, 9.6763916015625, 10.508195877075195, 11.339999198913574, 12.171802520751953, 13.003606796264648, 13.835410118103027, 14.667213439941406, 15.499017715454102, 16.330821990966797, 17.16262435913086, 17.994428634643555, 18.82623291015625, 19.658035278320312, 20.489839553833008, 21.321643829345703, 22.153446197509766, 22.98525047302246, 23.817052841186523, 24.64885711669922, 25.480661392211914, 26.31246566772461, 27.144268035888672, 27.976072311401367, 28.807876586914062]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 7.0, 5.0, 11.0, 14.0, 9.0, 12.0, 15.0, 19.0, 26.0, 19.0, 27.0, 33.0, 34.0, 37.0, 41.0, 41.0, 49.0, 35.0, 64.0, 45.0, 53.0, 62.0, 36.0, 39.0, 33.0, 42.0, 31.0, 30.0, 21.0, 21.0, 22.0, 10.0, 16.0, 11.0, 12.0, 6.0, 7.0, 3.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.14453125, -4.000732421875, -3.85693359375, -3.713134765625, -3.5693359375, -3.425537109375, -3.28173828125, -3.137939453125, -2.994140625, -2.850341796875, -2.70654296875, -2.562744140625, -2.4189453125, -2.275146484375, -2.13134765625, -1.987548828125, -1.84375, -1.699951171875, -1.55615234375, -1.412353515625, -1.2685546875, -1.124755859375, -0.98095703125, -0.837158203125, -0.693359375, -0.549560546875, -0.40576171875, -0.261962890625, -0.1181640625, 0.025634765625, 0.16943359375, 0.313232421875, 0.45703125, 0.600830078125, 0.74462890625, 0.888427734375, 1.0322265625, 1.176025390625, 1.31982421875, 1.463623046875, 1.607421875, 1.751220703125, 1.89501953125, 2.038818359375, 2.1826171875, 2.326416015625, 2.47021484375, 2.614013671875, 2.7578125, 2.901611328125, 3.04541015625, 3.189208984375, 3.3330078125, 3.476806640625, 3.62060546875, 3.764404296875, 3.908203125, 4.052001953125, 4.19580078125, 4.339599609375, 4.4833984375, 4.627197265625, 4.77099609375, 4.914794921875, 5.05859375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 2.0, 9.0, 14.0, 15.0, 21.0, 28.0, 41.0, 53.0, 63.0, 95.0, 144.0, 209.0, 374.0, 636.0, 1074.0, 2201.0, 4731.0, 12942.0, 52142.0, 429107.0, 2463962.0, 1074655.0, 116463.0, 21732.0, 7087.0, 2996.0, 1362.0, 774.0, 455.0, 284.0, 187.0, 118.0, 69.0, 55.0, 48.0, 33.0, 20.0, 19.0, 14.0, 14.0, 6.0, 5.0, 10.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.703125, -7.44384765625, -7.1845703125, -6.92529296875, -6.666015625, -6.40673828125, -6.1474609375, -5.88818359375, -5.62890625, -5.36962890625, -5.1103515625, -4.85107421875, -4.591796875, -4.33251953125, -4.0732421875, -3.81396484375, -3.5546875, -3.29541015625, -3.0361328125, -2.77685546875, -2.517578125, -2.25830078125, -1.9990234375, -1.73974609375, -1.48046875, -1.22119140625, -0.9619140625, -0.70263671875, -0.443359375, -0.18408203125, 0.0751953125, 0.33447265625, 0.59375, 0.85302734375, 1.1123046875, 1.37158203125, 1.630859375, 1.89013671875, 2.1494140625, 2.40869140625, 2.66796875, 2.92724609375, 3.1865234375, 3.44580078125, 3.705078125, 3.96435546875, 4.2236328125, 4.48291015625, 4.7421875, 5.00146484375, 5.2607421875, 5.52001953125, 5.779296875, 6.03857421875, 6.2978515625, 6.55712890625, 6.81640625, 7.07568359375, 7.3349609375, 7.59423828125, 7.853515625, 8.11279296875, 8.3720703125, 8.63134765625, 8.890625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 7.0, 2.0, 5.0, 11.0, 12.0, 13.0, 19.0, 18.0, 32.0, 43.0, 37.0, 64.0, 81.0, 79.0, 128.0, 170.0, 191.0, 254.0, 309.0, 413.0, 417.0, 385.0, 317.0, 230.0, 155.0, 155.0, 96.0, 92.0, 67.0, 50.0, 42.0, 44.0, 37.0, 22.0, 13.0, 18.0, 14.0, 8.0, 9.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.11737060546875, -4.9534912109375, -4.78961181640625, -4.625732421875, -4.46185302734375, -4.2979736328125, -4.13409423828125, -3.97021484375, -3.80633544921875, -3.6424560546875, -3.47857666015625, -3.314697265625, -3.15081787109375, -2.9869384765625, -2.82305908203125, -2.6591796875, -2.49530029296875, -2.3314208984375, -2.16754150390625, -2.003662109375, -1.83978271484375, -1.6759033203125, -1.51202392578125, -1.34814453125, -1.18426513671875, -1.0203857421875, -0.85650634765625, -0.692626953125, -0.52874755859375, -0.3648681640625, -0.20098876953125, -0.037109375, 0.12677001953125, 0.2906494140625, 0.45452880859375, 0.618408203125, 0.78228759765625, 0.9461669921875, 1.11004638671875, 1.27392578125, 1.43780517578125, 1.6016845703125, 1.76556396484375, 1.929443359375, 2.09332275390625, 2.2572021484375, 2.42108154296875, 2.5849609375, 2.74884033203125, 2.9127197265625, 3.07659912109375, 3.240478515625, 3.40435791015625, 3.5682373046875, 3.73211669921875, 3.89599609375, 4.05987548828125, 4.2237548828125, 4.38763427734375, 4.551513671875, 4.71539306640625, 4.8792724609375, 5.04315185546875, 5.20703125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 10.0, 18.0, 16.0, 36.0, 47.0, 70.0, 109.0, 146.0, 221.0, 360.0, 629.0, 1133.0, 2626.0, 7608.0, 34143.0, 221676.0, 2034447.0, 1662905.0, 186803.0, 29618.0, 6825.0, 2275.0, 984.0, 585.0, 337.0, 207.0, 125.0, 95.0, 67.0, 42.0, 20.0, 21.0, 16.0, 13.0, 11.0, 8.0, 4.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.33984375, -7.05706787109375, -6.7742919921875, -6.49151611328125, -6.208740234375, -5.92596435546875, -5.6431884765625, -5.36041259765625, -5.07763671875, -4.79486083984375, -4.5120849609375, -4.22930908203125, -3.946533203125, -3.66375732421875, -3.3809814453125, -3.09820556640625, -2.8154296875, -2.53265380859375, -2.2498779296875, -1.96710205078125, -1.684326171875, -1.40155029296875, -1.1187744140625, -0.83599853515625, -0.55322265625, -0.27044677734375, 0.0123291015625, 0.29510498046875, 0.577880859375, 0.86065673828125, 1.1434326171875, 1.42620849609375, 1.708984375, 1.99176025390625, 2.2745361328125, 2.55731201171875, 2.840087890625, 3.12286376953125, 3.4056396484375, 3.68841552734375, 3.97119140625, 4.25396728515625, 4.5367431640625, 4.81951904296875, 5.102294921875, 5.38507080078125, 5.6678466796875, 5.95062255859375, 6.2333984375, 6.51617431640625, 6.7989501953125, 7.08172607421875, 7.364501953125, 7.64727783203125, 7.9300537109375, 8.21282958984375, 8.49560546875, 8.77838134765625, 9.0611572265625, 9.34393310546875, 9.626708984375, 9.90948486328125, 10.1922607421875, 10.47503662109375, 10.7578125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 43.0, 409.0, 498.0, 61.0, 2.0, 1.0, 2.0], "bins": [-292.6775207519531, -287.7196044921875, -282.76165771484375, -277.8037414550781, -272.8457946777344, -267.88787841796875, -262.929931640625, -257.9720153808594, -253.01406860351562, -248.05613708496094, -243.09820556640625, -238.14027404785156, -233.18234252929688, -228.2244110107422, -223.2664794921875, -218.30856323242188, -213.3506317138672, -208.3927001953125, -203.4347686767578, -198.47683715820312, -193.51890563964844, -188.56097412109375, -183.60304260253906, -178.64511108398438, -173.68719482421875, -168.72926330566406, -163.77133178710938, -158.8134002685547, -153.85546875, -148.8975372314453, -143.93960571289062, -138.981689453125, -134.02374267578125, -129.06581115722656, -124.10787963867188, -119.14994812011719, -114.1920166015625, -109.23408508300781, -104.27616119384766, -99.31822967529297, -94.36029052734375, -89.40235900878906, -84.44442749023438, -79.48649597167969, -74.528564453125, -69.57063293457031, -64.61270904541016, -59.65477752685547, -54.69684600830078, -49.738914489746094, -44.780982971191406, -39.823055267333984, -34.8651237487793, -29.90719223022461, -24.949262619018555, -19.9913330078125, -15.033403396606445, -10.075472831726074, -5.117542266845703, -0.15961170196533203, 4.798318862915039, 9.756250381469727, 14.714179992675781, 19.672109603881836, 24.630041122436523]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 5.0, 5.0, 7.0, 8.0, 14.0, 14.0, 20.0, 19.0, 21.0, 15.0, 27.0, 25.0, 28.0, 35.0, 39.0, 48.0, 64.0, 35.0, 35.0, 47.0, 48.0, 49.0, 46.0, 42.0, 47.0, 34.0, 31.0, 29.0, 27.0, 20.0, 31.0, 17.0, 19.0, 17.0, 16.0, 13.0, 7.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.451316833496094, -28.645355224609375, -27.839391708374023, -27.033430099487305, -26.227468490600586, -25.421504974365234, -24.615543365478516, -23.809581756591797, -23.003620147705078, -22.19765853881836, -21.391695022583008, -20.58573341369629, -19.77977180480957, -18.97380828857422, -18.1678466796875, -17.36188507080078, -16.555923461914062, -15.749960899353027, -14.943999290466309, -14.138036727905273, -13.332075119018555, -12.52611255645752, -11.720149993896484, -10.914188385009766, -10.108224868774414, -9.302262306213379, -8.49630069732666, -7.690338134765625, -6.884376525878906, -6.078413963317871, -5.272451877593994, -4.466489791870117, -3.6605281829833984, -2.8545660972595215, -2.0486040115356445, -1.2426416873931885, -0.4366796016693115, 0.36928272247314453, 1.1752448081970215, 1.9812068939208984, 2.7871689796447754, 3.5931310653686523, 4.399093151092529, 5.205055236816406, 6.011017799377441, 6.816979885101318, 7.622941970825195, 8.428903579711914, 9.23486614227295, 10.040828704833984, 10.846790313720703, 11.652752876281738, 12.458714485168457, 13.264677047729492, 14.070638656616211, 14.876601219177246, 15.682563781738281, 16.488525390625, 17.29448890686035, 18.10045051574707, 18.90641212463379, 19.71237564086914, 20.51833724975586, 21.324298858642578, 22.130260467529297]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 4.0, 7.0, 5.0, 5.0, 13.0, 8.0, 6.0, 15.0, 17.0, 18.0, 21.0, 15.0, 20.0, 27.0, 31.0, 28.0, 32.0, 34.0, 40.0, 31.0, 43.0, 47.0, 48.0, 50.0, 35.0, 37.0, 43.0, 40.0, 35.0, 27.0, 44.0, 18.0, 23.0, 21.0, 21.0, 25.0, 18.0, 7.0, 14.0, 5.0, 9.0, 4.0, 4.0, 7.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.396484375, -3.292022705078125, -3.18756103515625, -3.083099365234375, -2.9786376953125, -2.874176025390625, -2.76971435546875, -2.665252685546875, -2.560791015625, -2.456329345703125, -2.35186767578125, -2.247406005859375, -2.1429443359375, -2.038482666015625, -1.93402099609375, -1.829559326171875, -1.72509765625, -1.620635986328125, -1.51617431640625, -1.411712646484375, -1.3072509765625, -1.202789306640625, -1.09832763671875, -0.993865966796875, -0.889404296875, -0.784942626953125, -0.68048095703125, -0.576019287109375, -0.4715576171875, -0.367095947265625, -0.26263427734375, -0.158172607421875, -0.0537109375, 0.050750732421875, 0.15521240234375, 0.259674072265625, 0.3641357421875, 0.468597412109375, 0.57305908203125, 0.677520751953125, 0.781982421875, 0.886444091796875, 0.99090576171875, 1.095367431640625, 1.1998291015625, 1.304290771484375, 1.40875244140625, 1.513214111328125, 1.61767578125, 1.722137451171875, 1.82659912109375, 1.931060791015625, 2.0355224609375, 2.139984130859375, 2.24444580078125, 2.348907470703125, 2.453369140625, 2.557830810546875, 2.66229248046875, 2.766754150390625, 2.8712158203125, 2.975677490234375, 3.08013916015625, 3.184600830078125, 3.2890625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 12.0, 14.0, 19.0, 27.0, 42.0, 62.0, 85.0, 116.0, 185.0, 243.0, 362.0, 591.0, 816.0, 1223.0, 1803.0, 2725.0, 4216.0, 6717.0, 10286.0, 16616.0, 26882.0, 45928.0, 81924.0, 168388.0, 337297.0, 152923.0, 76635.0, 43126.0, 25343.0, 15656.0, 9800.0, 6378.0, 3998.0, 2671.0, 1747.0, 1200.0, 812.0, 494.0, 381.0, 234.0, 177.0, 118.0, 92.0, 62.0, 37.0, 29.0, 16.0, 19.0, 12.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0198974609375, -0.019264698028564453, -0.018631935119628906, -0.01799917221069336, -0.017366409301757812, -0.016733646392822266, -0.01610088348388672, -0.015468120574951172, -0.014835357666015625, -0.014202594757080078, -0.013569831848144531, -0.012937068939208984, -0.012304306030273438, -0.01167154312133789, -0.011038780212402344, -0.010406017303466797, -0.00977325439453125, -0.009140491485595703, -0.008507728576660156, -0.00787496566772461, -0.0072422027587890625, -0.006609439849853516, -0.005976676940917969, -0.005343914031982422, -0.004711151123046875, -0.004078388214111328, -0.0034456253051757812, -0.0028128623962402344, -0.0021800994873046875, -0.0015473365783691406, -0.0009145736694335938, -0.0002818107604980469, 0.0003509521484375, 0.0009837150573730469, 0.0016164779663085938, 0.0022492408752441406, 0.0028820037841796875, 0.0035147666931152344, 0.004147529602050781, 0.004780292510986328, 0.005413055419921875, 0.006045818328857422, 0.006678581237792969, 0.007311344146728516, 0.007944107055664062, 0.00857686996459961, 0.009209632873535156, 0.009842395782470703, 0.01047515869140625, 0.011107921600341797, 0.011740684509277344, 0.01237344741821289, 0.013006210327148438, 0.013638973236083984, 0.014271736145019531, 0.014904499053955078, 0.015537261962890625, 0.016170024871826172, 0.01680278778076172, 0.017435550689697266, 0.018068313598632812, 0.01870107650756836, 0.019333839416503906, 0.019966602325439453, 0.020599365234375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 8.0, 4.0, 8.0, 8.0, 6.0, 10.0, 18.0, 22.0, 22.0, 20.0, 31.0, 30.0, 37.0, 46.0, 59.0, 46.0, 58.0, 40.0, 1076.0, 46.0, 74.0, 46.0, 50.0, 39.0, 43.0, 23.0, 27.0, 32.0, 24.0, 26.0, 12.0, 13.0, 8.0, 5.0, 5.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.525390625, -2.4327392578125, -2.340087890625, -2.2474365234375, -2.15478515625, -2.0621337890625, -1.969482421875, -1.8768310546875, -1.7841796875, -1.6915283203125, -1.598876953125, -1.5062255859375, -1.41357421875, -1.3209228515625, -1.228271484375, -1.1356201171875, -1.04296875, -0.9503173828125, -0.857666015625, -0.7650146484375, -0.67236328125, -0.5797119140625, -0.487060546875, -0.3944091796875, -0.3017578125, -0.2091064453125, -0.116455078125, -0.0238037109375, 0.06884765625, 0.1614990234375, 0.254150390625, 0.3468017578125, 0.439453125, 0.5321044921875, 0.624755859375, 0.7174072265625, 0.81005859375, 0.9027099609375, 0.995361328125, 1.0880126953125, 1.1806640625, 1.2733154296875, 1.365966796875, 1.4586181640625, 1.55126953125, 1.6439208984375, 1.736572265625, 1.8292236328125, 1.921875, 2.0145263671875, 2.107177734375, 2.1998291015625, 2.29248046875, 2.3851318359375, 2.477783203125, 2.5704345703125, 2.6630859375, 2.7557373046875, 2.848388671875, 2.9410400390625, 3.03369140625, 3.1263427734375, 3.218994140625, 3.3116455078125, 3.404296875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 11.0, 12.0, 26.0, 31.0, 34.0, 72.0, 131.0, 187.0, 310.0, 559.0, 966.0, 1505.0, 2819.0, 4884.0, 9078.0, 16585.0, 31771.0, 63134.0, 143129.0, 1435359.0, 214457.0, 84159.0, 40976.0, 21011.0, 11405.0, 6330.0, 3413.0, 1958.0, 1134.0, 640.0, 428.0, 254.0, 103.0, 80.0, 63.0, 46.0, 23.0, 12.0, 4.0, 11.0, 8.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.020538330078125, -0.019928693771362305, -0.01931905746459961, -0.018709421157836914, -0.01809978485107422, -0.017490148544311523, -0.016880512237548828, -0.016270875930786133, -0.015661239624023438, -0.015051603317260742, -0.014441967010498047, -0.013832330703735352, -0.013222694396972656, -0.012613058090209961, -0.012003421783447266, -0.01139378547668457, -0.010784149169921875, -0.01017451286315918, -0.009564876556396484, -0.008955240249633789, -0.008345603942871094, -0.0077359676361083984, -0.007126331329345703, -0.006516695022583008, -0.0059070587158203125, -0.005297422409057617, -0.004687786102294922, -0.0040781497955322266, -0.0034685134887695312, -0.002858877182006836, -0.0022492408752441406, -0.0016396045684814453, -0.00102996826171875, -0.0004203319549560547, 0.00018930435180664062, 0.0007989406585693359, 0.0014085769653320312, 0.0020182132720947266, 0.002627849578857422, 0.003237485885620117, 0.0038471221923828125, 0.004456758499145508, 0.005066394805908203, 0.0056760311126708984, 0.006285667419433594, 0.006895303726196289, 0.007504940032958984, 0.00811457633972168, 0.008724212646484375, 0.00933384895324707, 0.009943485260009766, 0.010553121566772461, 0.011162757873535156, 0.011772394180297852, 0.012382030487060547, 0.012991666793823242, 0.013601303100585938, 0.014210939407348633, 0.014820575714111328, 0.015430212020874023, 0.01603984832763672, 0.016649484634399414, 0.01725912094116211, 0.017868757247924805, 0.0184783935546875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.0, 0.0, 0.0, 0.0, 0.0, 0.0, 217.0, 0.0, 0.0, 0.0, 0.0, 404.0, 0.0, 0.0, 0.0, 0.0, 0.0, 229.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.0, 0.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.473833203315735e-07, -3.371387720108032e-07, -3.2689422369003296e-07, -3.166496753692627e-07, -3.0640512704849243e-07, -2.9616057872772217e-07, -2.859160304069519e-07, -2.7567148208618164e-07, -2.654269337654114e-07, -2.551823854446411e-07, -2.4493783712387085e-07, -2.3469328880310059e-07, -2.2444874048233032e-07, -2.1420419216156006e-07, -2.039596438407898e-07, -1.9371509552001953e-07, -1.8347054719924927e-07, -1.73225998878479e-07, -1.6298145055770874e-07, -1.5273690223693848e-07, -1.424923539161682e-07, -1.3224780559539795e-07, -1.2200325727462769e-07, -1.1175870895385742e-07, -1.0151416063308716e-07, -9.12696123123169e-08, -8.102506399154663e-08, -7.078051567077637e-08, -6.05359673500061e-08, -5.029141902923584e-08, -4.0046870708465576e-08, -2.9802322387695312e-08, -1.955777406692505e-08, -9.313225746154785e-09, 9.313225746154785e-10, 1.1175870895385742e-08, 2.1420419216156006e-08, 3.166496753692627e-08, 4.190951585769653e-08, 5.21540641784668e-08, 6.239861249923706e-08, 7.264316082000732e-08, 8.288770914077759e-08, 9.313225746154785e-08, 1.0337680578231812e-07, 1.1362135410308838e-07, 1.2386590242385864e-07, 1.341104507446289e-07, 1.4435499906539917e-07, 1.5459954738616943e-07, 1.648440957069397e-07, 1.7508864402770996e-07, 1.8533319234848022e-07, 1.955777406692505e-07, 2.0582228899002075e-07, 2.1606683731079102e-07, 2.2631138563156128e-07, 2.3655593395233154e-07, 2.468004822731018e-07, 2.5704503059387207e-07, 2.6728957891464233e-07, 2.775341272354126e-07, 2.8777867555618286e-07, 2.980232238769531e-07]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 9.0, 10.0, 1.0, 0.0, 6.0, 28.0, 34.0, 17.0, 8.0, 61.0, 21.0, 114.0, 74.0, 135.0, 289.0, 160.0, 577.0, 16222.0, 1012800.0, 16565.0, 542.0, 188.0, 223.0, 126.0, 93.0, 92.0, 39.0, 21.0, 10.0, 6.0, 14.0, 35.0, 3.0, 1.0, 3.0, 6.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.602836608886719e-06, -5.398876965045929e-06, -5.194917321205139e-06, -4.990957677364349e-06, -4.7869980335235596e-06, -4.58303838968277e-06, -4.37907874584198e-06, -4.17511910200119e-06, -3.9711594581604e-06, -3.7671998143196106e-06, -3.563240170478821e-06, -3.359280526638031e-06, -3.155320882797241e-06, -2.9513612389564514e-06, -2.7474015951156616e-06, -2.543441951274872e-06, -2.339482307434082e-06, -2.1355226635932922e-06, -1.9315630197525024e-06, -1.7276033759117126e-06, -1.5236437320709229e-06, -1.319684088230133e-06, -1.1157244443893433e-06, -9.117648005485535e-07, -7.078051567077637e-07, -5.038455128669739e-07, -2.998858690261841e-07, -9.592622518539429e-08, 1.0803341865539551e-07, 3.119930624961853e-07, 5.159527063369751e-07, 7.199123501777649e-07, 9.238719940185547e-07, 1.1278316378593445e-06, 1.3317912817001343e-06, 1.535750925540924e-06, 1.7397105693817139e-06, 1.9436702132225037e-06, 2.1476298570632935e-06, 2.3515895009040833e-06, 2.555549144744873e-06, 2.759508788585663e-06, 2.9634684324264526e-06, 3.1674280762672424e-06, 3.3713877201080322e-06, 3.575347363948822e-06, 3.779307007789612e-06, 3.983266651630402e-06, 4.187226295471191e-06, 4.391185939311981e-06, 4.595145583152771e-06, 4.799105226993561e-06, 5.003064870834351e-06, 5.20702451467514e-06, 5.41098415851593e-06, 5.61494380235672e-06, 5.81890344619751e-06, 6.0228630900382996e-06, 6.226822733879089e-06, 6.430782377719879e-06, 6.634742021560669e-06, 6.838701665401459e-06, 7.0426613092422485e-06, 7.246620953083038e-06, 7.450580596923828e-06]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 9.0, 7.0, 9.0, 15.0, 18.0, 20.0, 17.0, 21.0, 21.0, 712.0, 19.0, 12.0, 16.0, 18.0, 20.0, 18.0, 11.0, 5.0, 5.0, 0.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3966374012852611e-07, -1.359658341471004e-07, -1.3226792816567468e-07, -1.2857003639510367e-07, -1.2487213041367795e-07, -1.2117422443225223e-07, -1.1747631845082651e-07, -1.1377841246940079e-07, -1.1008050648797507e-07, -1.0638260050654935e-07, -1.0268470163055099e-07, -9.898679564912527e-08, -9.528888966769955e-08, -9.159099079170119e-08, -8.789308481027547e-08, -8.419517882884975e-08, -8.049727995285139e-08, -7.679937397142567e-08, -7.31014750954273e-08, -6.940356911400158e-08, -6.570566313257586e-08, -6.200775715115014e-08, -5.830985827515178e-08, -5.461195229372606e-08, -5.091404986501402e-08, -4.721614743630198e-08, -4.351824145487626e-08, -3.982033902616422e-08, -3.612243659745218e-08, -3.242453061602646e-08, -2.8726628187314418e-08, -2.5028723982245538e-08, -2.1330819777176657e-08, -1.7632915572107777e-08, -1.3935012255217316e-08, -1.0237108938326855e-08, -6.539204733257975e-09, -2.8413005281890946e-09, 8.566019005229464e-10, 4.554506105591827e-09, 8.252410310660707e-09, 1.1950314515729588e-08, 1.5648218720798468e-08, 1.934612114951051e-08, 2.304402535457939e-08, 2.674192955964827e-08, 3.043983198836031e-08, 3.413773441707235e-08, 3.783564039849807e-08, 4.153354282721011e-08, 4.523144880863583e-08, 4.8929351237347873e-08, 5.262725721877359e-08, 5.6325159647485634e-08, 6.002306207619768e-08, 6.37209680576234e-08, 6.741886693362176e-08, 7.111677291504748e-08, 7.481467179104584e-08, 7.851257777247156e-08, 8.221048375389728e-08, 8.590838262989564e-08, 8.960628861132136e-08, 9.330419459274708e-08, 9.70021005741728e-08]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 160.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 701.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 140.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 19.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 4.0, 7.0, 5.0, 5.0, 13.0, 8.0, 6.0, 15.0, 17.0, 18.0, 21.0, 15.0, 20.0, 27.0, 31.0, 28.0, 32.0, 34.0, 40.0, 31.0, 43.0, 47.0, 48.0, 50.0, 35.0, 37.0, 43.0, 40.0, 35.0, 27.0, 44.0, 18.0, 23.0, 21.0, 21.0, 25.0, 18.0, 7.0, 14.0, 5.0, 9.0, 4.0, 4.0, 7.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.396484375, -3.292022705078125, -3.18756103515625, -3.083099365234375, -2.9786376953125, -2.874176025390625, -2.76971435546875, -2.665252685546875, -2.560791015625, -2.456329345703125, -2.35186767578125, -2.247406005859375, -2.1429443359375, -2.038482666015625, -1.93402099609375, -1.829559326171875, -1.72509765625, -1.620635986328125, -1.51617431640625, -1.411712646484375, -1.3072509765625, -1.202789306640625, -1.09832763671875, -0.993865966796875, -0.889404296875, -0.784942626953125, -0.68048095703125, -0.576019287109375, -0.4715576171875, -0.367095947265625, -0.26263427734375, -0.158172607421875, -0.0537109375, 0.050750732421875, 0.15521240234375, 0.259674072265625, 0.3641357421875, 0.468597412109375, 0.57305908203125, 0.677520751953125, 0.781982421875, 0.886444091796875, 0.99090576171875, 1.095367431640625, 1.1998291015625, 1.304290771484375, 1.40875244140625, 1.513214111328125, 1.61767578125, 1.722137451171875, 1.82659912109375, 1.931060791015625, 2.0355224609375, 2.139984130859375, 2.24444580078125, 2.348907470703125, 2.453369140625, 2.557830810546875, 2.66229248046875, 2.766754150390625, 2.8712158203125, 2.975677490234375, 3.08013916015625, 3.184600830078125, 3.2890625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 8.0, 11.0, 12.0, 20.0, 31.0, 29.0, 58.0, 73.0, 103.0, 148.0, 212.0, 312.0, 432.0, 678.0, 1140.0, 1780.0, 3288.0, 7013.0, 17314.0, 52078.0, 207796.0, 538560.0, 149254.0, 40761.0, 14192.0, 5894.0, 2844.0, 1595.0, 944.0, 588.0, 423.0, 265.0, 226.0, 137.0, 85.0, 77.0, 43.0, 31.0, 35.0, 14.0, 12.0, 7.0, 10.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.96875, -5.77862548828125, -5.5885009765625, -5.39837646484375, -5.208251953125, -5.01812744140625, -4.8280029296875, -4.63787841796875, -4.44775390625, -4.25762939453125, -4.0675048828125, -3.87738037109375, -3.687255859375, -3.49713134765625, -3.3070068359375, -3.11688232421875, -2.9267578125, -2.73663330078125, -2.5465087890625, -2.35638427734375, -2.166259765625, -1.97613525390625, -1.7860107421875, -1.59588623046875, -1.40576171875, -1.21563720703125, -1.0255126953125, -0.83538818359375, -0.645263671875, -0.45513916015625, -0.2650146484375, -0.07489013671875, 0.115234375, 0.30535888671875, 0.4954833984375, 0.68560791015625, 0.875732421875, 1.06585693359375, 1.2559814453125, 1.44610595703125, 1.63623046875, 1.82635498046875, 2.0164794921875, 2.20660400390625, 2.396728515625, 2.58685302734375, 2.7769775390625, 2.96710205078125, 3.1572265625, 3.34735107421875, 3.5374755859375, 3.72760009765625, 3.917724609375, 4.10784912109375, 4.2979736328125, 4.48809814453125, 4.67822265625, 4.86834716796875, 5.0584716796875, 5.24859619140625, 5.438720703125, 5.62884521484375, 5.8189697265625, 6.00909423828125, 6.19921875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 11.0, 5.0, 3.0, 10.0, 15.0, 11.0, 11.0, 16.0, 23.0, 33.0, 46.0, 32.0, 41.0, 52.0, 58.0, 100.0, 246.0, 1563.0, 269.0, 141.0, 58.0, 50.0, 45.0, 23.0, 32.0, 31.0, 34.0, 19.0, 17.0, 14.0, 14.0, 10.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3984375, -11.0867919921875, -10.775146484375, -10.4635009765625, -10.15185546875, -9.8402099609375, -9.528564453125, -9.2169189453125, -8.9052734375, -8.5936279296875, -8.281982421875, -7.9703369140625, -7.65869140625, -7.3470458984375, -7.035400390625, -6.7237548828125, -6.412109375, -6.1004638671875, -5.788818359375, -5.4771728515625, -5.16552734375, -4.8538818359375, -4.542236328125, -4.2305908203125, -3.9189453125, -3.6072998046875, -3.295654296875, -2.9840087890625, -2.67236328125, -2.3607177734375, -2.049072265625, -1.7374267578125, -1.42578125, -1.1141357421875, -0.802490234375, -0.4908447265625, -0.17919921875, 0.1324462890625, 0.444091796875, 0.7557373046875, 1.0673828125, 1.3790283203125, 1.690673828125, 2.0023193359375, 2.31396484375, 2.6256103515625, 2.937255859375, 3.2489013671875, 3.560546875, 3.8721923828125, 4.183837890625, 4.4954833984375, 4.80712890625, 5.1187744140625, 5.430419921875, 5.7420654296875, 6.0537109375, 6.3653564453125, 6.677001953125, 6.9886474609375, 7.30029296875, 7.6119384765625, 7.923583984375, 8.2352294921875, 8.546875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 4.0, 10.0, 5.0, 4.0, 16.0, 12.0, 13.0, 25.0, 38.0, 40.0, 59.0, 78.0, 120.0, 165.0, 304.0, 508.0, 971.0, 5699.0, 2750349.0, 381818.0, 3302.0, 864.0, 441.0, 231.0, 179.0, 103.0, 86.0, 49.0, 57.0, 30.0, 23.0, 18.0, 19.0, 10.0, 9.0, 9.0, 7.0, 5.0, 4.0, 3.0, 1.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.71875, -19.059326171875, -18.39990234375, -17.740478515625, -17.0810546875, -16.421630859375, -15.76220703125, -15.102783203125, -14.443359375, -13.783935546875, -13.12451171875, -12.465087890625, -11.8056640625, -11.146240234375, -10.48681640625, -9.827392578125, -9.16796875, -8.508544921875, -7.84912109375, -7.189697265625, -6.5302734375, -5.870849609375, -5.21142578125, -4.552001953125, -3.892578125, -3.233154296875, -2.57373046875, -1.914306640625, -1.2548828125, -0.595458984375, 0.06396484375, 0.723388671875, 1.3828125, 2.042236328125, 2.70166015625, 3.361083984375, 4.0205078125, 4.679931640625, 5.33935546875, 5.998779296875, 6.658203125, 7.317626953125, 7.97705078125, 8.636474609375, 9.2958984375, 9.955322265625, 10.61474609375, 11.274169921875, 11.93359375, 12.593017578125, 13.25244140625, 13.911865234375, 14.5712890625, 15.230712890625, 15.89013671875, 16.549560546875, 17.208984375, 17.868408203125, 18.52783203125, 19.187255859375, 19.8466796875, 20.506103515625, 21.16552734375, 21.824951171875, 22.484375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 9.0, 145.0, 646.0, 201.0, 16.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.77757263183594, -66.21517944335938, -62.652793884277344, -59.09040069580078, -55.528011322021484, -51.96562194824219, -48.403228759765625, -44.84083938598633, -41.27845001220703, -37.716060638427734, -34.15367126464844, -30.591278076171875, -27.028888702392578, -23.46649932861328, -19.90410804748535, -16.341716766357422, -12.779327392578125, -9.216937065124512, -5.654546737670898, -2.092156410217285, 1.4702339172363281, 5.032623291015625, 8.595014572143555, 12.157405853271484, 15.719795227050781, 19.282184600830078, 22.844575881958008, 26.406967163085938, 29.969356536865234, 33.53174591064453, 37.094139099121094, 40.65652847290039, 44.21891784667969, 47.781307220458984, 51.34369659423828, 54.906089782714844, 58.46847915649414, 62.03086853027344, 65.59326171875, 69.15565490722656, 72.7180404663086, 76.28043365478516, 79.84281921386719, 83.40521240234375, 86.96760559082031, 90.52999114990234, 94.0923843383789, 97.65476989746094, 101.2171630859375, 104.77955627441406, 108.3419418334961, 111.90433502197266, 115.46672058105469, 119.02911376953125, 122.59150695800781, 126.15390014648438, 129.71627807617188, 133.27867126464844, 136.841064453125, 140.4034423828125, 143.96583557128906, 147.52822875976562, 151.0906219482422, 154.65301513671875, 158.2154083251953]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 5.0, 6.0, 10.0, 7.0, 9.0, 17.0, 18.0, 22.0, 23.0, 28.0, 26.0, 25.0, 36.0, 28.0, 26.0, 43.0, 30.0, 39.0, 37.0, 44.0, 39.0, 45.0, 53.0, 36.0, 29.0, 31.0, 41.0, 25.0, 28.0, 31.0, 25.0, 24.0, 20.0, 18.0, 19.0, 8.0, 12.0, 11.0, 7.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.22344970703125, -20.473140716552734, -19.72283172607422, -18.972524642944336, -18.22221565246582, -17.471906661987305, -16.721599578857422, -15.971290588378906, -15.22098159790039, -14.470672607421875, -13.720364570617676, -12.970056533813477, -12.219747543334961, -11.469438552856445, -10.719130516052246, -9.968822479248047, -9.218513488769531, -8.468204498291016, -7.717896461486816, -6.967587947845459, -6.217279434204102, -5.466970920562744, -4.716662406921387, -3.9663538932800293, -3.216045379638672, -2.4657368659973145, -1.715428352355957, -0.9651198387145996, -0.2148113250732422, 0.5354971885681152, 1.2858057022094727, 2.03611421585083, 2.7864227294921875, 3.536731243133545, 4.287039756774902, 5.03734827041626, 5.787656784057617, 6.537965297698975, 7.288273811340332, 8.038581848144531, 8.788890838623047, 9.539199829101562, 10.289507865905762, 11.039815902709961, 11.790124893188477, 12.540433883666992, 13.290741920471191, 14.04104995727539, 14.791358947753906, 15.541667938232422, 16.291976928710938, 17.04228401184082, 17.792593002319336, 18.54290199279785, 19.293209075927734, 20.04351806640625, 20.793827056884766, 21.54413604736328, 22.294445037841797, 23.04475212097168, 23.795061111450195, 24.54537010192871, 25.295677185058594, 26.04598617553711, 26.796295166015625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 5.0, 5.0, 11.0, 14.0, 12.0, 8.0, 17.0, 16.0, 18.0, 27.0, 21.0, 30.0, 28.0, 25.0, 33.0, 38.0, 48.0, 42.0, 39.0, 37.0, 46.0, 47.0, 51.0, 38.0, 39.0, 31.0, 35.0, 30.0, 35.0, 24.0, 19.0, 24.0, 21.0, 16.0, 9.0, 22.0, 10.0, 7.0, 9.0, 2.0, 3.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.556640625, -3.446624755859375, -3.33660888671875, -3.226593017578125, -3.1165771484375, -3.006561279296875, -2.89654541015625, -2.786529541015625, -2.676513671875, -2.566497802734375, -2.45648193359375, -2.346466064453125, -2.2364501953125, -2.126434326171875, -2.01641845703125, -1.906402587890625, -1.79638671875, -1.686370849609375, -1.57635498046875, -1.466339111328125, -1.3563232421875, -1.246307373046875, -1.13629150390625, -1.026275634765625, -0.916259765625, -0.806243896484375, -0.69622802734375, -0.586212158203125, -0.4761962890625, -0.366180419921875, -0.25616455078125, -0.146148681640625, -0.0361328125, 0.073883056640625, 0.18389892578125, 0.293914794921875, 0.4039306640625, 0.513946533203125, 0.62396240234375, 0.733978271484375, 0.843994140625, 0.954010009765625, 1.06402587890625, 1.174041748046875, 1.2840576171875, 1.394073486328125, 1.50408935546875, 1.614105224609375, 1.72412109375, 1.834136962890625, 1.94415283203125, 2.054168701171875, 2.1641845703125, 2.274200439453125, 2.38421630859375, 2.494232177734375, 2.604248046875, 2.714263916015625, 2.82427978515625, 2.934295654296875, 3.0443115234375, 3.154327392578125, 3.26434326171875, 3.374359130859375, 3.484375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 12.0, 19.0, 8.0, 30.0, 43.0, 50.0, 63.0, 102.0, 155.0, 204.0, 279.0, 434.0, 602.0, 1015.0, 1408.0, 2341.0, 3624.0, 6061.0, 10235.0, 20663.0, 62738.0, 324182.0, 1309965.0, 1762358.0, 527646.0, 101484.0, 26915.0, 12470.0, 6968.0, 4256.0, 2694.0, 1699.0, 1138.0, 776.0, 537.0, 334.0, 236.0, 154.0, 113.0, 81.0, 69.0, 39.0, 20.0, 17.0, 11.0, 8.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-5.01953125, -4.87255859375, -4.7255859375, -4.57861328125, -4.431640625, -4.28466796875, -4.1376953125, -3.99072265625, -3.84375, -3.69677734375, -3.5498046875, -3.40283203125, -3.255859375, -3.10888671875, -2.9619140625, -2.81494140625, -2.66796875, -2.52099609375, -2.3740234375, -2.22705078125, -2.080078125, -1.93310546875, -1.7861328125, -1.63916015625, -1.4921875, -1.34521484375, -1.1982421875, -1.05126953125, -0.904296875, -0.75732421875, -0.6103515625, -0.46337890625, -0.31640625, -0.16943359375, -0.0224609375, 0.12451171875, 0.271484375, 0.41845703125, 0.5654296875, 0.71240234375, 0.859375, 1.00634765625, 1.1533203125, 1.30029296875, 1.447265625, 1.59423828125, 1.7412109375, 1.88818359375, 2.03515625, 2.18212890625, 2.3291015625, 2.47607421875, 2.623046875, 2.77001953125, 2.9169921875, 3.06396484375, 3.2109375, 3.35791015625, 3.5048828125, 3.65185546875, 3.798828125, 3.94580078125, 4.0927734375, 4.23974609375, 4.38671875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 2.0, 6.0, 7.0, 10.0, 21.0, 13.0, 26.0, 44.0, 54.0, 84.0, 90.0, 140.0, 170.0, 200.0, 290.0, 386.0, 436.0, 467.0, 382.0, 303.0, 210.0, 167.0, 133.0, 112.0, 69.0, 59.0, 51.0, 47.0, 27.0, 18.0, 12.0, 4.0, 7.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.32421875, -4.1754150390625, -4.026611328125, -3.8778076171875, -3.72900390625, -3.5802001953125, -3.431396484375, -3.2825927734375, -3.1337890625, -2.9849853515625, -2.836181640625, -2.6873779296875, -2.53857421875, -2.3897705078125, -2.240966796875, -2.0921630859375, -1.943359375, -1.7945556640625, -1.645751953125, -1.4969482421875, -1.34814453125, -1.1993408203125, -1.050537109375, -0.9017333984375, -0.7529296875, -0.6041259765625, -0.455322265625, -0.3065185546875, -0.15771484375, -0.0089111328125, 0.139892578125, 0.2886962890625, 0.4375, 0.5863037109375, 0.735107421875, 0.8839111328125, 1.03271484375, 1.1815185546875, 1.330322265625, 1.4791259765625, 1.6279296875, 1.7767333984375, 1.925537109375, 2.0743408203125, 2.22314453125, 2.3719482421875, 2.520751953125, 2.6695556640625, 2.818359375, 2.9671630859375, 3.115966796875, 3.2647705078125, 3.41357421875, 3.5623779296875, 3.711181640625, 3.8599853515625, 4.0087890625, 4.1575927734375, 4.306396484375, 4.4552001953125, 4.60400390625, 4.7528076171875, 4.901611328125, 5.0504150390625, 5.19921875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 3.0, 11.0, 8.0, 20.0, 19.0, 25.0, 51.0, 69.0, 94.0, 135.0, 227.0, 338.0, 576.0, 1358.0, 3852.0, 17046.0, 196039.0, 3015026.0, 896771.0, 51004.0, 7327.0, 2136.0, 866.0, 462.0, 271.0, 175.0, 109.0, 60.0, 44.0, 51.0, 25.0, 17.0, 17.0, 6.0, 11.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.5, -9.22662353515625, -8.9532470703125, -8.67987060546875, -8.406494140625, -8.13311767578125, -7.8597412109375, -7.58636474609375, -7.31298828125, -7.03961181640625, -6.7662353515625, -6.49285888671875, -6.219482421875, -5.94610595703125, -5.6727294921875, -5.39935302734375, -5.1259765625, -4.85260009765625, -4.5792236328125, -4.30584716796875, -4.032470703125, -3.75909423828125, -3.4857177734375, -3.21234130859375, -2.93896484375, -2.66558837890625, -2.3922119140625, -2.11883544921875, -1.845458984375, -1.57208251953125, -1.2987060546875, -1.02532958984375, -0.751953125, -0.47857666015625, -0.2052001953125, 0.06817626953125, 0.341552734375, 0.61492919921875, 0.8883056640625, 1.16168212890625, 1.43505859375, 1.70843505859375, 1.9818115234375, 2.25518798828125, 2.528564453125, 2.80194091796875, 3.0753173828125, 3.34869384765625, 3.6220703125, 3.89544677734375, 4.1688232421875, 4.44219970703125, 4.715576171875, 4.98895263671875, 5.2623291015625, 5.53570556640625, 5.80908203125, 6.08245849609375, 6.3558349609375, 6.62921142578125, 6.902587890625, 7.17596435546875, 7.4493408203125, 7.72271728515625, 7.99609375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 14.0, 39.0, 89.0, 209.0, 240.0, 221.0, 114.0, 47.0, 27.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-68.41825103759766, -66.94837188720703, -65.47850036621094, -64.00862121582031, -62.53874588012695, -61.068870544433594, -59.59899139404297, -58.12911605834961, -56.65924072265625, -55.18936538696289, -53.71949005126953, -52.249610900878906, -50.77973556518555, -49.30986022949219, -47.83998107910156, -46.3701057434082, -44.900230407714844, -43.430355072021484, -41.960479736328125, -40.4906005859375, -39.02072525024414, -37.55084991455078, -36.080970764160156, -34.6110954284668, -33.14122009277344, -31.671344757080078, -30.201467514038086, -28.731590270996094, -27.261714935302734, -25.791839599609375, -24.321962356567383, -22.85208511352539, -21.382213592529297, -19.912338256835938, -18.442461013793945, -16.972583770751953, -15.502708435058594, -14.032832145690918, -12.562955856323242, -11.093079566955566, -9.62320327758789, -8.153326988220215, -6.683450698852539, -5.213574409484863, -3.7436981201171875, -2.2738218307495117, -0.8039455413818359, 0.6659307479858398, 2.1358070373535156, 3.6056833267211914, 5.075559616088867, 6.545435905456543, 8.015312194824219, 9.485188484191895, 10.95506477355957, 12.424941062927246, 13.894817352294922, 15.364693641662598, 16.834569931030273, 18.304447174072266, 19.774322509765625, 21.244197845458984, 22.714075088500977, 24.18395233154297, 25.653827667236328]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 8.0, 4.0, 6.0, 18.0, 14.0, 19.0, 36.0, 25.0, 27.0, 28.0, 30.0, 48.0, 34.0, 39.0, 30.0, 50.0, 45.0, 42.0, 42.0, 39.0, 42.0, 35.0, 39.0, 39.0, 32.0, 30.0, 27.0, 27.0, 23.0, 21.0, 17.0, 17.0, 18.0, 4.0, 7.0, 8.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.364112854003906, -18.760364532470703, -18.156618118286133, -17.55286979675293, -16.94912338256836, -16.345375061035156, -15.74162769317627, -15.137880325317383, -14.53413200378418, -13.930384635925293, -13.326637268066406, -12.722888946533203, -12.119141578674316, -11.51539421081543, -10.911646842956543, -10.307899475097656, -9.70415210723877, -9.100404739379883, -8.496657371520996, -7.892909526824951, -7.289161682128906, -6.6854143142700195, -6.081666946411133, -5.477919101715088, -4.874171733856201, -4.2704243659973145, -3.6666765213012695, -3.062929153442383, -2.459181547164917, -1.8554339408874512, -1.2516865730285645, -0.6479387283325195, -0.04419136047363281, 0.5595561861991882, 1.1633037328720093, 1.7670512199401855, 2.3707988262176514, 2.974546432495117, 3.578293800354004, 4.182041645050049, 4.7857890129089355, 5.389536380767822, 5.993284225463867, 6.597031593322754, 7.200778961181641, 7.8045268058776855, 8.408273696899414, 9.012022018432617, 9.615769386291504, 10.21951675415039, 10.823264122009277, 11.427011489868164, 12.030759811401367, 12.634507179260254, 13.23825454711914, 13.842002868652344, 14.445749282836914, 15.0494966506958, 15.653244018554688, 16.25699234008789, 16.86073875427246, 17.464487075805664, 18.068233489990234, 18.671981811523438, 19.27573013305664]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 4.0, 2.0, 12.0, 9.0, 17.0, 19.0, 11.0, 22.0, 23.0, 16.0, 28.0, 28.0, 32.0, 28.0, 37.0, 42.0, 29.0, 40.0, 36.0, 52.0, 36.0, 32.0, 45.0, 38.0, 34.0, 29.0, 39.0, 35.0, 20.0, 22.0, 27.0, 19.0, 24.0, 17.0, 19.0, 11.0, 17.0, 8.0, 8.0, 5.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 4.0, 4.0, 1.0], "bins": [-3.029296875, -2.941070556640625, -2.85284423828125, -2.764617919921875, -2.6763916015625, -2.588165283203125, -2.49993896484375, -2.411712646484375, -2.323486328125, -2.235260009765625, -2.14703369140625, -2.058807373046875, -1.9705810546875, -1.882354736328125, -1.79412841796875, -1.705902099609375, -1.61767578125, -1.529449462890625, -1.44122314453125, -1.352996826171875, -1.2647705078125, -1.176544189453125, -1.08831787109375, -1.000091552734375, -0.911865234375, -0.823638916015625, -0.73541259765625, -0.647186279296875, -0.5589599609375, -0.470733642578125, -0.38250732421875, -0.294281005859375, -0.2060546875, -0.117828369140625, -0.02960205078125, 0.058624267578125, 0.1468505859375, 0.235076904296875, 0.32330322265625, 0.411529541015625, 0.499755859375, 0.587982177734375, 0.67620849609375, 0.764434814453125, 0.8526611328125, 0.940887451171875, 1.02911376953125, 1.117340087890625, 1.20556640625, 1.293792724609375, 1.38201904296875, 1.470245361328125, 1.5584716796875, 1.646697998046875, 1.73492431640625, 1.823150634765625, 1.911376953125, 1.999603271484375, 2.08782958984375, 2.176055908203125, 2.2642822265625, 2.352508544921875, 2.44073486328125, 2.528961181640625, 2.6171875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 6.0, 9.0, 11.0, 13.0, 19.0, 33.0, 33.0, 52.0, 80.0, 119.0, 162.0, 226.0, 308.0, 429.0, 642.0, 892.0, 1370.0, 2018.0, 2982.0, 4198.0, 6332.0, 9563.0, 14720.0, 22831.0, 36483.0, 61853.0, 112841.0, 268656.0, 241313.0, 104588.0, 57631.0, 34511.0, 21469.0, 14150.0, 9182.0, 5935.0, 4000.0, 2704.0, 2002.0, 1246.0, 885.0, 580.0, 477.0, 266.0, 213.0, 159.0, 113.0, 82.0, 57.0, 40.0, 31.0, 23.0, 11.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0175933837890625, -0.017024755477905273, -0.016456127166748047, -0.01588749885559082, -0.015318870544433594, -0.014750242233276367, -0.01418161392211914, -0.013612985610961914, -0.013044357299804688, -0.012475728988647461, -0.011907100677490234, -0.011338472366333008, -0.010769844055175781, -0.010201215744018555, -0.009632587432861328, -0.009063959121704102, -0.008495330810546875, -0.007926702499389648, -0.007358074188232422, -0.006789445877075195, -0.006220817565917969, -0.005652189254760742, -0.005083560943603516, -0.004514932632446289, -0.0039463043212890625, -0.003377676010131836, -0.0028090476989746094, -0.002240419387817383, -0.0016717910766601562, -0.0011031627655029297, -0.0005345344543457031, 3.409385681152344e-05, 0.00060272216796875, 0.0011713504791259766, 0.0017399787902832031, 0.0023086071014404297, 0.0028772354125976562, 0.003445863723754883, 0.004014492034912109, 0.004583120346069336, 0.0051517486572265625, 0.005720376968383789, 0.006289005279541016, 0.006857633590698242, 0.007426261901855469, 0.007994890213012695, 0.008563518524169922, 0.009132146835327148, 0.009700775146484375, 0.010269403457641602, 0.010838031768798828, 0.011406660079956055, 0.011975288391113281, 0.012543916702270508, 0.013112545013427734, 0.013681173324584961, 0.014249801635742188, 0.014818429946899414, 0.01538705825805664, 0.015955686569213867, 0.016524314880371094, 0.01709294319152832, 0.017661571502685547, 0.018230199813842773, 0.018798828125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 5.0, 13.0, 8.0, 14.0, 15.0, 16.0, 15.0, 39.0, 35.0, 24.0, 29.0, 33.0, 25.0, 37.0, 40.0, 47.0, 36.0, 40.0, 1063.0, 46.0, 32.0, 39.0, 38.0, 39.0, 30.0, 29.0, 33.0, 29.0, 25.0, 20.0, 23.0, 22.0, 17.0, 7.0, 15.0, 9.0, 10.0, 6.0, 4.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.12890625, -2.06378173828125, -1.9986572265625, -1.93353271484375, -1.868408203125, -1.80328369140625, -1.7381591796875, -1.67303466796875, -1.60791015625, -1.54278564453125, -1.4776611328125, -1.41253662109375, -1.347412109375, -1.28228759765625, -1.2171630859375, -1.15203857421875, -1.0869140625, -1.02178955078125, -0.9566650390625, -0.89154052734375, -0.826416015625, -0.76129150390625, -0.6961669921875, -0.63104248046875, -0.56591796875, -0.50079345703125, -0.4356689453125, -0.37054443359375, -0.305419921875, -0.24029541015625, -0.1751708984375, -0.11004638671875, -0.044921875, 0.02020263671875, 0.0853271484375, 0.15045166015625, 0.215576171875, 0.28070068359375, 0.3458251953125, 0.41094970703125, 0.47607421875, 0.54119873046875, 0.6063232421875, 0.67144775390625, 0.736572265625, 0.80169677734375, 0.8668212890625, 0.93194580078125, 0.9970703125, 1.06219482421875, 1.1273193359375, 1.19244384765625, 1.257568359375, 1.32269287109375, 1.3878173828125, 1.45294189453125, 1.51806640625, 1.58319091796875, 1.6483154296875, 1.71343994140625, 1.778564453125, 1.84368896484375, 1.9088134765625, 1.97393798828125, 2.0390625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 3.0, 9.0, 11.0, 18.0, 32.0, 36.0, 53.0, 71.0, 132.0, 161.0, 261.0, 370.0, 599.0, 872.0, 1283.0, 2029.0, 3183.0, 4787.0, 7816.0, 11923.0, 19465.0, 31159.0, 50667.0, 84919.0, 171766.0, 1351274.0, 150326.0, 78786.0, 46948.0, 28839.0, 17881.0, 11363.0, 7018.0, 4582.0, 2882.0, 1858.0, 1284.0, 785.0, 534.0, 384.0, 234.0, 156.0, 101.0, 92.0, 63.0, 39.0, 30.0, 22.0, 11.0, 5.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.012054443359375, -0.011670827865600586, -0.011287212371826172, -0.010903596878051758, -0.010519981384277344, -0.01013636589050293, -0.009752750396728516, -0.009369134902954102, -0.008985519409179688, -0.008601903915405273, -0.00821828842163086, -0.007834672927856445, -0.007451057434082031, -0.007067441940307617, -0.006683826446533203, -0.006300210952758789, -0.005916595458984375, -0.005532979965209961, -0.005149364471435547, -0.004765748977661133, -0.004382133483886719, -0.003998517990112305, -0.0036149024963378906, -0.0032312870025634766, -0.0028476715087890625, -0.0024640560150146484, -0.0020804405212402344, -0.0016968250274658203, -0.0013132095336914062, -0.0009295940399169922, -0.0005459785461425781, -0.00016236305236816406, 0.00022125244140625, 0.0006048679351806641, 0.0009884834289550781, 0.0013720989227294922, 0.0017557144165039062, 0.0021393299102783203, 0.0025229454040527344, 0.0029065608978271484, 0.0032901763916015625, 0.0036737918853759766, 0.004057407379150391, 0.004441022872924805, 0.004824638366699219, 0.005208253860473633, 0.005591869354248047, 0.005975484848022461, 0.006359100341796875, 0.006742715835571289, 0.007126331329345703, 0.007509946823120117, 0.007893562316894531, 0.008277177810668945, 0.00866079330444336, 0.009044408798217773, 0.009428024291992188, 0.009811639785766602, 0.010195255279541016, 0.01057887077331543, 0.010962486267089844, 0.011346101760864258, 0.011729717254638672, 0.012113332748413086, 0.0124969482421875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.0, 0.0, 0.0, 0.0, 0.0, 0.0, 166.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 528.0, 0.0, 0.0, 0.0, 0.0, 0.0, 178.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.980232238769531e-07, -2.8870999813079834e-07, -2.7939677238464355e-07, -2.7008354663848877e-07, -2.60770320892334e-07, -2.514570951461792e-07, -2.421438694000244e-07, -2.3283064365386963e-07, -2.2351741790771484e-07, -2.1420419216156006e-07, -2.0489096641540527e-07, -1.955777406692505e-07, -1.862645149230957e-07, -1.7695128917694092e-07, -1.6763806343078613e-07, -1.5832483768463135e-07, -1.4901161193847656e-07, -1.3969838619232178e-07, -1.30385160446167e-07, -1.210719347000122e-07, -1.1175870895385742e-07, -1.0244548320770264e-07, -9.313225746154785e-08, -8.381903171539307e-08, -7.450580596923828e-08, -6.51925802230835e-08, -5.587935447692871e-08, -4.6566128730773926e-08, -3.725290298461914e-08, -2.7939677238464355e-08, -1.862645149230957e-08, -9.313225746154785e-09, 0.0, 9.313225746154785e-09, 1.862645149230957e-08, 2.7939677238464355e-08, 3.725290298461914e-08, 4.6566128730773926e-08, 5.587935447692871e-08, 6.51925802230835e-08, 7.450580596923828e-08, 8.381903171539307e-08, 9.313225746154785e-08, 1.0244548320770264e-07, 1.1175870895385742e-07, 1.210719347000122e-07, 1.30385160446167e-07, 1.3969838619232178e-07, 1.4901161193847656e-07, 1.5832483768463135e-07, 1.6763806343078613e-07, 1.7695128917694092e-07, 1.862645149230957e-07, 1.955777406692505e-07, 2.0489096641540527e-07, 2.1420419216156006e-07, 2.2351741790771484e-07, 2.3283064365386963e-07, 2.421438694000244e-07, 2.514570951461792e-07, 2.60770320892334e-07, 2.7008354663848877e-07, 2.7939677238464355e-07, 2.8870999813079834e-07, 2.980232238769531e-07]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 4.0, 4.0, 9.0, 6.0, 6.0, 22.0, 29.0, 40.0, 19.0, 7.0, 40.0, 92.0, 201.0, 182.0, 47.0, 411.0, 640.0, 123459.0, 920055.0, 2043.0, 446.0, 107.0, 90.0, 240.0, 114.0, 58.0, 7.0, 13.0, 36.0, 20.0, 18.0, 15.0, 7.0, 8.0, 8.0, 4.0, 7.0, 9.0, 5.0, 6.0, 1.0, 0.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7220458984375e-06, -5.544163286685944e-06, -5.366280674934387e-06, -5.188398063182831e-06, -5.010515451431274e-06, -4.832632839679718e-06, -4.654750227928162e-06, -4.476867616176605e-06, -4.298985004425049e-06, -4.1211023926734924e-06, -3.943219780921936e-06, -3.7653371691703796e-06, -3.5874545574188232e-06, -3.409571945667267e-06, -3.2316893339157104e-06, -3.053806722164154e-06, -2.8759241104125977e-06, -2.6980414986610413e-06, -2.520158886909485e-06, -2.3422762751579285e-06, -2.164393663406372e-06, -1.9865110516548157e-06, -1.8086284399032593e-06, -1.6307458281517029e-06, -1.4528632164001465e-06, -1.27498060464859e-06, -1.0970979928970337e-06, -9.192153811454773e-07, -7.413327693939209e-07, -5.634501576423645e-07, -3.855675458908081e-07, -2.076849341392517e-07, -2.9802322387695312e-08, 1.4808028936386108e-07, 3.259629011154175e-07, 5.038455128669739e-07, 6.817281246185303e-07, 8.596107363700867e-07, 1.037493348121643e-06, 1.2153759598731995e-06, 1.3932585716247559e-06, 1.5711411833763123e-06, 1.7490237951278687e-06, 1.926906406879425e-06, 2.1047890186309814e-06, 2.282671630382538e-06, 2.4605542421340942e-06, 2.6384368538856506e-06, 2.816319465637207e-06, 2.9942020773887634e-06, 3.17208468914032e-06, 3.3499673008918762e-06, 3.5278499126434326e-06, 3.705732524394989e-06, 3.883615136146545e-06, 4.061497747898102e-06, 4.239380359649658e-06, 4.417262971401215e-06, 4.595145583152771e-06, 4.773028194904327e-06, 4.950910806655884e-06, 5.12879341840744e-06, 5.306676030158997e-06, 5.484558641910553e-06, 5.662441253662109e-06]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 3.0, 5.0, 4.0, 7.0, 7.0, 9.0, 6.0, 7.0, 4.0, 4.0, 9.0, 5.0, 864.0, 7.0, 7.0, 9.0, 10.0, 2.0, 4.0, 3.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.1453262516170071e-07, -1.1141437994410808e-07, -1.0829613472651545e-07, -1.0517788950892282e-07, -1.0205964429133019e-07, -9.894139907373756e-08, -9.582315385614493e-08, -9.27049086385523e-08, -8.958666342095967e-08, -8.646841820336704e-08, -8.335017298577441e-08, -8.023192776818178e-08, -7.711368255058915e-08, -7.399543733299652e-08, -7.087719211540389e-08, -6.775894689781126e-08, -6.464070878564598e-08, -6.152246356805335e-08, -5.8404218350460724e-08, -5.5285973132868094e-08, -5.2167727915275464e-08, -4.9049482697682834e-08, -4.593124103280388e-08, -4.281299581521125e-08, -3.969475059761862e-08, -3.657650538002599e-08, -3.345826016243336e-08, -3.034001849755441e-08, -2.722177150360494e-08, -2.410352628601231e-08, -2.098528284477652e-08, -1.786703762718389e-08, -1.4748785304163903e-08, -1.1630540086571273e-08, -8.512295757157062e-09, -5.394051427742852e-09, -2.275806210150222e-09, 8.424390074424082e-10, 3.960682448678199e-09, 7.078927666270829e-09, 1.0197172883863459e-08, 1.3315418101456089e-08, 1.643366331904872e-08, 1.955190676028451e-08, 2.267015197787714e-08, 2.578839719546977e-08, 2.890664063670556e-08, 3.202488585429819e-08, 3.514313107189082e-08, 3.826137628948345e-08, 4.137962150707608e-08, 4.449786672466871e-08, 4.761611194226134e-08, 5.073435715985397e-08, 5.385259882473292e-08, 5.697084404232555e-08, 6.008909281263186e-08, 6.320733803022449e-08, 6.632558324781712e-08, 6.944382846540975e-08, 7.256207368300238e-08, 7.568031890059501e-08, 7.879856411818764e-08, 8.191680933578027e-08, 8.503504744794554e-08]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 861.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 4.0, 2.0, 12.0, 9.0, 17.0, 19.0, 11.0, 22.0, 23.0, 16.0, 28.0, 28.0, 32.0, 28.0, 37.0, 42.0, 29.0, 40.0, 36.0, 52.0, 36.0, 32.0, 45.0, 38.0, 34.0, 29.0, 39.0, 35.0, 20.0, 22.0, 27.0, 19.0, 24.0, 17.0, 19.0, 11.0, 17.0, 8.0, 8.0, 5.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 4.0, 4.0, 1.0], "bins": [-3.029296875, -2.941070556640625, -2.85284423828125, -2.764617919921875, -2.6763916015625, -2.588165283203125, -2.49993896484375, -2.411712646484375, -2.323486328125, -2.235260009765625, -2.14703369140625, -2.058807373046875, -1.9705810546875, -1.882354736328125, -1.79412841796875, -1.705902099609375, -1.61767578125, -1.529449462890625, -1.44122314453125, -1.352996826171875, -1.2647705078125, -1.176544189453125, -1.08831787109375, -1.000091552734375, -0.911865234375, -0.823638916015625, -0.73541259765625, -0.647186279296875, -0.5589599609375, -0.470733642578125, -0.38250732421875, -0.294281005859375, -0.2060546875, -0.117828369140625, -0.02960205078125, 0.058624267578125, 0.1468505859375, 0.235076904296875, 0.32330322265625, 0.411529541015625, 0.499755859375, 0.587982177734375, 0.67620849609375, 0.764434814453125, 0.8526611328125, 0.940887451171875, 1.02911376953125, 1.117340087890625, 1.20556640625, 1.293792724609375, 1.38201904296875, 1.470245361328125, 1.5584716796875, 1.646697998046875, 1.73492431640625, 1.823150634765625, 1.911376953125, 1.999603271484375, 2.08782958984375, 2.176055908203125, 2.2642822265625, 2.352508544921875, 2.44073486328125, 2.528961181640625, 2.6171875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 5.0, 12.0, 8.0, 11.0, 20.0, 19.0, 24.0, 37.0, 37.0, 51.0, 84.0, 121.0, 149.0, 231.0, 351.0, 605.0, 1070.0, 2217.0, 5289.0, 16021.0, 66148.0, 328596.0, 474613.0, 114100.0, 24934.0, 7513.0, 2866.0, 1409.0, 724.0, 378.0, 251.0, 163.0, 117.0, 76.0, 62.0, 38.0, 43.0, 32.0, 27.0, 18.0, 13.0, 17.0, 16.0, 7.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0], "bins": [-4.55078125, -4.41357421875, -4.2763671875, -4.13916015625, -4.001953125, -3.86474609375, -3.7275390625, -3.59033203125, -3.453125, -3.31591796875, -3.1787109375, -3.04150390625, -2.904296875, -2.76708984375, -2.6298828125, -2.49267578125, -2.35546875, -2.21826171875, -2.0810546875, -1.94384765625, -1.806640625, -1.66943359375, -1.5322265625, -1.39501953125, -1.2578125, -1.12060546875, -0.9833984375, -0.84619140625, -0.708984375, -0.57177734375, -0.4345703125, -0.29736328125, -0.16015625, -0.02294921875, 0.1142578125, 0.25146484375, 0.388671875, 0.52587890625, 0.6630859375, 0.80029296875, 0.9375, 1.07470703125, 1.2119140625, 1.34912109375, 1.486328125, 1.62353515625, 1.7607421875, 1.89794921875, 2.03515625, 2.17236328125, 2.3095703125, 2.44677734375, 2.583984375, 2.72119140625, 2.8583984375, 2.99560546875, 3.1328125, 3.27001953125, 3.4072265625, 3.54443359375, 3.681640625, 3.81884765625, 3.9560546875, 4.09326171875, 4.23046875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 3.0, 9.0, 18.0, 19.0, 19.0, 21.0, 31.0, 30.0, 49.0, 56.0, 62.0, 56.0, 126.0, 389.0, 1583.0, 168.0, 80.0, 67.0, 49.0, 49.0, 40.0, 32.0, 28.0, 15.0, 11.0, 18.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7109375, -7.392333984375, -7.07373046875, -6.755126953125, -6.4365234375, -6.117919921875, -5.79931640625, -5.480712890625, -5.162109375, -4.843505859375, -4.52490234375, -4.206298828125, -3.8876953125, -3.569091796875, -3.25048828125, -2.931884765625, -2.61328125, -2.294677734375, -1.97607421875, -1.657470703125, -1.3388671875, -1.020263671875, -0.70166015625, -0.383056640625, -0.064453125, 0.254150390625, 0.57275390625, 0.891357421875, 1.2099609375, 1.528564453125, 1.84716796875, 2.165771484375, 2.484375, 2.802978515625, 3.12158203125, 3.440185546875, 3.7587890625, 4.077392578125, 4.39599609375, 4.714599609375, 5.033203125, 5.351806640625, 5.67041015625, 5.989013671875, 6.3076171875, 6.626220703125, 6.94482421875, 7.263427734375, 7.58203125, 7.900634765625, 8.21923828125, 8.537841796875, 8.8564453125, 9.175048828125, 9.49365234375, 9.812255859375, 10.130859375, 10.449462890625, 10.76806640625, 11.086669921875, 11.4052734375, 11.723876953125, 12.04248046875, 12.361083984375, 12.6796875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 6.0, 6.0, 13.0, 12.0, 15.0, 17.0, 54.0, 68.0, 126.0, 219.0, 393.0, 1004.0, 32904.0, 3106531.0, 2945.0, 642.0, 311.0, 154.0, 100.0, 57.0, 28.0, 21.0, 18.0, 11.0, 12.0, 17.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-30.0625, -29.297119140625, -28.53173828125, -27.766357421875, -27.0009765625, -26.235595703125, -25.47021484375, -24.704833984375, -23.939453125, -23.174072265625, -22.40869140625, -21.643310546875, -20.8779296875, -20.112548828125, -19.34716796875, -18.581787109375, -17.81640625, -17.051025390625, -16.28564453125, -15.520263671875, -14.7548828125, -13.989501953125, -13.22412109375, -12.458740234375, -11.693359375, -10.927978515625, -10.16259765625, -9.397216796875, -8.6318359375, -7.866455078125, -7.10107421875, -6.335693359375, -5.5703125, -4.804931640625, -4.03955078125, -3.274169921875, -2.5087890625, -1.743408203125, -0.97802734375, -0.212646484375, 0.552734375, 1.318115234375, 2.08349609375, 2.848876953125, 3.6142578125, 4.379638671875, 5.14501953125, 5.910400390625, 6.67578125, 7.441162109375, 8.20654296875, 8.971923828125, 9.7373046875, 10.502685546875, 11.26806640625, 12.033447265625, 12.798828125, 13.564208984375, 14.32958984375, 15.094970703125, 15.8603515625, 16.625732421875, 17.39111328125, 18.156494140625, 18.921875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 31.0, 436.0, 487.0, 57.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.99073314666748, -6.779177188873291, -4.567621231079102, -2.356065273284912, -0.14450931549072266, 2.0670461654663086, 4.278602600097656, 6.490159034729004, 8.701714515686035, 10.913270950317383, 13.124826431274414, 15.336381912231445, 17.54793930053711, 19.75949478149414, 21.971050262451172, 24.182605743408203, 26.394161224365234, 28.605716705322266, 30.817272186279297, 33.02882766723633, 35.240386962890625, 37.451942443847656, 39.66349792480469, 41.87505340576172, 44.08660888671875, 46.29816436767578, 48.50971984863281, 50.721275329589844, 52.932830810546875, 55.144386291503906, 57.3559455871582, 59.567501068115234, 61.779052734375, 63.99060821533203, 66.20216369628906, 68.4137191772461, 70.62527465820312, 72.83683013916016, 75.04838562011719, 77.25994873046875, 79.47149658203125, 81.68305206298828, 83.89460754394531, 86.10616302490234, 88.31771850585938, 90.5292739868164, 92.74082946777344, 94.952392578125, 97.16394805908203, 99.37550354003906, 101.5870590209961, 103.79861450195312, 106.01016998291016, 108.22172546386719, 110.43328094482422, 112.64483642578125, 114.85639953613281, 117.06795501708984, 119.27951049804688, 121.4910659790039, 123.70262145996094, 125.91417694091797, 128.125732421875, 130.33729553222656, 132.54884338378906]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 3.0, 4.0, 5.0, 6.0, 3.0, 10.0, 14.0, 15.0, 16.0, 12.0, 18.0, 15.0, 20.0, 26.0, 29.0, 40.0, 28.0, 30.0, 27.0, 34.0, 37.0, 45.0, 36.0, 39.0, 43.0, 23.0, 31.0, 36.0, 41.0, 28.0, 39.0, 29.0, 26.0, 25.0, 29.0, 18.0, 18.0, 17.0, 17.0, 16.0, 16.0, 13.0, 6.0, 6.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-15.852767944335938, -15.32209587097168, -14.791422843933105, -14.260750770568848, -13.73007869720459, -13.199405670166016, -12.668733596801758, -12.1380615234375, -11.607389450073242, -11.076717376708984, -10.54604434967041, -10.015372276306152, -9.484700202941895, -8.95402717590332, -8.423355102539062, -7.892683029174805, -7.3620100021362305, -6.8313374519348145, -6.300665378570557, -5.769992828369141, -5.239320755004883, -4.708648204803467, -4.177975654602051, -3.647303342819214, -3.116631031036377, -2.58595871925354, -2.055286407470703, -1.524613857269287, -0.9939415454864502, -0.4632692337036133, 0.06740331649780273, 0.5980756282806396, 1.1287479400634766, 1.6594202518463135, 2.1900925636291504, 2.7207651138305664, 3.2514374256134033, 3.7821097373962402, 4.312782287597656, 4.843454360961914, 5.37412691116333, 5.904799461364746, 6.435471534729004, 6.96614408493042, 7.496816635131836, 8.027488708496094, 8.558160781860352, 9.088833808898926, 9.619505882263184, 10.150177955627441, 10.680850982666016, 11.211523056030273, 11.742195129394531, 12.272867202758789, 12.803540229797363, 13.334212303161621, 13.864885330200195, 14.395557403564453, 14.926230430603027, 15.456902503967285, 15.987574577331543, 16.518247604370117, 17.048919677734375, 17.579591751098633, 18.11026382446289]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 6.0, 3.0, 8.0, 13.0, 2.0, 13.0, 11.0, 10.0, 18.0, 20.0, 25.0, 31.0, 33.0, 30.0, 26.0, 45.0, 31.0, 42.0, 37.0, 33.0, 43.0, 36.0, 48.0, 35.0, 39.0, 35.0, 52.0, 33.0, 27.0, 20.0, 28.0, 26.0, 17.0, 23.0, 13.0, 17.0, 20.0, 11.0, 9.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.12109375, -3.0208740234375, -2.920654296875, -2.8204345703125, -2.72021484375, -2.6199951171875, -2.519775390625, -2.4195556640625, -2.3193359375, -2.2191162109375, -2.118896484375, -2.0186767578125, -1.91845703125, -1.8182373046875, -1.718017578125, -1.6177978515625, -1.517578125, -1.4173583984375, -1.317138671875, -1.2169189453125, -1.11669921875, -1.0164794921875, -0.916259765625, -0.8160400390625, -0.7158203125, -0.6156005859375, -0.515380859375, -0.4151611328125, -0.31494140625, -0.2147216796875, -0.114501953125, -0.0142822265625, 0.0859375, 0.1861572265625, 0.286376953125, 0.3865966796875, 0.48681640625, 0.5870361328125, 0.687255859375, 0.7874755859375, 0.8876953125, 0.9879150390625, 1.088134765625, 1.1883544921875, 1.28857421875, 1.3887939453125, 1.489013671875, 1.5892333984375, 1.689453125, 1.7896728515625, 1.889892578125, 1.9901123046875, 2.09033203125, 2.1905517578125, 2.290771484375, 2.3909912109375, 2.4912109375, 2.5914306640625, 2.691650390625, 2.7918701171875, 2.89208984375, 2.9923095703125, 3.092529296875, 3.1927490234375, 3.29296875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 6.0, 11.0, 15.0, 17.0, 26.0, 27.0, 43.0, 51.0, 62.0, 88.0, 100.0, 164.0, 184.0, 237.0, 329.0, 480.0, 685.0, 1162.0, 2996.0, 14661.0, 156810.0, 2905548.0, 1047370.0, 51463.0, 6827.0, 1808.0, 871.0, 587.0, 381.0, 295.0, 250.0, 167.0, 135.0, 91.0, 67.0, 67.0, 49.0, 32.0, 31.0, 18.0, 22.0, 14.0, 9.0, 7.0, 3.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.765625, -15.2696533203125, -14.773681640625, -14.2777099609375, -13.78173828125, -13.2857666015625, -12.789794921875, -12.2938232421875, -11.7978515625, -11.3018798828125, -10.805908203125, -10.3099365234375, -9.81396484375, -9.3179931640625, -8.822021484375, -8.3260498046875, -7.830078125, -7.3341064453125, -6.838134765625, -6.3421630859375, -5.84619140625, -5.3502197265625, -4.854248046875, -4.3582763671875, -3.8623046875, -3.3663330078125, -2.870361328125, -2.3743896484375, -1.87841796875, -1.3824462890625, -0.886474609375, -0.3905029296875, 0.10546875, 0.6014404296875, 1.097412109375, 1.5933837890625, 2.08935546875, 2.5853271484375, 3.081298828125, 3.5772705078125, 4.0732421875, 4.5692138671875, 5.065185546875, 5.5611572265625, 6.05712890625, 6.5531005859375, 7.049072265625, 7.5450439453125, 8.041015625, 8.5369873046875, 9.032958984375, 9.5289306640625, 10.02490234375, 10.5208740234375, 11.016845703125, 11.5128173828125, 12.0087890625, 12.5047607421875, 13.000732421875, 13.4967041015625, 13.99267578125, 14.4886474609375, 14.984619140625, 15.4805908203125, 15.9765625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 8.0, 8.0, 27.0, 39.0, 52.0, 72.0, 100.0, 148.0, 217.0, 280.0, 425.0, 529.0, 618.0, 463.0, 356.0, 215.0, 160.0, 113.0, 78.0, 51.0, 38.0, 19.0, 21.0, 7.0, 13.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.296875, -6.0355224609375, -5.774169921875, -5.5128173828125, -5.25146484375, -4.9901123046875, -4.728759765625, -4.4674072265625, -4.2060546875, -3.9447021484375, -3.683349609375, -3.4219970703125, -3.16064453125, -2.8992919921875, -2.637939453125, -2.3765869140625, -2.115234375, -1.8538818359375, -1.592529296875, -1.3311767578125, -1.06982421875, -0.8084716796875, -0.547119140625, -0.2857666015625, -0.0244140625, 0.2369384765625, 0.498291015625, 0.7596435546875, 1.02099609375, 1.2823486328125, 1.543701171875, 1.8050537109375, 2.06640625, 2.3277587890625, 2.589111328125, 2.8504638671875, 3.11181640625, 3.3731689453125, 3.634521484375, 3.8958740234375, 4.1572265625, 4.4185791015625, 4.679931640625, 4.9412841796875, 5.20263671875, 5.4639892578125, 5.725341796875, 5.9866943359375, 6.248046875, 6.5093994140625, 6.770751953125, 7.0321044921875, 7.29345703125, 7.5548095703125, 7.816162109375, 8.0775146484375, 8.3388671875, 8.6002197265625, 8.861572265625, 9.1229248046875, 9.38427734375, 9.6456298828125, 9.906982421875, 10.1683349609375, 10.4296875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 8.0, 12.0, 20.0, 25.0, 26.0, 45.0, 40.0, 51.0, 109.0, 157.0, 315.0, 592.0, 1681.0, 6035.0, 31417.0, 239177.0, 2276049.0, 1463771.0, 146692.0, 21119.0, 4436.0, 1252.0, 487.0, 240.0, 142.0, 115.0, 65.0, 55.0, 35.0, 33.0, 22.0, 14.0, 13.0, 9.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.190673828125, -7.89697265625, -7.603271484375, -7.3095703125, -7.015869140625, -6.72216796875, -6.428466796875, -6.134765625, -5.841064453125, -5.54736328125, -5.253662109375, -4.9599609375, -4.666259765625, -4.37255859375, -4.078857421875, -3.78515625, -3.491455078125, -3.19775390625, -2.904052734375, -2.6103515625, -2.316650390625, -2.02294921875, -1.729248046875, -1.435546875, -1.141845703125, -0.84814453125, -0.554443359375, -0.2607421875, 0.032958984375, 0.32666015625, 0.620361328125, 0.9140625, 1.207763671875, 1.50146484375, 1.795166015625, 2.0888671875, 2.382568359375, 2.67626953125, 2.969970703125, 3.263671875, 3.557373046875, 3.85107421875, 4.144775390625, 4.4384765625, 4.732177734375, 5.02587890625, 5.319580078125, 5.61328125, 5.906982421875, 6.20068359375, 6.494384765625, 6.7880859375, 7.081787109375, 7.37548828125, 7.669189453125, 7.962890625, 8.256591796875, 8.55029296875, 8.843994140625, 9.1376953125, 9.431396484375, 9.72509765625, 10.018798828125, 10.3125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 8.0, 17.0, 19.0, 29.0, 29.0, 43.0, 49.0, 73.0, 65.0, 46.0, 88.0, 79.0, 71.0, 66.0, 61.0, 57.0, 53.0, 30.0, 29.0, 21.0, 21.0, 6.0, 5.0, 4.0, 3.0, 6.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.623638153076172, -30.243188858032227, -28.86273956298828, -27.48229217529297, -26.101842880249023, -24.721393585205078, -23.340946197509766, -21.96049690246582, -20.580047607421875, -19.19959831237793, -17.819149017333984, -16.438701629638672, -15.058252334594727, -13.677803039550781, -12.297354698181152, -10.916906356811523, -9.536457061767578, -8.156007766723633, -6.775559425354004, -5.395110607147217, -4.01466178894043, -2.6342129707336426, -1.2537641525268555, 0.12668418884277344, 1.5071334838867188, 2.887582302093506, 4.268031120300293, 5.64847993850708, 7.028928756713867, 8.409378051757812, 9.789826393127441, 11.17027473449707, 12.550724029541016, 13.931173324584961, 15.31162166595459, 16.69207000732422, 18.072519302368164, 19.45296859741211, 20.833415985107422, 22.213865280151367, 23.594314575195312, 24.974763870239258, 26.355213165283203, 27.735660552978516, 29.11610984802246, 30.496559143066406, 31.87700653076172, 33.25745391845703, 34.63790512084961, 36.01835250854492, 37.3988037109375, 38.77925109863281, 40.159698486328125, 41.5401496887207, 42.920597076416016, 44.301048278808594, 45.681495666503906, 47.06194305419922, 48.4423942565918, 49.82284164428711, 51.20329284667969, 52.583740234375, 53.96418762207031, 55.344635009765625, 56.7250862121582]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 7.0, 8.0, 11.0, 13.0, 14.0, 7.0, 13.0, 16.0, 18.0, 17.0, 23.0, 29.0, 28.0, 29.0, 43.0, 44.0, 46.0, 44.0, 37.0, 43.0, 42.0, 38.0, 36.0, 35.0, 42.0, 39.0, 29.0, 34.0, 26.0, 27.0, 23.0, 16.0, 17.0, 15.0, 10.0, 12.0, 11.0, 16.0, 14.0, 8.0, 5.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-30.3070011138916, -29.419960021972656, -28.53291893005371, -27.645877838134766, -26.75883674621582, -25.871795654296875, -24.984756469726562, -24.097713470458984, -23.210674285888672, -22.323633193969727, -21.43659210205078, -20.549551010131836, -19.66250991821289, -18.775468826293945, -17.888427734375, -17.001388549804688, -16.11434555053711, -15.227304458618164, -14.340263366699219, -13.453222274780273, -12.566181182861328, -11.679140090942383, -10.792099952697754, -9.905058860778809, -9.018017768859863, -8.130976676940918, -7.243935585021973, -6.3568949699401855, -5.46985387802124, -4.582812786102295, -3.695772171020508, -2.8087310791015625, -1.9216880798339844, -1.0346471071243286, -0.14760613441467285, 0.7394347190856934, 1.6264758110046387, 2.513516902923584, 3.400557518005371, 4.287598609924316, 5.174639701843262, 6.061680793762207, 6.948721885681152, 7.8357625007629395, 8.722803115844727, 9.609844207763672, 10.496885299682617, 11.383926391601562, 12.270967483520508, 13.158008575439453, 14.045049667358398, 14.932090759277344, 15.819131851196289, 16.706172943115234, 17.593212127685547, 18.480255126953125, 19.367294311523438, 20.254335403442383, 21.141376495361328, 22.028417587280273, 22.91545867919922, 23.802499771118164, 24.68954086303711, 25.576580047607422, 26.463623046875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 9.0, 11.0, 10.0, 15.0, 14.0, 13.0, 11.0, 19.0, 20.0, 23.0, 34.0, 37.0, 34.0, 51.0, 43.0, 48.0, 37.0, 49.0, 45.0, 46.0, 45.0, 43.0, 45.0, 35.0, 30.0, 29.0, 25.0, 25.0, 18.0, 23.0, 14.0, 11.0, 16.0, 13.0, 11.0, 9.0, 12.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-60.21875, -58.46728515625, -56.7158203125, -54.96435546875, -53.212890625, -51.46142578125, -49.7099609375, -47.95849609375, -46.20703125, -44.45556640625, -42.7041015625, -40.95263671875, -39.201171875, -37.44970703125, -35.6982421875, -33.94677734375, -32.1953125, -30.44384765625, -28.6923828125, -26.94091796875, -25.189453125, -23.43798828125, -21.6865234375, -19.93505859375, -18.18359375, -16.43212890625, -14.6806640625, -12.92919921875, -11.177734375, -9.42626953125, -7.6748046875, -5.92333984375, -4.171875, -2.42041015625, -0.6689453125, 1.08251953125, 2.833984375, 4.58544921875, 6.3369140625, 8.08837890625, 9.83984375, 11.59130859375, 13.3427734375, 15.09423828125, 16.845703125, 18.59716796875, 20.3486328125, 22.10009765625, 23.8515625, 25.60302734375, 27.3544921875, 29.10595703125, 30.857421875, 32.60888671875, 34.3603515625, 36.11181640625, 37.86328125, 39.61474609375, 41.3662109375, 43.11767578125, 44.869140625, 46.62060546875, 48.3720703125, 50.12353515625, 51.875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 12.0, 6.0, 13.0, 15.0, 18.0, 31.0, 55.0, 105.0, 153.0, 209.0, 280.0, 474.0, 685.0, 1058.0, 1589.0, 2379.0, 3564.0, 5329.0, 7980.0, 12144.0, 18246.0, 28914.0, 47594.0, 84932.0, 185914.0, 337393.0, 132043.0, 67286.0, 39374.0, 24134.0, 15655.0, 10247.0, 6907.0, 4601.0, 3135.0, 2008.0, 1347.0, 906.0, 620.0, 420.0, 265.0, 172.0, 111.0, 69.0, 52.0, 46.0, 31.0, 17.0, 8.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.418212890625, -0.4056587219238281, -0.39310455322265625, -0.3805503845214844, -0.3679962158203125, -0.3554420471191406, -0.34288787841796875, -0.3303337097167969, -0.317779541015625, -0.3052253723144531, -0.29267120361328125, -0.2801170349121094, -0.2675628662109375, -0.2550086975097656, -0.24245452880859375, -0.22990036010742188, -0.21734619140625, -0.20479202270507812, -0.19223785400390625, -0.17968368530273438, -0.1671295166015625, -0.15457534790039062, -0.14202117919921875, -0.12946701049804688, -0.116912841796875, -0.10435867309570312, -0.09180450439453125, -0.07925033569335938, -0.0666961669921875, -0.054141998291015625, -0.04158782958984375, -0.029033660888671875, -0.0164794921875, -0.003925323486328125, 0.00862884521484375, 0.021183013916015625, 0.0337371826171875, 0.046291351318359375, 0.05884552001953125, 0.07139968872070312, 0.083953857421875, 0.09650802612304688, 0.10906219482421875, 0.12161636352539062, 0.1341705322265625, 0.14672470092773438, 0.15927886962890625, 0.17183303833007812, 0.18438720703125, 0.19694137573242188, 0.20949554443359375, 0.22204971313476562, 0.2346038818359375, 0.24715805053710938, 0.25971221923828125, 0.2722663879394531, 0.284820556640625, 0.2973747253417969, 0.30992889404296875, 0.3224830627441406, 0.3350372314453125, 0.3475914001464844, 0.36014556884765625, 0.3726997375488281, 0.38525390625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 11.0, 5.0, 12.0, 14.0, 17.0, 17.0, 17.0, 20.0, 21.0, 26.0, 40.0, 25.0, 33.0, 28.0, 38.0, 39.0, 40.0, 27.0, 48.0, 1060.0, 39.0, 37.0, 44.0, 43.0, 44.0, 41.0, 25.0, 22.0, 27.0, 26.0, 20.0, 17.0, 20.0, 19.0, 8.0, 11.0, 10.0, 7.0, 1.0, 4.0, 4.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-36.03125, -34.976318359375, -33.92138671875, -32.866455078125, -31.8115234375, -30.756591796875, -29.70166015625, -28.646728515625, -27.591796875, -26.536865234375, -25.48193359375, -24.427001953125, -23.3720703125, -22.317138671875, -21.26220703125, -20.207275390625, -19.15234375, -18.097412109375, -17.04248046875, -15.987548828125, -14.9326171875, -13.877685546875, -12.82275390625, -11.767822265625, -10.712890625, -9.657958984375, -8.60302734375, -7.548095703125, -6.4931640625, -5.438232421875, -4.38330078125, -3.328369140625, -2.2734375, -1.218505859375, -0.16357421875, 0.891357421875, 1.9462890625, 3.001220703125, 4.05615234375, 5.111083984375, 6.166015625, 7.220947265625, 8.27587890625, 9.330810546875, 10.3857421875, 11.440673828125, 12.49560546875, 13.550537109375, 14.60546875, 15.660400390625, 16.71533203125, 17.770263671875, 18.8251953125, 19.880126953125, 20.93505859375, 21.989990234375, 23.044921875, 24.099853515625, 25.15478515625, 26.209716796875, 27.2646484375, 28.319580078125, 29.37451171875, 30.429443359375, 31.484375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 14.0, 10.0, 16.0, 24.0, 33.0, 50.0, 69.0, 137.0, 167.0, 221.0, 388.0, 600.0, 897.0, 1187.0, 1995.0, 3051.0, 4543.0, 7172.0, 11436.0, 17735.0, 28453.0, 47114.0, 81255.0, 161640.0, 1353225.0, 165386.0, 83171.0, 47526.0, 29407.0, 18021.0, 11282.0, 7386.0, 4677.0, 3035.0, 1975.0, 1297.0, 838.0, 538.0, 361.0, 283.0, 183.0, 95.0, 81.0, 56.0, 54.0, 20.0, 11.0, 6.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1943359375, -0.18796730041503906, -0.18159866333007812, -0.1752300262451172, -0.16886138916015625, -0.1624927520751953, -0.15612411499023438, -0.14975547790527344, -0.1433868408203125, -0.13701820373535156, -0.13064956665039062, -0.12428092956542969, -0.11791229248046875, -0.11154365539550781, -0.10517501831054688, -0.09880638122558594, -0.092437744140625, -0.08606910705566406, -0.07970046997070312, -0.07333183288574219, -0.06696319580078125, -0.06059455871582031, -0.054225921630859375, -0.04785728454589844, -0.0414886474609375, -0.03512001037597656, -0.028751373291015625, -0.022382736206054688, -0.01601409912109375, -0.009645462036132812, -0.003276824951171875, 0.0030918121337890625, 0.00946044921875, 0.015829086303710938, 0.022197723388671875, 0.028566360473632812, 0.03493499755859375, 0.04130363464355469, 0.047672271728515625, 0.05404090881347656, 0.0604095458984375, 0.06677818298339844, 0.07314682006835938, 0.07951545715332031, 0.08588409423828125, 0.09225273132324219, 0.09862136840820312, 0.10499000549316406, 0.111358642578125, 0.11772727966308594, 0.12409591674804688, 0.1304645538330078, 0.13683319091796875, 0.1432018280029297, 0.14957046508789062, 0.15593910217285156, 0.1623077392578125, 0.16867637634277344, 0.17504501342773438, 0.1814136505126953, 0.18778228759765625, 0.1941509246826172, 0.20051956176757812, 0.20688819885253906, 0.2132568359375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 5.0, 7.0, 15.0, 14.0, 12.0, 7.0, 16.0, 29.0, 21.0, 30.0, 52.0, 39.0, 24.0, 32.0, 43.0, 28.0, 41.0, 42.0, 35.0, 54.0, 43.0, 47.0, 37.0, 35.0, 33.0, 28.0, 35.0, 29.0, 23.0, 21.0, 28.0, 17.0, 9.0, 10.0, 14.0, 7.0, 7.0, 5.0, 6.0, 2.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.635883331298828e-06, -3.5138800740242004e-06, -3.3918768167495728e-06, -3.269873559474945e-06, -3.1478703022003174e-06, -3.0258670449256897e-06, -2.903863787651062e-06, -2.7818605303764343e-06, -2.6598572731018066e-06, -2.537854015827179e-06, -2.4158507585525513e-06, -2.2938475012779236e-06, -2.171844244003296e-06, -2.0498409867286682e-06, -1.9278377294540405e-06, -1.8058344721794128e-06, -1.6838312149047852e-06, -1.5618279576301575e-06, -1.4398247003555298e-06, -1.317821443080902e-06, -1.1958181858062744e-06, -1.0738149285316467e-06, -9.51811671257019e-07, -8.298084139823914e-07, -7.078051567077637e-07, -5.85801899433136e-07, -4.637986421585083e-07, -3.417953848838806e-07, -2.1979212760925293e-07, -9.778887033462524e-08, 2.421438694000244e-08, 1.4621764421463013e-07, 2.682209014892578e-07, 3.902241587638855e-07, 5.122274160385132e-07, 6.342306733131409e-07, 7.562339305877686e-07, 8.782371878623962e-07, 1.000240445137024e-06, 1.1222437024116516e-06, 1.2442469596862793e-06, 1.366250216960907e-06, 1.4882534742355347e-06, 1.6102567315101624e-06, 1.73225998878479e-06, 1.8542632460594177e-06, 1.9762665033340454e-06, 2.098269760608673e-06, 2.2202730178833008e-06, 2.3422762751579285e-06, 2.464279532432556e-06, 2.586282789707184e-06, 2.7082860469818115e-06, 2.830289304256439e-06, 2.952292561531067e-06, 3.0742958188056946e-06, 3.1962990760803223e-06, 3.31830233335495e-06, 3.4403055906295776e-06, 3.5623088479042053e-06, 3.684312105178833e-06, 3.8063153624534607e-06, 3.928318619728088e-06, 4.050321877002716e-06, 4.172325134277344e-06]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 7.0, 5.0, 6.0, 2.0, 15.0, 17.0, 32.0, 29.0, 56.0, 86.0, 107.0, 167.0, 241.0, 416.0, 783.0, 1357.0, 2637.0, 5792.0, 13435.0, 36698.0, 79836.0, 159044.0, 236346.0, 231018.0, 149760.0, 73429.0, 31910.0, 13394.0, 5853.0, 2768.0, 1329.0, 709.0, 493.0, 244.0, 159.0, 122.0, 76.0, 58.0, 54.0, 23.0, 16.0, 10.0, 8.0, 2.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7404556274414062e-05, -1.680385321378708e-05, -1.6203150153160095e-05, -1.560244709253311e-05, -1.5001744031906128e-05, -1.4401040971279144e-05, -1.380033791065216e-05, -1.3199634850025177e-05, -1.2598931789398193e-05, -1.199822872877121e-05, -1.1397525668144226e-05, -1.0796822607517242e-05, -1.0196119546890259e-05, -9.595416486263275e-06, -8.994713425636292e-06, -8.394010365009308e-06, -7.793307304382324e-06, -7.1926042437553406e-06, -6.591901183128357e-06, -5.991198122501373e-06, -5.39049506187439e-06, -4.789792001247406e-06, -4.189088940620422e-06, -3.5883858799934387e-06, -2.987682819366455e-06, -2.3869797587394714e-06, -1.7862766981124878e-06, -1.1855736374855042e-06, -5.848705768585205e-07, 1.5832483768463135e-08, 6.165355443954468e-07, 1.2172386050224304e-06, 1.817941665649414e-06, 2.4186447262763977e-06, 3.0193477869033813e-06, 3.620050847530365e-06, 4.220753908157349e-06, 4.821456968784332e-06, 5.422160029411316e-06, 6.0228630900382996e-06, 6.623566150665283e-06, 7.224269211292267e-06, 7.82497227191925e-06, 8.425675332546234e-06, 9.026378393173218e-06, 9.627081453800201e-06, 1.0227784514427185e-05, 1.0828487575054169e-05, 1.1429190635681152e-05, 1.2029893696308136e-05, 1.263059675693512e-05, 1.3231299817562103e-05, 1.3832002878189087e-05, 1.443270593881607e-05, 1.5033408999443054e-05, 1.5634112060070038e-05, 1.623481512069702e-05, 1.6835518181324005e-05, 1.743622124195099e-05, 1.8036924302577972e-05, 1.8637627363204956e-05, 1.923833042383194e-05, 1.9839033484458923e-05, 2.0439736545085907e-05, 2.104043960571289e-05]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 16.0, 19.0, 16.0, 29.0, 26.0, 46.0, 31.0, 40.0, 58.0, 73.0, 77.0, 75.0, 70.0, 63.0, 60.0, 65.0, 47.0, 45.0, 41.0, 24.0, 17.0, 12.0, 17.0, 15.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05051878260565e-06, -3.9237920645973645e-06, -3.7970648918417282e-06, -3.6703379464597674e-06, -3.5436110010778066e-06, -3.416884283069521e-06, -3.2901573376875604e-06, -3.1634303923055995e-06, -3.0367034469236387e-06, -2.909976501541678e-06, -2.783249556159717e-06, -2.656522610777756e-06, -2.529795892769471e-06, -2.4030687200138345e-06, -2.276342002005549e-06, -2.1496150566235883e-06, -2.0228881112416275e-06, -1.8961611658596667e-06, -1.7694342204777058e-06, -1.6427073887825827e-06, -1.5159804434006219e-06, -1.389253498018661e-06, -1.262526666323538e-06, -1.1357997209415771e-06, -1.0090727755596163e-06, -8.823458301776554e-07, -7.556189416391135e-07, -6.288920531005715e-07, -5.021651077186107e-07, -3.7543816233664984e-07, -2.4871127379810787e-07, -1.219843852595659e-07, 4.742560122394934e-09, 1.3146947708264634e-07, 2.5819639404289774e-07, 3.8492331100314914e-07, 5.116502279634005e-07, 6.383771733453614e-07, 7.651040618839033e-07, 8.918309504224453e-07, 1.0185578958044061e-06, 1.145284841186367e-06, 1.2720117865683278e-06, 1.398738618263451e-06, 1.5254655636454117e-06, 1.6521925090273726e-06, 1.7789193407224957e-06, 1.9056462861044565e-06, 2.0323732314864174e-06, 2.159100176868378e-06, 2.285827122250339e-06, 2.4125540676323e-06, 2.5392810130142607e-06, 2.666007731022546e-06, 2.792734676404507e-06, 2.9194616217864677e-06, 3.0461885671684286e-06, 3.1729155125503894e-06, 3.2996424579323502e-06, 3.426369403314311e-06, 3.5530961213225964e-06, 3.6798232940782327e-06, 3.806550012086518e-06, 3.933277184842154e-06, 4.06000390285044e-06]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 8.0, 4.0, 1.0, 9.0, 1.0, 8.0, 12.0, 6.0, 27.0, 13.0, 21.0, 14.0, 18.0, 57.0, 22.0, 44.0, 25.0, 28.0, 59.0, 34.0, 64.0, 24.0, 38.0, 52.0, 25.0, 56.0, 26.0, 62.0, 24.0, 26.0, 38.0, 17.0, 43.0, 13.0, 16.0, 24.0, 9.0, 9.0, 2.0, 4.0, 12.0, 2.0, 6.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6226043701171875e-06, -2.5387853384017944e-06, -2.4549663066864014e-06, -2.3711472749710083e-06, -2.2873282432556152e-06, -2.203509211540222e-06, -2.119690179824829e-06, -2.035871148109436e-06, -1.952052116394043e-06, -1.86823308467865e-06, -1.7844140529632568e-06, -1.7005950212478638e-06, -1.6167759895324707e-06, -1.5329569578170776e-06, -1.4491379261016846e-06, -1.3653188943862915e-06, -1.2814998626708984e-06, -1.1976808309555054e-06, -1.1138617992401123e-06, -1.0300427675247192e-06, -9.462237358093262e-07, -8.624047040939331e-07, -7.7858567237854e-07, -6.94766640663147e-07, -6.109476089477539e-07, -5.271285772323608e-07, -4.4330954551696777e-07, -3.594905138015747e-07, -2.7567148208618164e-07, -1.9185245037078857e-07, -1.0803341865539551e-07, -2.421438694000244e-08, 5.960464477539063e-08, 1.434236764907837e-07, 2.2724270820617676e-07, 3.110617399215698e-07, 3.948807716369629e-07, 4.78699803352356e-07, 5.62518835067749e-07, 6.463378667831421e-07, 7.301568984985352e-07, 8.139759302139282e-07, 8.977949619293213e-07, 9.816139936447144e-07, 1.0654330253601074e-06, 1.1492520570755005e-06, 1.2330710887908936e-06, 1.3168901205062866e-06, 1.4007091522216797e-06, 1.4845281839370728e-06, 1.5683472156524658e-06, 1.6521662473678589e-06, 1.735985279083252e-06, 1.819804310798645e-06, 1.903623342514038e-06, 1.987442374229431e-06, 2.0712614059448242e-06, 2.1550804376602173e-06, 2.2388994693756104e-06, 2.3227185010910034e-06, 2.4065375328063965e-06, 2.4903565645217896e-06, 2.5741755962371826e-06, 2.6579946279525757e-06, 2.7418136596679688e-06]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 9.0, 11.0, 10.0, 15.0, 14.0, 13.0, 11.0, 19.0, 20.0, 23.0, 34.0, 37.0, 34.0, 51.0, 43.0, 48.0, 37.0, 49.0, 45.0, 46.0, 45.0, 43.0, 45.0, 35.0, 30.0, 29.0, 25.0, 25.0, 18.0, 23.0, 14.0, 11.0, 16.0, 13.0, 11.0, 9.0, 12.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-60.21875, -58.46728515625, -56.7158203125, -54.96435546875, -53.212890625, -51.46142578125, -49.7099609375, -47.95849609375, -46.20703125, -44.45556640625, -42.7041015625, -40.95263671875, -39.201171875, -37.44970703125, -35.6982421875, -33.94677734375, -32.1953125, -30.44384765625, -28.6923828125, -26.94091796875, -25.189453125, -23.43798828125, -21.6865234375, -19.93505859375, -18.18359375, -16.43212890625, -14.6806640625, -12.92919921875, -11.177734375, -9.42626953125, -7.6748046875, -5.92333984375, -4.171875, -2.42041015625, -0.6689453125, 1.08251953125, 2.833984375, 4.58544921875, 6.3369140625, 8.08837890625, 9.83984375, 11.59130859375, 13.3427734375, 15.09423828125, 16.845703125, 18.59716796875, 20.3486328125, 22.10009765625, 23.8515625, 25.60302734375, 27.3544921875, 29.10595703125, 30.857421875, 32.60888671875, 34.3603515625, 36.11181640625, 37.86328125, 39.61474609375, 41.3662109375, 43.11767578125, 44.869140625, 46.62060546875, 48.3720703125, 50.12353515625, 51.875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 6.0, 4.0, 10.0, 11.0, 16.0, 15.0, 20.0, 27.0, 34.0, 35.0, 61.0, 89.0, 158.0, 194.0, 372.0, 653.0, 1731.0, 5349.0, 22181.0, 109695.0, 433628.0, 367119.0, 82693.0, 17141.0, 4397.0, 1388.0, 588.0, 303.0, 170.0, 121.0, 71.0, 64.0, 54.0, 20.0, 30.0, 26.0, 18.0, 19.0, 14.0, 9.0, 7.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-9.4140625, -9.136474609375, -8.85888671875, -8.581298828125, -8.3037109375, -8.026123046875, -7.74853515625, -7.470947265625, -7.193359375, -6.915771484375, -6.63818359375, -6.360595703125, -6.0830078125, -5.805419921875, -5.52783203125, -5.250244140625, -4.97265625, -4.695068359375, -4.41748046875, -4.139892578125, -3.8623046875, -3.584716796875, -3.30712890625, -3.029541015625, -2.751953125, -2.474365234375, -2.19677734375, -1.919189453125, -1.6416015625, -1.364013671875, -1.08642578125, -0.808837890625, -0.53125, -0.253662109375, 0.02392578125, 0.301513671875, 0.5791015625, 0.856689453125, 1.13427734375, 1.411865234375, 1.689453125, 1.967041015625, 2.24462890625, 2.522216796875, 2.7998046875, 3.077392578125, 3.35498046875, 3.632568359375, 3.91015625, 4.187744140625, 4.46533203125, 4.742919921875, 5.0205078125, 5.298095703125, 5.57568359375, 5.853271484375, 6.130859375, 6.408447265625, 6.68603515625, 6.963623046875, 7.2412109375, 7.518798828125, 7.79638671875, 8.073974609375, 8.3515625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 8.0, 13.0, 15.0, 28.0, 36.0, 46.0, 63.0, 62.0, 64.0, 91.0, 2142.0, 86.0, 86.0, 74.0, 52.0, 57.0, 33.0, 19.0, 32.0, 12.0, 9.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.875, -149.5517578125, -145.228515625, -140.9052734375, -136.58203125, -132.2587890625, -127.935546875, -123.6123046875, -119.2890625, -114.9658203125, -110.642578125, -106.3193359375, -101.99609375, -97.6728515625, -93.349609375, -89.0263671875, -84.703125, -80.3798828125, -76.056640625, -71.7333984375, -67.41015625, -63.0869140625, -58.763671875, -54.4404296875, -50.1171875, -45.7939453125, -41.470703125, -37.1474609375, -32.82421875, -28.5009765625, -24.177734375, -19.8544921875, -15.53125, -11.2080078125, -6.884765625, -2.5615234375, 1.76171875, 6.0849609375, 10.408203125, 14.7314453125, 19.0546875, 23.3779296875, 27.701171875, 32.0244140625, 36.34765625, 40.6708984375, 44.994140625, 49.3173828125, 53.640625, 57.9638671875, 62.287109375, 66.6103515625, 70.93359375, 75.2568359375, 79.580078125, 83.9033203125, 88.2265625, 92.5498046875, 96.873046875, 101.1962890625, 105.51953125, 109.8427734375, 114.166015625, 118.4892578125, 122.8125]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 16.0, 21.0, 22.0, 34.0, 45.0, 75.0, 112.0, 140.0, 231.0, 328.0, 606.0, 1361.0, 4914.0, 68310.0, 2915417.0, 143219.0, 7353.0, 1562.0, 739.0, 426.0, 248.0, 158.0, 106.0, 78.0, 40.0, 41.0, 23.0, 20.0, 17.0, 13.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.6640625, -14.1849365234375, -13.705810546875, -13.2266845703125, -12.74755859375, -12.2684326171875, -11.789306640625, -11.3101806640625, -10.8310546875, -10.3519287109375, -9.872802734375, -9.3936767578125, -8.91455078125, -8.4354248046875, -7.956298828125, -7.4771728515625, -6.998046875, -6.5189208984375, -6.039794921875, -5.5606689453125, -5.08154296875, -4.6024169921875, -4.123291015625, -3.6441650390625, -3.1650390625, -2.6859130859375, -2.206787109375, -1.7276611328125, -1.24853515625, -0.7694091796875, -0.290283203125, 0.1888427734375, 0.66796875, 1.1470947265625, 1.626220703125, 2.1053466796875, 2.58447265625, 3.0635986328125, 3.542724609375, 4.0218505859375, 4.5009765625, 4.9801025390625, 5.459228515625, 5.9383544921875, 6.41748046875, 6.8966064453125, 7.375732421875, 7.8548583984375, 8.333984375, 8.8131103515625, 9.292236328125, 9.7713623046875, 10.25048828125, 10.7296142578125, 11.208740234375, 11.6878662109375, 12.1669921875, 12.6461181640625, 13.125244140625, 13.6043701171875, 14.08349609375, 14.5626220703125, 15.041748046875, 15.5208740234375, 16.0]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 11.0, 28.0, 96.0, 313.0, 319.0, 148.0, 44.0, 20.0, 7.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.9063720703125, -93.5420150756836, -84.17765808105469, -74.81330108642578, -65.44894409179688, -56.08458709716797, -46.72023010253906, -37.355873107910156, -27.99151611328125, -18.627159118652344, -9.262802124023438, 0.10155487060546875, 9.465911865234375, 18.83026885986328, 28.194625854492188, 37.558982849121094, 46.92333984375, 56.287696838378906, 65.65205383300781, 75.01641082763672, 84.38076782226562, 93.74512481689453, 103.10948181152344, 112.47383880615234, 121.83819580078125, 131.20254516601562, 140.56690979003906, 149.9312744140625, 159.29562377929688, 168.65997314453125, 178.0243377685547, 187.38870239257812, 196.7530517578125, 206.11740112304688, 215.4817657470703, 224.84613037109375, 234.21047973632812, 243.5748291015625, 252.93919372558594, 262.3035583496094, 271.66790771484375, 281.0322570800781, 290.3966064453125, 299.760986328125, 309.1253356933594, 318.48968505859375, 327.85406494140625, 337.2184143066406, 346.582763671875, 355.9471130371094, 365.31146240234375, 374.67584228515625, 384.0401916503906, 393.404541015625, 402.7689208984375, 412.1332702636719, 421.49761962890625, 430.8619689941406, 440.226318359375, 449.5906982421875, 458.9550476074219, 468.31939697265625, 477.68377685546875, 487.0481262207031, 496.4124755859375]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 2.0, 4.0, 10.0, 7.0, 11.0, 10.0, 18.0, 11.0, 20.0, 28.0, 15.0, 36.0, 40.0, 38.0, 41.0, 41.0, 46.0, 45.0, 53.0, 43.0, 57.0, 50.0, 44.0, 41.0, 42.0, 28.0, 39.0, 20.0, 28.0, 26.0, 19.0, 20.0, 15.0, 8.0, 13.0, 11.0, 7.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.92298889160156, -126.03353118896484, -122.14407348632812, -118.25460815429688, -114.36515045166016, -110.47569274902344, -106.58622741699219, -102.69676971435547, -98.80731201171875, -94.91785430908203, -91.02839660644531, -87.13893127441406, -83.24947357177734, -79.36001586914062, -75.47055053710938, -71.58109283447266, -67.69163513183594, -63.80217742919922, -59.912715911865234, -56.02325439453125, -52.13379669189453, -48.24433898925781, -44.35487747192383, -40.465415954589844, -36.575958251953125, -32.686500549316406, -28.797039031982422, -24.90757942199707, -21.01811981201172, -17.128660202026367, -13.239200592041016, -9.349740982055664, -5.4602813720703125, -1.570821762084961, 2.3186378479003906, 6.208097457885742, 10.097557067871094, 13.987016677856445, 17.876476287841797, 21.76593589782715, 25.6553955078125, 29.54485511779785, 33.4343147277832, 37.32377624511719, 41.213233947753906, 45.102691650390625, 48.99215316772461, 52.881614685058594, 56.77107238769531, 60.66053009033203, 64.54998779296875, 68.439453125, 72.32891082763672, 76.21836853027344, 80.10783386230469, 83.9972915649414, 87.88674926757812, 91.77620697021484, 95.66566467285156, 99.55513000488281, 103.44458770751953, 107.33404541015625, 111.2235107421875, 115.11296844482422, 119.00242614746094]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 7.0, 11.0, 13.0, 22.0, 26.0, 28.0, 47.0, 50.0, 54.0, 95.0, 110.0, 155.0, 167.0, 229.0, 311.0, 412.0, 473.0, 521.0, 763.0, 1471.0, 1040028.0, 771.0, 579.0, 447.0, 347.0, 322.0, 245.0, 196.0, 154.0, 116.0, 76.0, 72.0, 47.0, 55.0, 31.0, 22.0, 18.0, 9.0, 9.0, 7.0, 11.0, 5.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-30.341537475585938, -29.36426544189453, -28.386991500854492, -27.409719467163086, -26.432445526123047, -25.45517349243164, -24.477901458740234, -23.500627517700195, -22.523353576660156, -21.54608154296875, -20.56880760192871, -19.591535568237305, -18.614261627197266, -17.63698959350586, -16.659717559814453, -15.682443618774414, -14.705171585083008, -13.727898597717285, -12.750625610351562, -11.773353576660156, -10.796079635620117, -9.818807601928711, -8.841534614562988, -7.864261627197266, -6.886988639831543, -5.90971565246582, -4.932442665100098, -3.955170154571533, -2.9778971672058105, -2.000624179840088, -1.0233516693115234, -0.04607868194580078, 0.9311943054199219, 1.908467173576355, 2.885740041732788, 3.8630127906799316, 4.840285778045654, 5.817558765411377, 6.794831275939941, 7.772104263305664, 8.749377250671387, 9.72665023803711, 10.703923225402832, 11.681196212768555, 12.658468246459961, 13.6357421875, 14.613014221191406, 15.590287208557129, 16.56756019592285, 17.544832229614258, 18.522106170654297, 19.499378204345703, 20.476652145385742, 21.45392417907715, 22.431198120117188, 23.408470153808594, 24.3857421875, 25.363014221191406, 26.340288162231445, 27.31756019592285, 28.29483413696289, 29.272106170654297, 30.249378204345703, 31.226652145385742, 32.20392608642578]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 9.0, 12.0, 26.0, 25.0, 37.0, 82.0, 234.0, 120112.0, 51342560.0, 259.0, 57.0, 25.0, 19.0, 11.0, 7.0, 5.0, 3.0, 8.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1996.619873046875, -1946.710693359375, -1896.8016357421875, -1846.8924560546875, -1796.9833984375, -1747.07421875, -1697.1650390625, -1647.2559814453125, -1597.3468017578125, -1547.4376220703125, -1497.528564453125, -1447.619384765625, -1397.7103271484375, -1347.8011474609375, -1297.89208984375, -1247.98291015625, -1198.07373046875, -1148.16455078125, -1098.2554931640625, -1048.3463134765625, -998.4371948242188, -948.528076171875, -898.6189575195312, -848.7098388671875, -798.80078125, -748.8916625976562, -698.9825439453125, -649.0733642578125, -599.1642456054688, -549.255126953125, -499.34600830078125, -449.4368591308594, -399.5277099609375, -349.61859130859375, -299.7094421386719, -249.80032348632812, -199.8911895751953, -149.9820556640625, -100.07293701171875, -50.163787841796875, -0.254669189453125, 49.65446090698242, 99.56359100341797, 149.47271728515625, 199.38185119628906, 249.29098510742188, 299.2001037597656, 349.1092529296875, 399.01837158203125, 448.927490234375, 498.8366394042969, 548.7457275390625, 598.6549072265625, 648.5640258789062, 698.47314453125, 748.38232421875, 798.2913818359375, 848.2005004882812, 898.109619140625, 948.018798828125, 997.9279174804688, 1047.8370361328125, 1097.74609375, 1147.6552734375, 1197.564453125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 8.0, 13.0, 14.0, 27.0, 41.0, 50.0, 61.0, 90.0, 139.0, 189.0, 324.0, 483.0, 746.0, 1079.0, 1743.0, 2764.0, 4256.0, 6813.0, 11148.0, 18251.0, 29892.0, 49717.0, 83167.0, 142782.0, 266478.0, 591608.0, 4075678.0, 472707.0, 222321.0, 123369.0, 72456.0, 43701.0, 26404.0, 16049.0, 10146.0, 6020.0, 3774.0, 2436.0, 1587.0, 958.0, 678.0, 438.0, 271.0, 183.0, 128.0, 80.0, 62.0, 35.0, 23.0, 17.0, 13.0, 8.0, 11.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.101318359375, -0.09818840026855469, -0.09505844116210938, -0.09192848205566406, -0.08879852294921875, -0.08566856384277344, -0.08253860473632812, -0.07940864562988281, -0.0762786865234375, -0.07314872741699219, -0.07001876831054688, -0.06688880920410156, -0.06375885009765625, -0.06062889099121094, -0.057498931884765625, -0.05436897277832031, -0.051239013671875, -0.04810905456542969, -0.044979095458984375, -0.04184913635253906, -0.03871917724609375, -0.03558921813964844, -0.032459259033203125, -0.029329299926757812, -0.0261993408203125, -0.023069381713867188, -0.019939422607421875, -0.016809463500976562, -0.01367950439453125, -0.010549545288085938, -0.007419586181640625, -0.0042896270751953125, -0.00115966796875, 0.0019702911376953125, 0.005100250244140625, 0.008230209350585938, 0.01136016845703125, 0.014490127563476562, 0.017620086669921875, 0.020750045776367188, 0.0238800048828125, 0.027009963989257812, 0.030139923095703125, 0.03326988220214844, 0.03639984130859375, 0.03952980041503906, 0.042659759521484375, 0.04578971862792969, 0.048919677734375, 0.05204963684082031, 0.055179595947265625, 0.05830955505371094, 0.06143951416015625, 0.06456947326660156, 0.06769943237304688, 0.07082939147949219, 0.0739593505859375, 0.07708930969238281, 0.08021926879882812, 0.08334922790527344, 0.08647918701171875, 0.08960914611816406, 0.09273910522460938, 0.09586906433105469, 0.0989990234375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 2.0, 4.0, 8.0, 11.0, 13.0, 8.0, 11.0, 19.0, 25.0, 22.0, 37.0, 26.0, 23.0, 34.0, 41.0, 33.0, 30.0, 40.0, 39.0, 1069.0, 33.0, 54.0, 55.0, 44.0, 39.0, 31.0, 38.0, 28.0, 36.0, 26.0, 26.0, 22.0, 14.0, 18.0, 12.0, 21.0, 8.0, 6.0, 4.0, 4.0, 3.0, 4.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.296875, -13.817626953125, -13.33837890625, -12.859130859375, -12.3798828125, -11.900634765625, -11.42138671875, -10.942138671875, -10.462890625, -9.983642578125, -9.50439453125, -9.025146484375, -8.5458984375, -8.066650390625, -7.58740234375, -7.108154296875, -6.62890625, -6.149658203125, -5.67041015625, -5.191162109375, -4.7119140625, -4.232666015625, -3.75341796875, -3.274169921875, -2.794921875, -2.315673828125, -1.83642578125, -1.357177734375, -0.8779296875, -0.398681640625, 0.08056640625, 0.559814453125, 1.0390625, 1.518310546875, 1.99755859375, 2.476806640625, 2.9560546875, 3.435302734375, 3.91455078125, 4.393798828125, 4.873046875, 5.352294921875, 5.83154296875, 6.310791015625, 6.7900390625, 7.269287109375, 7.74853515625, 8.227783203125, 8.70703125, 9.186279296875, 9.66552734375, 10.144775390625, 10.6240234375, 11.103271484375, 11.58251953125, 12.061767578125, 12.541015625, 13.020263671875, 13.49951171875, 13.978759765625, 14.4580078125, 14.937255859375, 15.41650390625, 15.895751953125, 16.375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 5.0, 5.0, 4.0, 7.0, 19.0, 28.0, 45.0, 42.0, 69.0, 116.0, 184.0, 210.0, 330.0, 478.0, 695.0, 915.0, 1404.0, 2115.0, 2982.0, 4445.0, 6577.0, 10065.0, 15507.0, 23893.0, 38134.0, 60700.0, 100150.0, 169191.0, 310873.0, 624007.0, 3924688.0, 434143.0, 222109.0, 127098.0, 77113.0, 47436.0, 29689.0, 19003.0, 12203.0, 8152.0, 5412.0, 3561.0, 2329.0, 1622.0, 1130.0, 774.0, 473.0, 369.0, 304.0, 193.0, 137.0, 104.0, 70.0, 43.0, 31.0, 22.0, 19.0, 12.0, 5.0, 7.0, 2.0, 4.0, 2.0], "bins": [-0.07647705078125, -0.07402896881103516, -0.07158088684082031, -0.06913280487060547, -0.06668472290039062, -0.06423664093017578, -0.06178855895996094, -0.059340476989746094, -0.05689239501953125, -0.054444313049316406, -0.05199623107910156, -0.04954814910888672, -0.047100067138671875, -0.04465198516845703, -0.04220390319824219, -0.039755821228027344, -0.0373077392578125, -0.034859657287597656, -0.03241157531738281, -0.02996349334716797, -0.027515411376953125, -0.02506732940673828, -0.022619247436523438, -0.020171165466308594, -0.01772308349609375, -0.015275001525878906, -0.012826919555664062, -0.010378837585449219, -0.007930755615234375, -0.005482673645019531, -0.0030345916748046875, -0.0005865097045898438, 0.001861572265625, 0.004309654235839844, 0.0067577362060546875, 0.009205818176269531, 0.011653900146484375, 0.014101982116699219, 0.016550064086914062, 0.018998146057128906, 0.02144622802734375, 0.023894309997558594, 0.026342391967773438, 0.02879047393798828, 0.031238555908203125, 0.03368663787841797, 0.03613471984863281, 0.038582801818847656, 0.0410308837890625, 0.043478965759277344, 0.04592704772949219, 0.04837512969970703, 0.050823211669921875, 0.05327129364013672, 0.05571937561035156, 0.058167457580566406, 0.06061553955078125, 0.0630636215209961, 0.06551170349121094, 0.06795978546142578, 0.07040786743164062, 0.07285594940185547, 0.07530403137207031, 0.07775211334228516, 0.0802001953125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 5.0, 0.0, 6.0, 0.0, 14.0, 8.0, 13.0, 18.0, 15.0, 25.0, 25.0, 24.0, 30.0, 28.0, 32.0, 37.0, 48.0, 38.0, 50.0, 41.0, 1070.0, 45.0, 49.0, 38.0, 47.0, 44.0, 36.0, 29.0, 31.0, 30.0, 24.0, 19.0, 19.0, 19.0, 19.0, 11.0, 8.0, 7.0, 6.0, 5.0, 3.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.609375, -12.2337646484375, -11.858154296875, -11.4825439453125, -11.10693359375, -10.7313232421875, -10.355712890625, -9.9801025390625, -9.6044921875, -9.2288818359375, -8.853271484375, -8.4776611328125, -8.10205078125, -7.7264404296875, -7.350830078125, -6.9752197265625, -6.599609375, -6.2239990234375, -5.848388671875, -5.4727783203125, -5.09716796875, -4.7215576171875, -4.345947265625, -3.9703369140625, -3.5947265625, -3.2191162109375, -2.843505859375, -2.4678955078125, -2.09228515625, -1.7166748046875, -1.341064453125, -0.9654541015625, -0.58984375, -0.2142333984375, 0.161376953125, 0.5369873046875, 0.91259765625, 1.2882080078125, 1.663818359375, 2.0394287109375, 2.4150390625, 2.7906494140625, 3.166259765625, 3.5418701171875, 3.91748046875, 4.2930908203125, 4.668701171875, 5.0443115234375, 5.419921875, 5.7955322265625, 6.171142578125, 6.5467529296875, 6.92236328125, 7.2979736328125, 7.673583984375, 8.0491943359375, 8.4248046875, 8.8004150390625, 9.176025390625, 9.5516357421875, 9.92724609375, 10.3028564453125, 10.678466796875, 11.0540771484375, 11.4296875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 5.0, 9.0, 5.0, 7.0, 6.0, 9.0, 6.0, 12.0, 24.0, 34.0, 48.0, 46.0, 47.0, 59.0, 86.0, 108.0, 125.0, 141.0, 216.0, 272.0, 326.0, 504.0, 723.0, 1282.0, 3934.0, 19601.0, 158735.0, 6034468.0, 55662.0, 9478.0, 2250.0, 933.0, 556.0, 376.0, 263.0, 198.0, 168.0, 141.0, 93.0, 97.0, 56.0, 73.0, 52.0, 47.0, 40.0, 21.0, 32.0, 21.0, 5.0, 15.0, 15.0, 2.0, 6.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.44140625, -0.4272918701171875, -0.413177490234375, -0.3990631103515625, -0.38494873046875, -0.3708343505859375, -0.356719970703125, -0.3426055908203125, -0.3284912109375, -0.3143768310546875, -0.300262451171875, -0.2861480712890625, -0.27203369140625, -0.2579193115234375, -0.243804931640625, -0.2296905517578125, -0.215576171875, -0.2014617919921875, -0.187347412109375, -0.1732330322265625, -0.15911865234375, -0.1450042724609375, -0.130889892578125, -0.1167755126953125, -0.1026611328125, -0.0885467529296875, -0.074432373046875, -0.0603179931640625, -0.04620361328125, -0.0320892333984375, -0.017974853515625, -0.0038604736328125, 0.01025390625, 0.0243682861328125, 0.038482666015625, 0.0525970458984375, 0.06671142578125, 0.0808258056640625, 0.094940185546875, 0.1090545654296875, 0.1231689453125, 0.1372833251953125, 0.151397705078125, 0.1655120849609375, 0.17962646484375, 0.1937408447265625, 0.207855224609375, 0.2219696044921875, 0.236083984375, 0.2501983642578125, 0.264312744140625, 0.2784271240234375, 0.29254150390625, 0.3066558837890625, 0.320770263671875, 0.3348846435546875, 0.3489990234375, 0.3631134033203125, 0.377227783203125, 0.3913421630859375, 0.40545654296875, 0.4195709228515625, 0.433685302734375, 0.4477996826171875, 0.4619140625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 10.0, 11.0, 16.0, 11.0, 14.0, 11.0, 26.0, 23.0, 19.0, 24.0, 24.0, 40.0, 36.0, 36.0, 36.0, 34.0, 37.0, 37.0, 39.0, 1050.0, 49.0, 35.0, 42.0, 40.0, 34.0, 32.0, 32.0, 27.0, 25.0, 24.0, 19.0, 14.0, 19.0, 19.0, 10.0, 15.0, 14.0, 6.0, 8.0, 9.0, 2.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.7578125, -7.510986328125, -7.26416015625, -7.017333984375, -6.7705078125, -6.523681640625, -6.27685546875, -6.030029296875, -5.783203125, -5.536376953125, -5.28955078125, -5.042724609375, -4.7958984375, -4.549072265625, -4.30224609375, -4.055419921875, -3.80859375, -3.561767578125, -3.31494140625, -3.068115234375, -2.8212890625, -2.574462890625, -2.32763671875, -2.080810546875, -1.833984375, -1.587158203125, -1.34033203125, -1.093505859375, -0.8466796875, -0.599853515625, -0.35302734375, -0.106201171875, 0.140625, 0.387451171875, 0.63427734375, 0.881103515625, 1.1279296875, 1.374755859375, 1.62158203125, 1.868408203125, 2.115234375, 2.362060546875, 2.60888671875, 2.855712890625, 3.1025390625, 3.349365234375, 3.59619140625, 3.843017578125, 4.08984375, 4.336669921875, 4.58349609375, 4.830322265625, 5.0771484375, 5.323974609375, 5.57080078125, 5.817626953125, 6.064453125, 6.311279296875, 6.55810546875, 6.804931640625, 7.0517578125, 7.298583984375, 7.54541015625, 7.792236328125, 8.0390625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 650.0, 356.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.42967224121094, -31.19765853881836, -28.96564292907715, -26.73362922668457, -24.50161361694336, -22.26959991455078, -20.037586212158203, -17.805572509765625, -15.573556900024414, -13.34154224395752, -11.109527587890625, -8.877513885498047, -6.645499229431152, -4.413484573364258, -2.1814708709716797, 0.050543785095214844, 2.2825584411621094, 4.514573097229004, 6.74658727645874, 8.978601455688477, 11.210616111755371, 13.442630767822266, 15.674644470214844, 17.906658172607422, 20.138673782348633, 22.37068748474121, 24.602703094482422, 26.834716796875, 29.066730499267578, 31.29874610900879, 33.53076171875, 35.76277542114258, 37.994789123535156, 40.226802825927734, 42.45881652832031, 44.690834045410156, 46.922847747802734, 49.15486145019531, 51.38687515258789, 53.61888885498047, 55.85090637207031, 58.08292007446289, 60.31493377685547, 62.54695129394531, 64.77896118164062, 67.01097869873047, 69.24299621582031, 71.47500610351562, 73.70701599121094, 75.93903350830078, 78.1710433959961, 80.40306091308594, 82.63507080078125, 84.8670883178711, 87.09910583496094, 89.33111572265625, 91.5631332397461, 93.79515075683594, 96.02716064453125, 98.2591781616211, 100.4911880493164, 102.72320556640625, 104.95521545410156, 107.1872329711914, 109.41925048828125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 12.0, 6.0, 7.0, 10.0, 15.0, 16.0, 11.0, 14.0, 18.0, 21.0, 29.0, 18.0, 17.0, 25.0, 35.0, 31.0, 31.0, 43.0, 33.0, 47.0, 37.0, 33.0, 44.0, 53.0, 49.0, 34.0, 19.0, 24.0, 29.0, 28.0, 24.0, 20.0, 22.0, 17.0, 14.0, 17.0, 21.0, 13.0, 9.0, 8.0, 7.0, 8.0, 9.0, 10.0, 2.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-16.5479736328125, -16.06859588623047, -15.589218139648438, -15.109840393066406, -14.630461692810059, -14.151083946228027, -13.671706199645996, -13.192328453063965, -12.712950706481934, -12.233572959899902, -11.754195213317871, -11.274816513061523, -10.795438766479492, -10.316061019897461, -9.83668327331543, -9.357305526733398, -8.877927780151367, -8.398550033569336, -7.9191718101501465, -7.439794063568115, -6.960416316986084, -6.4810380935668945, -6.001660346984863, -5.522282600402832, -5.042903900146484, -4.563526153564453, -4.084147930145264, -3.6047701835632324, -3.125392436981201, -2.646014451980591, -2.1666364669799805, -1.6872587203979492, -1.207880973815918, -0.7285031080245972, -0.2491251826286316, 0.23025274276733398, 0.7096306085586548, 1.1890084743499756, 1.668386459350586, 2.147764205932617, 2.6271421909332275, 3.106520175933838, 3.585897922515869, 4.065276145935059, 4.54465389251709, 5.024031639099121, 5.503409385681152, 5.982787132263184, 6.462165355682373, 6.941543102264404, 7.420921325683594, 7.900299072265625, 8.379676818847656, 8.859054565429688, 9.338432312011719, 9.81781005859375, 10.297188758850098, 10.776566505432129, 11.25594425201416, 11.735322952270508, 12.214700698852539, 12.69407844543457, 13.173456192016602, 13.652833938598633, 14.132211685180664]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 7.0, 4.0, 9.0, 9.0, 3.0, 11.0, 11.0, 12.0, 21.0, 33.0, 28.0, 33.0, 64.0, 82.0, 65.0, 102.0, 151.0, 195.0, 294.0, 419.0, 770.0, 3967.0, 17672.0, 3853001.0, 300593.0, 10316.0, 3324.0, 841.0, 522.0, 375.0, 296.0, 232.0, 164.0, 114.0, 122.0, 76.0, 81.0, 56.0, 39.0, 31.0, 20.0, 18.0, 25.0, 9.0, 13.0, 16.0, 4.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.036346435546875, -0.03517293930053711, -0.03399944305419922, -0.03282594680786133, -0.03165245056152344, -0.030478954315185547, -0.029305458068847656, -0.028131961822509766, -0.026958465576171875, -0.025784969329833984, -0.024611473083496094, -0.023437976837158203, -0.022264480590820312, -0.021090984344482422, -0.01991748809814453, -0.01874399185180664, -0.01757049560546875, -0.01639699935913086, -0.015223503112792969, -0.014050006866455078, -0.012876510620117188, -0.011703014373779297, -0.010529518127441406, -0.009356021881103516, -0.008182525634765625, -0.007009029388427734, -0.005835533142089844, -0.004662036895751953, -0.0034885406494140625, -0.002315044403076172, -0.0011415481567382812, 3.1948089599609375e-05, 0.0012054443359375, 0.0023789405822753906, 0.0035524368286132812, 0.004725933074951172, 0.0058994293212890625, 0.007072925567626953, 0.008246421813964844, 0.009419918060302734, 0.010593414306640625, 0.011766910552978516, 0.012940406799316406, 0.014113903045654297, 0.015287399291992188, 0.016460895538330078, 0.01763439178466797, 0.01880788803100586, 0.01998138427734375, 0.02115488052368164, 0.02232837677001953, 0.023501873016357422, 0.024675369262695312, 0.025848865509033203, 0.027022361755371094, 0.028195858001708984, 0.029369354248046875, 0.030542850494384766, 0.031716346740722656, 0.03288984298706055, 0.03406333923339844, 0.03523683547973633, 0.03641033172607422, 0.03758382797241211, 0.03875732421875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 0.0, 5.0, 7.0, 5.0, 6.0, 14.0, 7.0, 14.0, 22.0, 781.0, 36.0, 11.0, 12.0, 14.0, 10.0, 5.0, 5.0, 6.0, 5.0, 1.0, 4.0, 1.0, 3.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0189361572265625, -0.0183258056640625, -0.0177154541015625, -0.0171051025390625, -0.0164947509765625, -0.0158843994140625, -0.0152740478515625, -0.0146636962890625, -0.0140533447265625, -0.0134429931640625, -0.0128326416015625, -0.0122222900390625, -0.0116119384765625, -0.0110015869140625, -0.0103912353515625, -0.0097808837890625, -0.0091705322265625, -0.0085601806640625, -0.0079498291015625, -0.0073394775390625, -0.0067291259765625, -0.0061187744140625, -0.0055084228515625, -0.0048980712890625, -0.0042877197265625, -0.0036773681640625, -0.0030670166015625, -0.0024566650390625, -0.0018463134765625, -0.0012359619140625, -0.0006256103515625, -1.52587890625e-05, 0.0005950927734375, 0.0012054443359375, 0.0018157958984375, 0.0024261474609375, 0.0030364990234375, 0.0036468505859375, 0.0042572021484375, 0.0048675537109375, 0.0054779052734375, 0.0060882568359375, 0.0066986083984375, 0.0073089599609375, 0.0079193115234375, 0.0085296630859375, 0.0091400146484375, 0.0097503662109375, 0.0103607177734375, 0.0109710693359375, 0.0115814208984375, 0.0121917724609375, 0.0128021240234375, 0.0134124755859375, 0.0140228271484375, 0.0146331787109375, 0.0152435302734375, 0.0158538818359375, 0.0164642333984375, 0.0170745849609375, 0.0176849365234375, 0.0182952880859375, 0.0189056396484375, 0.0195159912109375, 0.0201263427734375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 4.0, 8.0, 15.0, 10.0, 14.0, 17.0, 24.0, 37.0, 49.0, 96.0, 243.0, 992.0, 6034.0, 569871.0, 3608951.0, 5860.0, 1334.0, 324.0, 141.0, 72.0, 52.0, 29.0, 14.0, 12.0, 11.0, 11.0, 8.0, 6.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.10882568359375, -0.10552978515625, -0.10223388671875, -0.09893798828125, -0.09564208984375, -0.09234619140625, -0.08905029296875, -0.08575439453125, -0.08245849609375, -0.07916259765625, -0.07586669921875, -0.07257080078125, -0.06927490234375, -0.06597900390625, -0.06268310546875, -0.05938720703125, -0.05609130859375, -0.05279541015625, -0.04949951171875, -0.04620361328125, -0.04290771484375, -0.03961181640625, -0.03631591796875, -0.03302001953125, -0.02972412109375, -0.02642822265625, -0.02313232421875, -0.01983642578125, -0.01654052734375, -0.01324462890625, -0.00994873046875, -0.00665283203125, -0.00335693359375, -6.103515625e-05, 0.00323486328125, 0.00653076171875, 0.00982666015625, 0.01312255859375, 0.01641845703125, 0.01971435546875, 0.02301025390625, 0.02630615234375, 0.02960205078125, 0.03289794921875, 0.03619384765625, 0.03948974609375, 0.04278564453125, 0.04608154296875, 0.04937744140625, 0.05267333984375, 0.05596923828125, 0.05926513671875, 0.06256103515625, 0.06585693359375, 0.06915283203125, 0.07244873046875, 0.07574462890625, 0.07904052734375, 0.08233642578125, 0.08563232421875, 0.08892822265625, 0.09222412109375, 0.09552001953125, 0.09881591796875, 0.10211181640625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 5.0, 5.0, 4.0, 7.0, 8.0, 5.0, 13.0, 7.0, 49.0, 208.0, 1669.0, 1761.0, 190.0, 53.0, 19.0, 9.0, 4.0, 6.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.036468505859375, -0.03529214859008789, -0.03411579132080078, -0.03293943405151367, -0.03176307678222656, -0.030586719512939453, -0.029410362243652344, -0.028234004974365234, -0.027057647705078125, -0.025881290435791016, -0.024704933166503906, -0.023528575897216797, -0.022352218627929688, -0.021175861358642578, -0.01999950408935547, -0.01882314682006836, -0.01764678955078125, -0.01647043228149414, -0.015294075012207031, -0.014117717742919922, -0.012941360473632812, -0.011765003204345703, -0.010588645935058594, -0.009412288665771484, -0.008235931396484375, -0.007059574127197266, -0.005883216857910156, -0.004706859588623047, -0.0035305023193359375, -0.002354145050048828, -0.0011777877807617188, -1.430511474609375e-06, 0.0011749267578125, 0.0023512840270996094, 0.0035276412963867188, 0.004703998565673828, 0.0058803558349609375, 0.007056713104248047, 0.008233070373535156, 0.009409427642822266, 0.010585784912109375, 0.011762142181396484, 0.012938499450683594, 0.014114856719970703, 0.015291213989257812, 0.016467571258544922, 0.01764392852783203, 0.01882028579711914, 0.01999664306640625, 0.02117300033569336, 0.02234935760498047, 0.023525714874267578, 0.024702072143554688, 0.025878429412841797, 0.027054786682128906, 0.028231143951416016, 0.029407501220703125, 0.030583858489990234, 0.031760215759277344, 0.03293657302856445, 0.03411293029785156, 0.03528928756713867, 0.03646564483642578, 0.03764200210571289, 0.038818359375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1016.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2939869165420532, -0.2597557604312897, -0.22552458941936493, -0.19129341840744019, -0.15706226229667664, -0.12283110618591309, -0.08859993517398834, -0.0543687641620636, -0.02013760805130005, 0.014093555510044098, 0.048324719071388245, 0.08255588263273239, 0.11678704619407654, 0.1510182023048401, 0.18524937331676483, 0.21948054432868958, 0.2537117004394531, 0.2879428565502167, 0.3221740126609802, 0.35640519857406616, 0.3906363546848297, 0.42486751079559326, 0.4590986967086792, 0.49332985281944275, 0.5275610089302063, 0.5617921948432922, 0.5960233211517334, 0.6302545070648193, 0.6644856929779053, 0.6987168192863464, 0.7329480051994324, 0.7671791315078735, 0.8014103174209595, 0.8356415033340454, 0.8698726296424866, 0.9041038155555725, 0.9383349418640137, 0.9725661277770996, 1.0067973136901855, 1.0410284996032715, 1.0752596855163574, 1.1094908714294434, 1.1437220573425293, 1.1779531240463257, 1.2121843099594116, 1.2464154958724976, 1.2806466817855835, 1.3148778676986694, 1.3491089344024658, 1.3833401203155518, 1.4175713062286377, 1.451802372932434, 1.48603355884552, 1.520264744758606, 1.554495930671692, 1.5887271165847778, 1.6229581832885742, 1.6571893692016602, 1.691420555114746, 1.7256516218185425, 1.7598828077316284, 1.7941139936447144, 1.8283451795578003, 1.8625763654708862, 1.8968075513839722]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 4.0, 4.0, 5.0, 7.0, 8.0, 11.0, 17.0, 22.0, 24.0, 42.0, 50.0, 68.0, 76.0, 94.0, 112.0, 90.0, 82.0, 63.0, 40.0, 39.0, 29.0, 20.0, 10.0, 10.0, 8.0, 6.0, 3.0, 5.0, 9.0, 9.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.11265707015991211, -0.10868007689714432, -0.10470308363437653, -0.10072609037160873, -0.09674909710884094, -0.09277210384607315, -0.08879511058330536, -0.08481811732053757, -0.08084112405776978, -0.07686413079500198, -0.07288713753223419, -0.0689101442694664, -0.06493315100669861, -0.06095615774393082, -0.056979164481163025, -0.05300217121839523, -0.04902517795562744, -0.04504818469285965, -0.04107119143009186, -0.037094198167324066, -0.033117204904556274, -0.029140211641788483, -0.02516321837902069, -0.0211862251162529, -0.017209231853485107, -0.013232238590717316, -0.009255245327949524, -0.005278252065181732, -0.0013012588024139404, 0.0026757344603538513, 0.006652727723121643, 0.010629720985889435, 0.014606714248657227, 0.01858370751142502, 0.02256070077419281, 0.026537694036960602, 0.030514687299728394, 0.034491680562496185, 0.03846867382526398, 0.04244566708803177, 0.04642266035079956, 0.05039965361356735, 0.054376646876335144, 0.058353640139102936, 0.06233063340187073, 0.06630762666463852, 0.07028461992740631, 0.0742616131901741, 0.0782386064529419, 0.08221559971570969, 0.08619259297847748, 0.09016958624124527, 0.09414657950401306, 0.09812357276678085, 0.10210056602954865, 0.10607755929231644, 0.11005455255508423, 0.11403154581785202, 0.11800853908061981, 0.1219855323433876, 0.1259625256061554, 0.12993952631950378, 0.13391651213169098, 0.13789349794387817, 0.14187049865722656]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 0.0, 1.0, 6.0, 6.0, 14.0, 20.0, 28.0, 37.0, 62.0, 76.0, 109.0, 147.0, 213.0, 279.0, 374.0, 493.0, 743.0, 1064.0, 1574.0, 2263.0, 3521.0, 5967.0, 10781.0, 25431.0, 903992.0, 53916.0, 16257.0, 7750.0, 4448.0, 2725.0, 1816.0, 1286.0, 883.0, 613.0, 457.0, 333.0, 237.0, 176.0, 133.0, 101.0, 79.0, 47.0, 28.0, 21.0, 18.0, 10.0, 6.0, 10.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0206298828125, -0.019959211349487305, -0.01928853988647461, -0.018617868423461914, -0.01794719696044922, -0.017276525497436523, -0.016605854034423828, -0.015935182571411133, -0.015264511108398438, -0.014593839645385742, -0.013923168182373047, -0.013252496719360352, -0.012581825256347656, -0.011911153793334961, -0.011240482330322266, -0.01056981086730957, -0.009899139404296875, -0.00922846794128418, -0.008557796478271484, -0.007887125015258789, -0.007216453552246094, -0.0065457820892333984, -0.005875110626220703, -0.005204439163208008, -0.0045337677001953125, -0.003863096237182617, -0.003192424774169922, -0.0025217533111572266, -0.0018510818481445312, -0.001180410385131836, -0.0005097389221191406, 0.0001609325408935547, 0.00083160400390625, 0.0015022754669189453, 0.0021729469299316406, 0.002843618392944336, 0.0035142898559570312, 0.0041849613189697266, 0.004855632781982422, 0.005526304244995117, 0.0061969757080078125, 0.006867647171020508, 0.007538318634033203, 0.008208990097045898, 0.008879661560058594, 0.009550333023071289, 0.010221004486083984, 0.01089167594909668, 0.011562347412109375, 0.01223301887512207, 0.012903690338134766, 0.013574361801147461, 0.014245033264160156, 0.014915704727172852, 0.015586376190185547, 0.016257047653198242, 0.016927719116210938, 0.017598390579223633, 0.018269062042236328, 0.018939733505249023, 0.01961040496826172, 0.020281076431274414, 0.02095174789428711, 0.021622419357299805, 0.0222930908203125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 6.0, 3.0, 6.0, 12.0, 8.0, 9.0, 17.0, 27.0, 777.0, 34.0, 10.0, 14.0, 9.0, 12.0, 2.0, 8.0, 5.0, 4.0, 2.0, 5.0, 1.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0182342529296875, -0.017642498016357422, -0.017050743103027344, -0.016458988189697266, -0.015867233276367188, -0.01527547836303711, -0.014683723449707031, -0.014091968536376953, -0.013500213623046875, -0.012908458709716797, -0.012316703796386719, -0.01172494888305664, -0.011133193969726562, -0.010541439056396484, -0.009949684143066406, -0.009357929229736328, -0.00876617431640625, -0.008174419403076172, -0.007582664489746094, -0.006990909576416016, -0.0063991546630859375, -0.005807399749755859, -0.005215644836425781, -0.004623889923095703, -0.004032135009765625, -0.003440380096435547, -0.0028486251831054688, -0.0022568702697753906, -0.0016651153564453125, -0.0010733604431152344, -0.00048160552978515625, 0.00011014938354492188, 0.000701904296875, 0.0012936592102050781, 0.0018854141235351562, 0.0024771690368652344, 0.0030689239501953125, 0.0036606788635253906, 0.004252433776855469, 0.004844188690185547, 0.005435943603515625, 0.006027698516845703, 0.006619453430175781, 0.007211208343505859, 0.0078029632568359375, 0.008394718170166016, 0.008986473083496094, 0.009578227996826172, 0.01016998291015625, 0.010761737823486328, 0.011353492736816406, 0.011945247650146484, 0.012537002563476562, 0.01312875747680664, 0.013720512390136719, 0.014312267303466797, 0.014904022216796875, 0.015495777130126953, 0.01608753204345703, 0.01667928695678711, 0.017271041870117188, 0.017862796783447266, 0.018454551696777344, 0.019046306610107422, 0.0196380615234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 9.0, 11.0, 6.0, 16.0, 19.0, 8.0, 21.0, 25.0, 29.0, 49.0, 38.0, 69.0, 77.0, 118.0, 133.0, 197.0, 348.0, 860.0, 3310.0, 31131.0, 879679.0, 122150.0, 7400.0, 1420.0, 491.0, 254.0, 141.0, 97.0, 83.0, 63.0, 59.0, 44.0, 36.0, 31.0, 21.0, 25.0, 24.0, 9.0, 8.0, 11.0, 6.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.07452392578125, -0.07224559783935547, -0.06996726989746094, -0.0676889419555664, -0.06541061401367188, -0.06313228607177734, -0.06085395812988281, -0.05857563018798828, -0.05629730224609375, -0.05401897430419922, -0.05174064636230469, -0.049462318420410156, -0.047183990478515625, -0.044905662536621094, -0.04262733459472656, -0.04034900665283203, -0.0380706787109375, -0.03579235076904297, -0.03351402282714844, -0.031235694885253906, -0.028957366943359375, -0.026679039001464844, -0.024400711059570312, -0.02212238311767578, -0.01984405517578125, -0.01756572723388672, -0.015287399291992188, -0.013009071350097656, -0.010730743408203125, -0.008452415466308594, -0.0061740875244140625, -0.0038957595825195312, -0.001617431640625, 0.0006608963012695312, 0.0029392242431640625, 0.005217552185058594, 0.007495880126953125, 0.009774208068847656, 0.012052536010742188, 0.014330863952636719, 0.01660919189453125, 0.01888751983642578, 0.021165847778320312, 0.023444175720214844, 0.025722503662109375, 0.028000831604003906, 0.030279159545898438, 0.03255748748779297, 0.0348358154296875, 0.03711414337158203, 0.03939247131347656, 0.041670799255371094, 0.043949127197265625, 0.046227455139160156, 0.04850578308105469, 0.05078411102294922, 0.05306243896484375, 0.05534076690673828, 0.05761909484863281, 0.059897422790527344, 0.062175750732421875, 0.0644540786743164, 0.06673240661621094, 0.06901073455810547, 0.0712890625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 9.0, 11.0, 6.0, 15.0, 13.0, 6.0, 15.0, 17.0, 15.0, 29.0, 18.0, 25.0, 28.0, 40.0, 31.0, 34.0, 39.0, 36.0, 39.0, 41.0, 45.0, 33.0, 44.0, 34.0, 31.0, 37.0, 33.0, 24.0, 27.0, 20.0, 29.0, 25.0, 16.0, 26.0, 13.0, 18.0, 23.0, 7.0, 6.0, 10.0, 6.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.06732177734375, -0.0652627944946289, -0.06320381164550781, -0.06114482879638672, -0.059085845947265625, -0.05702686309814453, -0.05496788024902344, -0.052908897399902344, -0.05084991455078125, -0.048790931701660156, -0.04673194885253906, -0.04467296600341797, -0.042613983154296875, -0.04055500030517578, -0.03849601745605469, -0.036437034606933594, -0.0343780517578125, -0.032319068908691406, -0.030260086059570312, -0.02820110321044922, -0.026142120361328125, -0.02408313751220703, -0.022024154663085938, -0.019965171813964844, -0.01790618896484375, -0.015847206115722656, -0.013788223266601562, -0.011729240417480469, -0.009670257568359375, -0.007611274719238281, -0.0055522918701171875, -0.0034933090209960938, -0.001434326171875, 0.0006246566772460938, 0.0026836395263671875, 0.004742622375488281, 0.006801605224609375, 0.008860588073730469, 0.010919570922851562, 0.012978553771972656, 0.01503753662109375, 0.017096519470214844, 0.019155502319335938, 0.02121448516845703, 0.023273468017578125, 0.02533245086669922, 0.027391433715820312, 0.029450416564941406, 0.0315093994140625, 0.033568382263183594, 0.03562736511230469, 0.03768634796142578, 0.039745330810546875, 0.04180431365966797, 0.04386329650878906, 0.045922279357910156, 0.04798126220703125, 0.050040245056152344, 0.05209922790527344, 0.05415821075439453, 0.056217193603515625, 0.05827617645263672, 0.06033515930175781, 0.062394142150878906, 0.064453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 8.0, 6.0, 11.0, 9.0, 13.0, 26.0, 28.0, 29.0, 50.0, 69.0, 85.0, 158.0, 237.0, 447.0, 784.0, 1823.0, 6740.0, 45448.0, 937093.0, 45165.0, 6293.0, 2084.0, 795.0, 461.0, 181.0, 140.0, 117.0, 71.0, 45.0, 34.0, 17.0, 16.0, 19.0, 8.0, 6.0, 14.0, 6.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-2.6226043701171875e-05, -2.54875048995018e-05, -2.4748966097831726e-05, -2.401042729616165e-05, -2.3271888494491577e-05, -2.2533349692821503e-05, -2.1794810891151428e-05, -2.1056272089481354e-05, -2.031773328781128e-05, -1.9579194486141205e-05, -1.884065568447113e-05, -1.8102116882801056e-05, -1.736357808113098e-05, -1.6625039279460907e-05, -1.5886500477790833e-05, -1.5147961676120758e-05, -1.4409422874450684e-05, -1.3670884072780609e-05, -1.2932345271110535e-05, -1.219380646944046e-05, -1.1455267667770386e-05, -1.0716728866100311e-05, -9.978190064430237e-06, -9.239651262760162e-06, -8.501112461090088e-06, -7.762573659420013e-06, -7.024034857749939e-06, -6.2854960560798645e-06, -5.54695725440979e-06, -4.8084184527397156e-06, -4.069879651069641e-06, -3.3313408493995667e-06, -2.592802047729492e-06, -1.8542632460594177e-06, -1.1157244443893433e-06, -3.771856427192688e-07, 3.6135315895080566e-07, 1.0998919606208801e-06, 1.8384307622909546e-06, 2.576969563961029e-06, 3.3155083656311035e-06, 4.054047167301178e-06, 4.7925859689712524e-06, 5.531124770641327e-06, 6.269663572311401e-06, 7.008202373981476e-06, 7.74674117565155e-06, 8.485279977321625e-06, 9.2238187789917e-06, 9.962357580661774e-06, 1.0700896382331848e-05, 1.1439435184001923e-05, 1.2177973985671997e-05, 1.2916512787342072e-05, 1.3655051589012146e-05, 1.439359039068222e-05, 1.5132129192352295e-05, 1.587066799402237e-05, 1.6609206795692444e-05, 1.734774559736252e-05, 1.8086284399032593e-05, 1.8824823200702667e-05, 1.9563362002372742e-05, 2.0301900804042816e-05, 2.104043960571289e-05]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 5.0, 1.0, 11.0, 9.0, 20.0, 13.0, 20.0, 35.0, 15.0, 32.0, 28.0, 41.0, 55.0, 51.0, 48.0, 53.0, 55.0, 61.0, 34.0, 45.0, 71.0, 60.0, 40.0, 34.0, 27.0, 32.0, 25.0, 14.0, 18.0, 2.0, 13.0, 11.0, 8.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.3974647521972656e-06, -3.2838433980941772e-06, -3.170222043991089e-06, -3.0566006898880005e-06, -2.942979335784912e-06, -2.8293579816818237e-06, -2.7157366275787354e-06, -2.602115273475647e-06, -2.4884939193725586e-06, -2.3748725652694702e-06, -2.261251211166382e-06, -2.1476298570632935e-06, -2.034008502960205e-06, -1.9203871488571167e-06, -1.8067657947540283e-06, -1.69314444065094e-06, -1.5795230865478516e-06, -1.4659017324447632e-06, -1.3522803783416748e-06, -1.2386590242385864e-06, -1.125037670135498e-06, -1.0114163160324097e-06, -8.977949619293213e-07, -7.841736078262329e-07, -6.705522537231445e-07, -5.569308996200562e-07, -4.4330954551696777e-07, -3.296881914138794e-07, -2.1606683731079102e-07, -1.0244548320770264e-07, 1.1175870895385742e-08, 1.2479722499847412e-07, 2.384185791015625e-07, 3.520399332046509e-07, 4.6566128730773926e-07, 5.792826414108276e-07, 6.92903995513916e-07, 8.065253496170044e-07, 9.201467037200928e-07, 1.0337680578231812e-06, 1.1473894119262695e-06, 1.261010766029358e-06, 1.3746321201324463e-06, 1.4882534742355347e-06, 1.601874828338623e-06, 1.7154961824417114e-06, 1.8291175365447998e-06, 1.942738890647888e-06, 2.0563602447509766e-06, 2.169981598854065e-06, 2.2836029529571533e-06, 2.3972243070602417e-06, 2.51084566116333e-06, 2.6244670152664185e-06, 2.738088369369507e-06, 2.8517097234725952e-06, 2.9653310775756836e-06, 3.078952431678772e-06, 3.1925737857818604e-06, 3.3061951398849487e-06, 3.419816493988037e-06, 3.5334378480911255e-06, 3.647059202194214e-06, 3.7606805562973022e-06, 3.874301910400391e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 3.0, 2.0, 5.0, 4.0, 9.0, 12.0, 18.0, 24.0, 21.0, 28.0, 49.0, 57.0, 89.0, 91.0, 164.0, 335.0, 1073.0, 6464.0, 329889.0, 700357.0, 7728.0, 1115.0, 380.0, 184.0, 137.0, 76.0, 59.0, 44.0, 26.0, 20.0, 19.0, 18.0, 13.0, 11.0, 10.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.7179718017578125e-05, -2.640392631292343e-05, -2.5628134608268738e-05, -2.4852342903614044e-05, -2.407655119895935e-05, -2.3300759494304657e-05, -2.2524967789649963e-05, -2.174917608499527e-05, -2.0973384380340576e-05, -2.0197592675685883e-05, -1.942180097103119e-05, -1.8646009266376495e-05, -1.7870217561721802e-05, -1.7094425857067108e-05, -1.6318634152412415e-05, -1.554284244775772e-05, -1.4767050743103027e-05, -1.3991259038448334e-05, -1.321546733379364e-05, -1.2439675629138947e-05, -1.1663883924484253e-05, -1.088809221982956e-05, -1.0112300515174866e-05, -9.336508810520172e-06, -8.560717105865479e-06, -7.784925401210785e-06, -7.009133696556091e-06, -6.233341991901398e-06, -5.457550287246704e-06, -4.6817585825920105e-06, -3.905966877937317e-06, -3.1301751732826233e-06, -2.3543834686279297e-06, -1.578591763973236e-06, -8.028000593185425e-07, -2.7008354663848877e-08, 7.487833499908447e-07, 1.5245750546455383e-06, 2.300366759300232e-06, 3.0761584639549255e-06, 3.851950168609619e-06, 4.627741873264313e-06, 5.403533577919006e-06, 6.1793252825737e-06, 6.9551169872283936e-06, 7.730908691883087e-06, 8.50670039653778e-06, 9.282492101192474e-06, 1.0058283805847168e-05, 1.0834075510501862e-05, 1.1609867215156555e-05, 1.2385658919811249e-05, 1.3161450624465942e-05, 1.3937242329120636e-05, 1.471303403377533e-05, 1.5488825738430023e-05, 1.6264617443084717e-05, 1.704040914773941e-05, 1.7816200852394104e-05, 1.8591992557048798e-05, 1.936778426170349e-05, 2.0143575966358185e-05, 2.091936767101288e-05, 2.1695159375667572e-05, 2.2470951080322266e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 3.0, 2.0, 3.0, 4.0, 7.0, 9.0, 13.0, 19.0, 13.0, 15.0, 25.0, 30.0, 37.0, 20.0, 35.0, 37.0, 69.0, 69.0, 63.0, 71.0, 62.0, 69.0, 49.0, 57.0, 45.0, 27.0, 27.0, 24.0, 14.0, 15.0, 10.0, 12.0, 11.0, 10.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.4557113647460938e-05, -2.3855827748775482e-05, -2.3154541850090027e-05, -2.245325595140457e-05, -2.1751970052719116e-05, -2.105068415403366e-05, -2.0349398255348206e-05, -1.964811235666275e-05, -1.8946826457977295e-05, -1.824554055929184e-05, -1.7544254660606384e-05, -1.684296876192093e-05, -1.6141682863235474e-05, -1.544039696455002e-05, -1.4739111065864563e-05, -1.4037825167179108e-05, -1.3336539268493652e-05, -1.2635253369808197e-05, -1.1933967471122742e-05, -1.1232681572437286e-05, -1.0531395673751831e-05, -9.830109775066376e-06, -9.12882387638092e-06, -8.427537977695465e-06, -7.72625207901001e-06, -7.0249661803245544e-06, -6.323680281639099e-06, -5.622394382953644e-06, -4.9211084842681885e-06, -4.219822585582733e-06, -3.518536686897278e-06, -2.8172507882118225e-06, -2.115964889526367e-06, -1.4146789908409119e-06, -7.133930921554565e-07, -1.210719347000122e-08, 6.891787052154541e-07, 1.3904646039009094e-06, 2.0917505025863647e-06, 2.79303640127182e-06, 3.4943222999572754e-06, 4.195608198642731e-06, 4.896894097328186e-06, 5.598179996013641e-06, 6.299465894699097e-06, 7.000751793384552e-06, 7.702037692070007e-06, 8.403323590755463e-06, 9.104609489440918e-06, 9.805895388126373e-06, 1.0507181286811829e-05, 1.1208467185497284e-05, 1.190975308418274e-05, 1.2611038982868195e-05, 1.331232488155365e-05, 1.4013610780239105e-05, 1.471489667892456e-05, 1.5416182577610016e-05, 1.611746847629547e-05, 1.6818754374980927e-05, 1.7520040273666382e-05, 1.8221326172351837e-05, 1.8922612071037292e-05, 1.9623897969722748e-05, 2.0325183868408203e-05]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 875.0, 136.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.669297218322754, -4.587241172790527, -4.505185127258301, -4.423129081726074, -4.341073036193848, -4.259017467498779, -4.176961421966553, -4.094905376434326, -4.0128493309021, -3.930793285369873, -3.8487372398376465, -3.766681432723999, -3.6846253871917725, -3.602569341659546, -3.5205135345458984, -3.438457489013672, -3.3564014434814453, -3.2743453979492188, -3.192289352416992, -3.1102335453033447, -3.028177499771118, -2.9461214542388916, -2.864065647125244, -2.7820096015930176, -2.699953556060791, -2.6178975105285645, -2.535841464996338, -2.4537856578826904, -2.371729612350464, -2.2896735668182373, -2.20761775970459, -2.1255617141723633, -2.0435056686401367, -1.9614496231079102, -1.8793936967849731, -1.7973377704620361, -1.7152817249298096, -1.633225679397583, -1.551169753074646, -1.469113826751709, -1.3870577812194824, -1.3050017356872559, -1.2229458093643188, -1.1408898830413818, -1.0588338375091553, -0.9767778515815735, -0.8947218656539917, -0.8126658797264099, -0.7306098341941833, -0.6485538482666016, -0.5664978623390198, -0.484441876411438, -0.4023858904838562, -0.3203299045562744, -0.23827391862869263, -0.15621793270111084, -0.07416194677352905, 0.007894039154052734, 0.08995002508163452, 0.1720060110092163, 0.2540619969367981, 0.3361179828643799, 0.41817396879196167, 0.5002299547195435, 0.5822859406471252]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 6.0, 6.0, 5.0, 11.0, 14.0, 16.0, 18.0, 26.0, 49.0, 112.0, 144.0, 178.0, 141.0, 104.0, 59.0, 35.0, 16.0, 11.0, 8.0, 7.0, 7.0, 3.0, 4.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.386279821395874, -1.339289665222168, -1.2922996282577515, -1.2453094720840454, -1.198319435119629, -1.1513292789459229, -1.1043391227722168, -1.0573489665985107, -1.0103589296340942, -0.963368833065033, -0.9163787364959717, -0.8693885803222656, -0.8223984837532043, -0.7754083871841431, -0.728418231010437, -0.6814281344413757, -0.6344380378723145, -0.5874479413032532, -0.5404578447341919, -0.49346768856048584, -0.44647759199142456, -0.3994874954223633, -0.3524973690509796, -0.30550724267959595, -0.25851714611053467, -0.2115270346403122, -0.16453692317008972, -0.11754681169986725, -0.07055670022964478, -0.023566588759422302, 0.02342352271080017, 0.07041364908218384, 0.11740386486053467, 0.16439397633075714, 0.21138408780097961, 0.2583742141723633, 0.30536431074142456, 0.35235440731048584, 0.3993445336818695, 0.4463346600532532, 0.49332475662231445, 0.5403148531913757, 0.587304949760437, 0.6342951059341431, 0.6812852025032043, 0.7282752990722656, 0.7752654552459717, 0.822255551815033, 0.8692456483840942, 0.9162357449531555, 0.9632258415222168, 1.0102159976959229, 1.057206153869629, 1.1041961908340454, 1.1511863470077515, 1.198176383972168, 1.245166540145874, 1.29215669631958, 1.3391467332839966, 1.3861368894577026, 1.4331269264221191, 1.4801170825958252, 1.5271072387695312, 1.5740973949432373, 1.6210874319076538]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 2.0, 2.0, 10.0, 9.0, 7.0, 23.0, 33.0, 52.0, 105.0, 198.0, 500.0, 1144.0, 3897.0, 52441.0, 4125752.0, 6156.0, 2087.0, 877.0, 449.0, 213.0, 123.0, 63.0, 36.0, 17.0, 24.0, 10.0, 8.0, 8.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1973876953125, -0.19035911560058594, -0.18333053588867188, -0.1763019561767578, -0.16927337646484375, -0.1622447967529297, -0.15521621704101562, -0.14818763732910156, -0.1411590576171875, -0.13413047790527344, -0.12710189819335938, -0.12007331848144531, -0.11304473876953125, -0.10601615905761719, -0.09898757934570312, -0.09195899963378906, -0.084930419921875, -0.07790184020996094, -0.07087326049804688, -0.06384468078613281, -0.05681610107421875, -0.04978752136230469, -0.042758941650390625, -0.03573036193847656, -0.0287017822265625, -0.021673202514648438, -0.014644622802734375, -0.0076160430908203125, -0.00058746337890625, 0.0064411163330078125, 0.013469696044921875, 0.020498275756835938, 0.02752685546875, 0.03455543518066406, 0.041584014892578125, 0.04861259460449219, 0.05564117431640625, 0.06266975402832031, 0.06969833374023438, 0.07672691345214844, 0.0837554931640625, 0.09078407287597656, 0.09781265258789062, 0.10484123229980469, 0.11186981201171875, 0.11889839172363281, 0.12592697143554688, 0.13295555114746094, 0.139984130859375, 0.14701271057128906, 0.15404129028320312, 0.1610698699951172, 0.16809844970703125, 0.1751270294189453, 0.18215560913085938, 0.18918418884277344, 0.1962127685546875, 0.20324134826660156, 0.21026992797851562, 0.2172985076904297, 0.22432708740234375, 0.2313556671142578, 0.23838424682617188, 0.24541282653808594, 0.25244140625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 10.0, 9.0, 4.0, 8.0, 4.0, 13.0, 15.0, 24.0, 613.0, 175.0, 17.0, 13.0, 10.0, 7.0, 8.0, 8.0, 6.0, 6.0, 4.0, 7.0, 4.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01276397705078125, -0.012310385704040527, -0.011856794357299805, -0.011403203010559082, -0.01094961166381836, -0.010496020317077637, -0.010042428970336914, -0.009588837623596191, -0.009135246276855469, -0.008681654930114746, -0.008228063583374023, -0.007774472236633301, -0.007320880889892578, -0.0068672895431518555, -0.006413698196411133, -0.00596010684967041, -0.0055065155029296875, -0.005052924156188965, -0.004599332809448242, -0.0041457414627075195, -0.003692150115966797, -0.0032385587692260742, -0.0027849674224853516, -0.002331376075744629, -0.0018777847290039062, -0.0014241933822631836, -0.0009706020355224609, -0.0005170106887817383, -6.341934204101562e-05, 0.00039017200469970703, 0.0008437633514404297, 0.0012973546981811523, 0.001750946044921875, 0.0022045373916625977, 0.0026581287384033203, 0.003111720085144043, 0.0035653114318847656, 0.004018902778625488, 0.004472494125366211, 0.004926085472106934, 0.005379676818847656, 0.005833268165588379, 0.0062868595123291016, 0.006740450859069824, 0.007194042205810547, 0.0076476335525512695, 0.008101224899291992, 0.008554816246032715, 0.009008407592773438, 0.00946199893951416, 0.009915590286254883, 0.010369181632995605, 0.010822772979736328, 0.01127636432647705, 0.011729955673217773, 0.012183547019958496, 0.012637138366699219, 0.013090729713439941, 0.013544321060180664, 0.013997912406921387, 0.01445150375366211, 0.014905095100402832, 0.015358686447143555, 0.015812277793884277, 0.016265869140625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 4.0, 3.0, 6.0, 9.0, 6.0, 12.0, 17.0, 19.0, 12.0, 28.0, 31.0, 49.0, 62.0, 113.0, 174.0, 394.0, 1131.0, 5581.0, 58051.0, 4104599.0, 19744.0, 2783.0, 719.0, 272.0, 135.0, 64.0, 58.0, 40.0, 28.0, 19.0, 24.0, 10.0, 15.0, 10.0, 8.0, 12.0, 5.0, 9.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.1766357421875, -0.17148590087890625, -0.1663360595703125, -0.16118621826171875, -0.156036376953125, -0.15088653564453125, -0.1457366943359375, -0.14058685302734375, -0.13543701171875, -0.13028717041015625, -0.1251373291015625, -0.11998748779296875, -0.114837646484375, -0.10968780517578125, -0.1045379638671875, -0.09938812255859375, -0.09423828125, -0.08908843994140625, -0.0839385986328125, -0.07878875732421875, -0.073638916015625, -0.06848907470703125, -0.0633392333984375, -0.05818939208984375, -0.05303955078125, -0.04788970947265625, -0.0427398681640625, -0.03759002685546875, -0.032440185546875, -0.02729034423828125, -0.0221405029296875, -0.01699066162109375, -0.0118408203125, -0.00669097900390625, -0.0015411376953125, 0.00360870361328125, 0.008758544921875, 0.01390838623046875, 0.0190582275390625, 0.02420806884765625, 0.02935791015625, 0.03450775146484375, 0.0396575927734375, 0.04480743408203125, 0.049957275390625, 0.05510711669921875, 0.0602569580078125, 0.06540679931640625, 0.070556640625, 0.07570648193359375, 0.0808563232421875, 0.08600616455078125, 0.091156005859375, 0.09630584716796875, 0.1014556884765625, 0.10660552978515625, 0.11175537109375, 0.11690521240234375, 0.1220550537109375, 0.12720489501953125, 0.132354736328125, 0.13750457763671875, 0.1426544189453125, 0.14780426025390625, 0.1529541015625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 9.0, 5.0, 8.0, 12.0, 19.0, 6.0, 19.0, 13.0, 21.0, 22.0, 36.0, 59.0, 3597.0, 30.0, 24.0, 22.0, 17.0, 14.0, 11.0, 13.0, 11.0, 15.0, 4.0, 14.0, 7.0, 7.0, 6.0, 5.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.025299072265625, -0.024561405181884766, -0.02382373809814453, -0.023086071014404297, -0.022348403930664062, -0.021610736846923828, -0.020873069763183594, -0.02013540267944336, -0.019397735595703125, -0.01866006851196289, -0.017922401428222656, -0.017184734344482422, -0.016447067260742188, -0.015709400177001953, -0.014971733093261719, -0.014234066009521484, -0.01349639892578125, -0.012758731842041016, -0.012021064758300781, -0.011283397674560547, -0.010545730590820312, -0.009808063507080078, -0.009070396423339844, -0.00833272933959961, -0.007595062255859375, -0.006857395172119141, -0.006119728088378906, -0.005382061004638672, -0.0046443939208984375, -0.003906726837158203, -0.0031690597534179688, -0.0024313926696777344, -0.0016937255859375, -0.0009560585021972656, -0.00021839141845703125, 0.0005192756652832031, 0.0012569427490234375, 0.001994609832763672, 0.0027322769165039062, 0.0034699440002441406, 0.004207611083984375, 0.004945278167724609, 0.005682945251464844, 0.006420612335205078, 0.0071582794189453125, 0.007895946502685547, 0.008633613586425781, 0.009371280670166016, 0.01010894775390625, 0.010846614837646484, 0.011584281921386719, 0.012321949005126953, 0.013059616088867188, 0.013797283172607422, 0.014534950256347656, 0.01527261734008789, 0.016010284423828125, 0.01674795150756836, 0.017485618591308594, 0.018223285675048828, 0.018960952758789062, 0.019698619842529297, 0.02043628692626953, 0.021173954010009766, 0.02191162109375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1016.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.814591646194458, -1.782610297203064, -1.75062894821167, -1.7186474800109863, -1.6866661310195923, -1.6546847820281982, -1.6227034330368042, -1.5907220840454102, -1.5587407350540161, -1.526759386062622, -1.494778037071228, -1.462796688079834, -1.4308152198791504, -1.3988338708877563, -1.3668525218963623, -1.3348711729049683, -1.3028898239135742, -1.2709084749221802, -1.2389271259307861, -1.2069456577301025, -1.1749643087387085, -1.1429829597473145, -1.1110016107559204, -1.0790202617645264, -1.0470387935638428, -1.0150574445724487, -0.9830760359764099, -0.9510946869850159, -0.9191133379936218, -0.887131929397583, -0.855150580406189, -0.8231692314147949, -0.7911879420280457, -0.7592065930366516, -0.7272251844406128, -0.6952438354492188, -0.6632624864578247, -0.6312811374664307, -0.5992997288703918, -0.5673183798789978, -0.5353370308876038, -0.5033556818962097, -0.4713743031024933, -0.43939292430877686, -0.4074115753173828, -0.3754301965236664, -0.34344881772994995, -0.3114674687385559, -0.2794860601425171, -0.24750469624996185, -0.21552333235740662, -0.18354195356369019, -0.15156058967113495, -0.11957922577857971, -0.08759784698486328, -0.055616483092308044, -0.023635134100914, 0.008346233516931534, 0.04032760113477707, 0.0723089724779129, 0.10429033637046814, 0.13627170026302338, 0.1682530790567398, 0.20023444294929504, 0.23221580684185028]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 8.0, 10.0, 6.0, 18.0, 22.0, 42.0, 67.0, 109.0, 138.0, 171.0, 112.0, 95.0, 73.0, 32.0, 15.0, 12.0, 13.0, 10.0, 5.0, 10.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.13524079322814941, -0.13109557330608368, -0.12695035338401794, -0.1228051483631134, -0.11865992844104767, -0.11451470851898193, -0.1103694960474968, -0.10622428357601166, -0.10207906365394592, -0.09793384373188019, -0.09378863126039505, -0.08964341878890991, -0.08549819886684418, -0.08135297894477844, -0.0772077664732933, -0.07306255400180817, -0.06891733407974243, -0.0647721141576767, -0.06062690168619156, -0.05648168548941612, -0.052336469292640686, -0.04819125309586525, -0.04404603689908981, -0.03990082070231438, -0.03575560450553894, -0.031610388308763504, -0.027465172111988068, -0.02331995591521263, -0.019174739718437195, -0.015029523521661758, -0.010884307324886322, -0.006739091128110886, -0.0025938749313354492, 0.0015513412654399872, 0.005696557462215424, 0.00984177365899086, 0.013986989855766296, 0.018132206052541733, 0.02227742224931717, 0.026422638446092606, 0.030567854642868042, 0.03471307083964348, 0.038858287036418915, 0.04300350323319435, 0.04714871942996979, 0.051293935626745224, 0.05543915182352066, 0.0595843680202961, 0.06372958421707153, 0.06787480413913727, 0.0720200166106224, 0.07616522908210754, 0.08031044900417328, 0.08445566892623901, 0.08860088139772415, 0.09274609386920929, 0.09689131379127502, 0.10103653371334076, 0.1051817461848259, 0.10932695865631104, 0.11347217857837677, 0.1176173985004425, 0.12176261097192764, 0.12590782344341278, 0.13005304336547852]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 5.0, 5.0, 7.0, 10.0, 13.0, 21.0, 17.0, 29.0, 38.0, 38.0, 69.0, 91.0, 121.0, 152.0, 262.0, 322.0, 430.0, 607.0, 945.0, 1301.0, 2051.0, 2925.0, 4724.0, 7996.0, 13771.0, 29600.0, 866889.0, 70211.0, 18750.0, 10110.0, 5828.0, 3669.0, 2255.0, 1568.0, 1073.0, 747.0, 557.0, 372.0, 274.0, 214.0, 135.0, 101.0, 71.0, 58.0, 34.0, 22.0, 17.0, 17.0, 7.0, 10.0, 4.0, 6.0, 2.0, 5.0, 3.0, 1.0, 3.0], "bins": [-0.043182373046875, -0.04190206527709961, -0.04062175750732422, -0.03934144973754883, -0.03806114196777344, -0.03678083419799805, -0.035500526428222656, -0.034220218658447266, -0.032939910888671875, -0.031659603118896484, -0.030379295349121094, -0.029098987579345703, -0.027818679809570312, -0.026538372039794922, -0.02525806427001953, -0.02397775650024414, -0.02269744873046875, -0.02141714096069336, -0.02013683319091797, -0.018856525421142578, -0.017576217651367188, -0.016295909881591797, -0.015015602111816406, -0.013735294342041016, -0.012454986572265625, -0.011174678802490234, -0.009894371032714844, -0.008614063262939453, -0.0073337554931640625, -0.006053447723388672, -0.004773139953613281, -0.0034928321838378906, -0.0022125244140625, -0.0009322166442871094, 0.00034809112548828125, 0.0016283988952636719, 0.0029087066650390625, 0.004189014434814453, 0.005469322204589844, 0.006749629974365234, 0.008029937744140625, 0.009310245513916016, 0.010590553283691406, 0.011870861053466797, 0.013151168823242188, 0.014431476593017578, 0.01571178436279297, 0.01699209213256836, 0.01827239990234375, 0.01955270767211914, 0.02083301544189453, 0.022113323211669922, 0.023393630981445312, 0.024673938751220703, 0.025954246520996094, 0.027234554290771484, 0.028514862060546875, 0.029795169830322266, 0.031075477600097656, 0.03235578536987305, 0.03363609313964844, 0.03491640090942383, 0.03619670867919922, 0.03747701644897461, 0.03875732421875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 2.0, 2.0, 1.0, 3.0, 7.0, 5.0, 10.0, 4.0, 8.0, 9.0, 11.0, 15.0, 25.0, 482.0, 297.0, 24.0, 5.0, 12.0, 7.0, 9.0, 6.0, 8.0, 9.0, 5.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.01279449462890625, -0.01237177848815918, -0.01194906234741211, -0.011526346206665039, -0.011103630065917969, -0.010680913925170898, -0.010258197784423828, -0.009835481643676758, -0.009412765502929688, -0.008990049362182617, -0.008567333221435547, -0.008144617080688477, -0.007721900939941406, -0.007299184799194336, -0.006876468658447266, -0.006453752517700195, -0.006031036376953125, -0.005608320236206055, -0.005185604095458984, -0.004762887954711914, -0.004340171813964844, -0.0039174556732177734, -0.003494739532470703, -0.003072023391723633, -0.0026493072509765625, -0.002226591110229492, -0.0018038749694824219, -0.0013811588287353516, -0.0009584426879882812, -0.0005357265472412109, -0.00011301040649414062, 0.0003097057342529297, 0.000732421875, 0.0011551380157470703, 0.0015778541564941406, 0.002000570297241211, 0.0024232864379882812, 0.0028460025787353516, 0.003268718719482422, 0.003691434860229492, 0.0041141510009765625, 0.004536867141723633, 0.004959583282470703, 0.0053822994232177734, 0.005805015563964844, 0.006227731704711914, 0.006650447845458984, 0.007073163986206055, 0.007495880126953125, 0.007918596267700195, 0.008341312408447266, 0.008764028549194336, 0.009186744689941406, 0.009609460830688477, 0.010032176971435547, 0.010454893112182617, 0.010877609252929688, 0.011300325393676758, 0.011723041534423828, 0.012145757675170898, 0.012568473815917969, 0.012991189956665039, 0.01341390609741211, 0.01383662223815918, 0.01425933837890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 5.0, 6.0, 8.0, 6.0, 9.0, 16.0, 10.0, 19.0, 13.0, 24.0, 39.0, 49.0, 53.0, 50.0, 58.0, 88.0, 116.0, 102.0, 169.0, 198.0, 366.0, 704.0, 3680.0, 90265.0, 927741.0, 21300.0, 1710.0, 523.0, 272.0, 191.0, 124.0, 111.0, 119.0, 76.0, 62.0, 53.0, 48.0, 37.0, 35.0, 21.0, 21.0, 17.0, 14.0, 10.0, 4.0, 7.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08184814453125, -0.0791482925415039, -0.07644844055175781, -0.07374858856201172, -0.07104873657226562, -0.06834888458251953, -0.06564903259277344, -0.06294918060302734, -0.06024932861328125, -0.057549476623535156, -0.05484962463378906, -0.05214977264404297, -0.049449920654296875, -0.04675006866455078, -0.04405021667480469, -0.041350364685058594, -0.0386505126953125, -0.035950660705566406, -0.03325080871582031, -0.03055095672607422, -0.027851104736328125, -0.02515125274658203, -0.022451400756835938, -0.019751548767089844, -0.01705169677734375, -0.014351844787597656, -0.011651992797851562, -0.008952140808105469, -0.006252288818359375, -0.0035524368286132812, -0.0008525848388671875, 0.0018472671508789062, 0.004547119140625, 0.007246971130371094, 0.009946823120117188, 0.012646675109863281, 0.015346527099609375, 0.01804637908935547, 0.020746231079101562, 0.023446083068847656, 0.02614593505859375, 0.028845787048339844, 0.03154563903808594, 0.03424549102783203, 0.036945343017578125, 0.03964519500732422, 0.04234504699707031, 0.045044898986816406, 0.0477447509765625, 0.050444602966308594, 0.05314445495605469, 0.05584430694580078, 0.058544158935546875, 0.06124401092529297, 0.06394386291503906, 0.06664371490478516, 0.06934356689453125, 0.07204341888427734, 0.07474327087402344, 0.07744312286376953, 0.08014297485351562, 0.08284282684326172, 0.08554267883300781, 0.0882425308227539, 0.0909423828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 6.0, 7.0, 5.0, 8.0, 13.0, 6.0, 10.0, 4.0, 11.0, 15.0, 24.0, 21.0, 19.0, 25.0, 22.0, 30.0, 30.0, 41.0, 32.0, 40.0, 44.0, 36.0, 38.0, 44.0, 37.0, 38.0, 44.0, 37.0, 37.0, 38.0, 25.0, 39.0, 15.0, 18.0, 26.0, 24.0, 16.0, 12.0, 14.0, 9.0, 8.0, 10.0, 9.0, 3.0, 4.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03826904296875, -0.03700685501098633, -0.035744667053222656, -0.034482479095458984, -0.03322029113769531, -0.03195810317993164, -0.03069591522216797, -0.029433727264404297, -0.028171539306640625, -0.026909351348876953, -0.02564716339111328, -0.02438497543334961, -0.023122787475585938, -0.021860599517822266, -0.020598411560058594, -0.019336223602294922, -0.01807403564453125, -0.016811847686767578, -0.015549659729003906, -0.014287471771240234, -0.013025283813476562, -0.01176309585571289, -0.010500907897949219, -0.009238719940185547, -0.007976531982421875, -0.006714344024658203, -0.005452156066894531, -0.004189968109130859, -0.0029277801513671875, -0.0016655921936035156, -0.00040340423583984375, 0.0008587837219238281, 0.0021209716796875, 0.003383159637451172, 0.004645347595214844, 0.005907535552978516, 0.0071697235107421875, 0.00843191146850586, 0.009694099426269531, 0.010956287384033203, 0.012218475341796875, 0.013480663299560547, 0.014742851257324219, 0.01600503921508789, 0.017267227172851562, 0.018529415130615234, 0.019791603088378906, 0.021053791046142578, 0.02231597900390625, 0.023578166961669922, 0.024840354919433594, 0.026102542877197266, 0.027364730834960938, 0.02862691879272461, 0.02988910675048828, 0.031151294708251953, 0.032413482666015625, 0.0336756706237793, 0.03493785858154297, 0.03620004653930664, 0.03746223449707031, 0.038724422454833984, 0.039986610412597656, 0.04124879837036133, 0.042510986328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 6.0, 14.0, 23.0, 47.0, 64.0, 165.0, 391.0, 1362.0, 9701.0, 1005077.0, 28689.0, 2099.0, 531.0, 185.0, 73.0, 42.0, 27.0, 12.0, 12.0, 9.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001360177993774414, -0.00013185106217861176, -0.0001276843249797821, -0.00012351758778095245, -0.0001193508505821228, -0.00011518411338329315, -0.0001110173761844635, -0.00010685063898563385, -0.0001026839017868042, -9.851716458797455e-05, -9.43504273891449e-05, -9.018369019031525e-05, -8.60169529914856e-05, -8.185021579265594e-05, -7.76834785938263e-05, -7.351674139499664e-05, -6.935000419616699e-05, -6.518326699733734e-05, -6.101652979850769e-05, -5.684979259967804e-05, -5.268305540084839e-05, -4.851631820201874e-05, -4.434958100318909e-05, -4.0182843804359436e-05, -3.6016106605529785e-05, -3.1849369406700134e-05, -2.7682632207870483e-05, -2.3515895009040833e-05, -1.934915781021118e-05, -1.518242061138153e-05, -1.101568341255188e-05, -6.848946213722229e-06, -2.682209014892578e-06, 1.4845281839370728e-06, 5.651265382766724e-06, 9.818002581596375e-06, 1.3984739780426025e-05, 1.8151476979255676e-05, 2.2318214178085327e-05, 2.6484951376914978e-05, 3.065168857574463e-05, 3.481842577457428e-05, 3.898516297340393e-05, 4.315190017223358e-05, 4.731863737106323e-05, 5.148537456989288e-05, 5.5652111768722534e-05, 5.9818848967552185e-05, 6.398558616638184e-05, 6.815232336521149e-05, 7.231906056404114e-05, 7.648579776287079e-05, 8.065253496170044e-05, 8.481927216053009e-05, 8.898600935935974e-05, 9.315274655818939e-05, 9.731948375701904e-05, 0.0001014862209558487, 0.00010565295815467834, 0.000109819695353508, 0.00011398643255233765, 0.0001181531697511673, 0.00012231990694999695, 0.0001264866441488266, 0.00013065338134765625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 5.0, 5.0, 11.0, 15.0, 12.0, 24.0, 51.0, 65.0, 74.0, 90.0, 138.0, 98.0, 96.0, 80.0, 84.0, 52.0, 24.0, 20.0, 14.0, 18.0, 7.0, 7.0, 0.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0848045349121094e-05, -1.0595656931400299e-05, -1.0343268513679504e-05, -1.009088009595871e-05, -9.838491678237915e-06, -9.58610326051712e-06, -9.333714842796326e-06, -9.081326425075531e-06, -8.828938007354736e-06, -8.576549589633942e-06, -8.324161171913147e-06, -8.071772754192352e-06, -7.819384336471558e-06, -7.566995918750763e-06, -7.314607501029968e-06, -7.062219083309174e-06, -6.809830665588379e-06, -6.557442247867584e-06, -6.3050538301467896e-06, -6.052665412425995e-06, -5.8002769947052e-06, -5.5478885769844055e-06, -5.295500159263611e-06, -5.043111741542816e-06, -4.7907233238220215e-06, -4.538334906101227e-06, -4.285946488380432e-06, -4.0335580706596375e-06, -3.7811696529388428e-06, -3.528781235218048e-06, -3.2763928174972534e-06, -3.0240043997764587e-06, -2.771615982055664e-06, -2.5192275643348694e-06, -2.2668391466140747e-06, -2.01445072889328e-06, -1.7620623111724854e-06, -1.5096738934516907e-06, -1.257285475730896e-06, -1.0048970580101013e-06, -7.525086402893066e-07, -5.00120222568512e-07, -2.477318048477173e-07, 4.6566128730773926e-09, 2.5704503059387207e-07, 5.094334483146667e-07, 7.618218660354614e-07, 1.014210283756256e-06, 1.2665987014770508e-06, 1.5189871191978455e-06, 1.7713755369186401e-06, 2.023763954639435e-06, 2.2761523723602295e-06, 2.528540790081024e-06, 2.780929207801819e-06, 3.0333176255226135e-06, 3.285706043243408e-06, 3.538094460964203e-06, 3.7904828786849976e-06, 4.042871296405792e-06, 4.295259714126587e-06, 4.547648131847382e-06, 4.800036549568176e-06, 5.052424967288971e-06, 5.304813385009766e-06]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 5.0, 13.0, 14.0, 16.0, 11.0, 31.0, 33.0, 45.0, 51.0, 76.0, 101.0, 143.0, 225.0, 321.0, 915.0, 7959.0, 966429.0, 68347.0, 2316.0, 552.0, 267.0, 175.0, 126.0, 81.0, 57.0, 57.0, 34.0, 31.0, 27.0, 18.0, 16.0, 7.0, 7.0, 9.0, 10.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.328655242919922e-05, -5.13661652803421e-05, -4.9445778131484985e-05, -4.752539098262787e-05, -4.560500383377075e-05, -4.3684616684913635e-05, -4.176422953605652e-05, -3.98438423871994e-05, -3.7923455238342285e-05, -3.600306808948517e-05, -3.408268094062805e-05, -3.2162293791770935e-05, -3.024190664291382e-05, -2.83215194940567e-05, -2.6401132345199585e-05, -2.4480745196342468e-05, -2.256035804748535e-05, -2.0639970898628235e-05, -1.8719583749771118e-05, -1.6799196600914e-05, -1.4878809452056885e-05, -1.2958422303199768e-05, -1.1038035154342651e-05, -9.117648005485535e-06, -7.197260856628418e-06, -5.276873707771301e-06, -3.3564865589141846e-06, -1.4360994100570679e-06, 4.842877388000488e-07, 2.4046748876571655e-06, 4.325062036514282e-06, 6.245449185371399e-06, 8.165836334228516e-06, 1.0086223483085632e-05, 1.2006610631942749e-05, 1.3926997780799866e-05, 1.5847384929656982e-05, 1.77677720785141e-05, 1.9688159227371216e-05, 2.1608546376228333e-05, 2.352893352508545e-05, 2.5449320673942566e-05, 2.7369707822799683e-05, 2.92900949716568e-05, 3.1210482120513916e-05, 3.313086926937103e-05, 3.505125641822815e-05, 3.6971643567085266e-05, 3.889203071594238e-05, 4.08124178647995e-05, 4.2732805013656616e-05, 4.465319216251373e-05, 4.657357931137085e-05, 4.8493966460227966e-05, 5.041435360908508e-05, 5.23347407579422e-05, 5.4255127906799316e-05, 5.617551505565643e-05, 5.809590220451355e-05, 6.0016289353370667e-05, 6.193667650222778e-05, 6.38570636510849e-05, 6.577745079994202e-05, 6.769783794879913e-05, 6.961822509765625e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 10.0, 6.0, 5.0, 5.0, 18.0, 12.0, 16.0, 19.0, 23.0, 40.0, 42.0, 41.0, 49.0, 62.0, 65.0, 87.0, 79.0, 64.0, 56.0, 47.0, 44.0, 44.0, 30.0, 20.0, 19.0, 18.0, 9.0, 16.0, 12.0, 9.0, 7.0, 4.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.491474151611328e-05, -2.401694655418396e-05, -2.311915159225464e-05, -2.2221356630325317e-05, -2.1323561668395996e-05, -2.0425766706466675e-05, -1.9527971744537354e-05, -1.8630176782608032e-05, -1.773238182067871e-05, -1.683458685874939e-05, -1.593679189682007e-05, -1.5038996934890747e-05, -1.4141201972961426e-05, -1.3243407011032104e-05, -1.2345612049102783e-05, -1.1447817087173462e-05, -1.055002212524414e-05, -9.65222716331482e-06, -8.754432201385498e-06, -7.856637239456177e-06, -6.9588422775268555e-06, -6.061047315597534e-06, -5.163252353668213e-06, -4.265457391738892e-06, -3.3676624298095703e-06, -2.469867467880249e-06, -1.5720725059509277e-06, -6.742775440216064e-07, 2.2351741790771484e-07, 1.1213123798370361e-06, 2.0191073417663574e-06, 2.9169023036956787e-06, 3.814697265625e-06, 4.712492227554321e-06, 5.610287189483643e-06, 6.508082151412964e-06, 7.405877113342285e-06, 8.303672075271606e-06, 9.201467037200928e-06, 1.0099261999130249e-05, 1.099705696105957e-05, 1.1894851922988892e-05, 1.2792646884918213e-05, 1.3690441846847534e-05, 1.4588236808776855e-05, 1.5486031770706177e-05, 1.6383826732635498e-05, 1.728162169456482e-05, 1.817941665649414e-05, 1.9077211618423462e-05, 1.9975006580352783e-05, 2.0872801542282104e-05, 2.1770596504211426e-05, 2.2668391466140747e-05, 2.356618642807007e-05, 2.446398138999939e-05, 2.536177635192871e-05, 2.6259571313858032e-05, 2.7157366275787354e-05, 2.8055161237716675e-05, 2.8952956199645996e-05, 2.9850751161575317e-05, 3.074854612350464e-05, 3.164634108543396e-05, 3.254413604736328e-05]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 965.0, 37.0, 6.0, 0.0, 1.0], "bins": [-2.155596971511841, -2.1194586753845215, -2.083320379257202, -2.0471818447113037, -2.0110435485839844, -1.974905252456665, -1.9387669563293457, -1.9026286602020264, -1.8664902448654175, -1.8303519487380981, -1.7942135334014893, -1.75807523727417, -1.7219369411468506, -1.6857985258102417, -1.6496602296829224, -1.6135218143463135, -1.5773835182189941, -1.5412452220916748, -1.505106806755066, -1.4689685106277466, -1.4328300952911377, -1.3966917991638184, -1.360553503036499, -1.3244152069091797, -1.2882767915725708, -1.2521384954452515, -1.2160000801086426, -1.1798617839813232, -1.143723487854004, -1.107585072517395, -1.0714467763900757, -1.0353083610534668, -0.9991700053215027, -0.9630316495895386, -0.9268933534622192, -0.8907549977302551, -0.854616641998291, -0.8184782862663269, -0.7823399305343628, -0.7462016344070435, -0.7100632786750793, -0.6739249229431152, -0.6377866268157959, -0.6016482710838318, -0.5655099153518677, -0.5293715596199036, -0.49323323369026184, -0.4570949077606201, -0.420956552028656, -0.3848181962966919, -0.34867987036705017, -0.31254154443740845, -0.27640318870544434, -0.24026484787464142, -0.2041265070438385, -0.16798818111419678, -0.13184982538223267, -0.09571148455142975, -0.05957314372062683, -0.023434802889823914, 0.012703537940979004, 0.04884187877178192, 0.08498021960258484, 0.12111854553222656, 0.15725690126419067]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 2.0, 5.0, 4.0, 13.0, 12.0, 15.0, 21.0, 28.0, 40.0, 50.0, 72.0, 79.0, 107.0, 96.0, 96.0, 82.0, 71.0, 38.0, 45.0, 29.0, 22.0, 13.0, 12.0, 8.0, 6.0, 1.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48047685623168945, -0.4644232988357544, -0.44836974143981934, -0.4323161840438843, -0.4162626266479492, -0.40020906925201416, -0.3841554820537567, -0.36810192465782166, -0.3520483672618866, -0.33599480986595154, -0.3199412524700165, -0.3038876950740814, -0.287834107875824, -0.2717805504798889, -0.25572699308395386, -0.2396734356880188, -0.22361987829208374, -0.20756632089614868, -0.19151276350021362, -0.17545919120311737, -0.1594056338071823, -0.14335207641124725, -0.127298504114151, -0.11124494671821594, -0.09519138932228088, -0.07913783192634583, -0.06308426707983017, -0.04703070595860481, -0.030977144837379456, -0.014923587441444397, 0.0011299774050712585, 0.017183542251586914, 0.0332370400428772, 0.049290601164102554, 0.06534416228532791, 0.08139772713184357, 0.09745128452777863, 0.11350484192371368, 0.12955841422080994, 0.145611971616745, 0.16166552901268005, 0.1777190864086151, 0.19377264380455017, 0.20982621610164642, 0.22587977349758148, 0.24193333089351654, 0.2579869031906128, 0.27404046058654785, 0.2900940179824829, 0.30614757537841797, 0.322201132774353, 0.3382546901702881, 0.35430824756622314, 0.3703618049621582, 0.38641539216041565, 0.4024689495563507, 0.41852250695228577, 0.4345760643482208, 0.4506296217441559, 0.46668317914009094, 0.4827367663383484, 0.49879032373428345, 0.5148438811302185, 0.5308974385261536, 0.5469509959220886]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 8.0, 6.0, 15.0, 12.0, 27.0, 32.0, 51.0, 110.0, 171.0, 312.0, 607.0, 1264.0, 3046.0, 9516.0, 4055298.0, 105873.0, 10079.0, 3851.0, 1783.0, 940.0, 529.0, 278.0, 165.0, 101.0, 62.0, 42.0, 24.0, 23.0, 15.0, 10.0, 9.0, 3.0, 3.0, 6.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.134521484375, -0.1301727294921875, -0.125823974609375, -0.1214752197265625, -0.11712646484375, -0.1127777099609375, -0.108428955078125, -0.1040802001953125, -0.0997314453125, -0.0953826904296875, -0.091033935546875, -0.0866851806640625, -0.08233642578125, -0.0779876708984375, -0.073638916015625, -0.0692901611328125, -0.06494140625, -0.0605926513671875, -0.056243896484375, -0.0518951416015625, -0.04754638671875, -0.0431976318359375, -0.038848876953125, -0.0345001220703125, -0.0301513671875, -0.0258026123046875, -0.021453857421875, -0.0171051025390625, -0.01275634765625, -0.0084075927734375, -0.004058837890625, 0.0002899169921875, 0.004638671875, 0.0089874267578125, 0.013336181640625, 0.0176849365234375, 0.02203369140625, 0.0263824462890625, 0.030731201171875, 0.0350799560546875, 0.0394287109375, 0.0437774658203125, 0.048126220703125, 0.0524749755859375, 0.05682373046875, 0.0611724853515625, 0.065521240234375, 0.0698699951171875, 0.07421875, 0.0785675048828125, 0.082916259765625, 0.0872650146484375, 0.09161376953125, 0.0959625244140625, 0.100311279296875, 0.1046600341796875, 0.1090087890625, 0.1133575439453125, 0.117706298828125, 0.1220550537109375, 0.12640380859375, 0.1307525634765625, 0.135101318359375, 0.1394500732421875, 0.143798828125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 4.0, 8.0, 8.0, 5.0, 12.0, 14.0, 13.0, 61.0, 586.0, 163.0, 17.0, 9.0, 9.0, 11.0, 11.0, 5.0, 8.0, 4.0, 5.0, 4.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01287078857421875, -0.012455344200134277, -0.012039899826049805, -0.011624455451965332, -0.01120901107788086, -0.010793566703796387, -0.010378122329711914, -0.009962677955627441, -0.009547233581542969, -0.009131789207458496, -0.008716344833374023, -0.00830090045928955, -0.007885456085205078, -0.0074700117111206055, -0.007054567337036133, -0.00663912296295166, -0.0062236785888671875, -0.005808234214782715, -0.005392789840698242, -0.0049773454666137695, -0.004561901092529297, -0.004146456718444824, -0.0037310123443603516, -0.003315567970275879, -0.0029001235961914062, -0.0024846792221069336, -0.002069234848022461, -0.0016537904739379883, -0.0012383460998535156, -0.000822901725769043, -0.0004074573516845703, 7.987022399902344e-06, 0.000423431396484375, 0.0008388757705688477, 0.0012543201446533203, 0.001669764518737793, 0.0020852088928222656, 0.0025006532669067383, 0.002916097640991211, 0.0033315420150756836, 0.0037469863891601562, 0.004162430763244629, 0.0045778751373291016, 0.004993319511413574, 0.005408763885498047, 0.0058242082595825195, 0.006239652633666992, 0.006655097007751465, 0.0070705413818359375, 0.00748598575592041, 0.007901430130004883, 0.008316874504089355, 0.008732318878173828, 0.0091477632522583, 0.009563207626342773, 0.009978652000427246, 0.010394096374511719, 0.010809540748596191, 0.011224985122680664, 0.011640429496765137, 0.01205587387084961, 0.012471318244934082, 0.012886762619018555, 0.013302206993103027, 0.0137176513671875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 7.0, 8.0, 15.0, 22.0, 17.0, 35.0, 34.0, 54.0, 80.0, 124.0, 188.0, 349.0, 933.0, 6635.0, 4133695.0, 48788.0, 2022.0, 522.0, 241.0, 146.0, 102.0, 64.0, 50.0, 29.0, 22.0, 14.0, 23.0, 11.0, 9.0, 11.0, 4.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.254638671875, -0.24686241149902344, -0.23908615112304688, -0.2313098907470703, -0.22353363037109375, -0.2157573699951172, -0.20798110961914062, -0.20020484924316406, -0.1924285888671875, -0.18465232849121094, -0.17687606811523438, -0.1690998077392578, -0.16132354736328125, -0.1535472869873047, -0.14577102661132812, -0.13799476623535156, -0.130218505859375, -0.12244224548339844, -0.11466598510742188, -0.10688972473144531, -0.09911346435546875, -0.09133720397949219, -0.08356094360351562, -0.07578468322753906, -0.0680084228515625, -0.06023216247558594, -0.052455902099609375, -0.04467964172363281, -0.03690338134765625, -0.029127120971679688, -0.021350860595703125, -0.013574600219726562, -0.00579833984375, 0.0019779205322265625, 0.009754180908203125, 0.017530441284179688, 0.02530670166015625, 0.03308296203613281, 0.040859222412109375, 0.04863548278808594, 0.0564117431640625, 0.06418800354003906, 0.07196426391601562, 0.07974052429199219, 0.08751678466796875, 0.09529304504394531, 0.10306930541992188, 0.11084556579589844, 0.118621826171875, 0.12639808654785156, 0.13417434692382812, 0.1419506072998047, 0.14972686767578125, 0.1575031280517578, 0.16527938842773438, 0.17305564880371094, 0.1808319091796875, 0.18860816955566406, 0.19638442993164062, 0.2041606903076172, 0.21193695068359375, 0.2197132110595703, 0.22748947143554688, 0.23526573181152344, 0.2430419921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 2.0, 8.0, 4.0, 9.0, 16.0, 18.0, 20.0, 30.0, 32.0, 56.0, 54.0, 71.0, 135.0, 2481.0, 701.0, 117.0, 89.0, 54.0, 36.0, 32.0, 25.0, 18.0, 7.0, 10.0, 10.0, 8.0, 12.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03759765625, -0.036457061767578125, -0.03531646728515625, -0.034175872802734375, -0.0330352783203125, -0.031894683837890625, -0.03075408935546875, -0.029613494873046875, -0.028472900390625, -0.027332305908203125, -0.02619171142578125, -0.025051116943359375, -0.0239105224609375, -0.022769927978515625, -0.02162933349609375, -0.020488739013671875, -0.01934814453125, -0.018207550048828125, -0.01706695556640625, -0.015926361083984375, -0.0147857666015625, -0.013645172119140625, -0.01250457763671875, -0.011363983154296875, -0.010223388671875, -0.009082794189453125, -0.00794219970703125, -0.006801605224609375, -0.0056610107421875, -0.004520416259765625, -0.00337982177734375, -0.002239227294921875, -0.0010986328125, 4.1961669921875e-05, 0.00118255615234375, 0.002323150634765625, 0.0034637451171875, 0.004604339599609375, 0.00574493408203125, 0.006885528564453125, 0.008026123046875, 0.009166717529296875, 0.01030731201171875, 0.011447906494140625, 0.0125885009765625, 0.013729095458984375, 0.01486968994140625, 0.016010284423828125, 0.01715087890625, 0.018291473388671875, 0.01943206787109375, 0.020572662353515625, 0.0217132568359375, 0.022853851318359375, 0.02399444580078125, 0.025135040283203125, 0.026275634765625, 0.027416229248046875, 0.02855682373046875, 0.029697418212890625, 0.0308380126953125, 0.031978607177734375, 0.03311920166015625, 0.034259796142578125, 0.035400390625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 7.0, 98.0, 855.0, 38.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.262847900390625, -0.2575269937515259, -0.25220605731010437, -0.24688513576984406, -0.24156421422958374, -0.23624329268932343, -0.2309223711490631, -0.225601464509964, -0.22028052806854248, -0.21495960652828217, -0.20963868498802185, -0.20431776344776154, -0.19899684190750122, -0.1936759203672409, -0.1883549988269806, -0.18303409218788147, -0.17771317064762115, -0.17239224910736084, -0.16707132756710052, -0.1617504060268402, -0.1564294844865799, -0.15110856294631958, -0.14578765630722046, -0.14046671986579895, -0.13514581322669983, -0.12982489168643951, -0.1245039701461792, -0.11918304860591888, -0.11386212706565857, -0.10854120552539825, -0.10322029143571854, -0.09789936989545822, -0.09257844090461731, -0.087257519364357, -0.08193659782409668, -0.07661567628383636, -0.07129475474357605, -0.06597383320331573, -0.06065291911363602, -0.0553319975733757, -0.05001107603311539, -0.04469015449285507, -0.03936923295259476, -0.03404831513762474, -0.028727393597364426, -0.02340647205710411, -0.018085554242134094, -0.01276463270187378, -0.007443711161613464, -0.002122790552675724, 0.0031981300562620163, 0.008519049733877182, 0.013839971274137497, 0.019160892814397812, 0.02448181062936783, 0.029802732169628143, 0.03512365370988846, 0.04044457525014877, 0.04576549679040909, 0.051086414605379105, 0.05640733614563942, 0.061728257685899734, 0.06704917550086975, 0.07237009704113007, 0.07769101858139038]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 3.0, 5.0, 7.0, 2.0, 8.0, 11.0, 8.0, 11.0, 20.0, 25.0, 42.0, 54.0, 65.0, 99.0, 85.0, 92.0, 99.0, 94.0, 62.0, 53.0, 41.0, 37.0, 19.0, 17.0, 9.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1677730679512024, -0.1625528782606125, -0.15733268857002258, -0.15211249887943268, -0.14689230918884277, -0.14167211949825287, -0.13645192980766296, -0.13123172521591187, -0.12601155042648315, -0.12079136073589325, -0.11557117104530334, -0.11035098135471344, -0.10513079166412354, -0.09991060197353363, -0.09469040483236313, -0.08947021514177322, -0.08425001800060272, -0.07902982831001282, -0.07380963861942291, -0.06858944892883301, -0.0633692592382431, -0.0581490658223629, -0.0529288724064827, -0.04770868271589279, -0.04248849302530289, -0.03726830333471298, -0.03204811364412308, -0.026827920228242874, -0.02160773053765297, -0.016387540847063065, -0.011167347431182861, -0.0059471577405929565, -0.0007269680500030518, 0.004493222571909428, 0.009713413193821907, 0.014933604747056961, 0.020153794437646866, 0.02537398412823677, 0.030594177544116974, 0.03581436723470688, 0.04103455692529678, 0.04625474661588669, 0.05147493630647659, 0.056695129722356796, 0.0619153194129467, 0.0671355128288269, 0.07235570251941681, 0.07757589221000671, 0.08279608190059662, 0.08801627159118652, 0.09323646128177643, 0.09845665097236633, 0.10367684066295624, 0.10889703035354614, 0.11411722749471664, 0.11933741718530655, 0.12455760687589645, 0.12977780401706696, 0.13499799370765686, 0.14021818339824677, 0.14543837308883667, 0.15065856277942657, 0.15587875247001648, 0.16109894216060638, 0.1663191318511963]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 9.0, 9.0, 11.0, 12.0, 30.0, 33.0, 52.0, 63.0, 96.0, 143.0, 166.0, 251.0, 397.0, 527.0, 846.0, 1283.0, 2041.0, 3472.0, 6262.0, 13193.0, 42240.0, 904518.0, 43173.0, 13474.0, 6511.0, 3510.0, 2046.0, 1334.0, 842.0, 585.0, 401.0, 290.0, 201.0, 134.0, 111.0, 80.0, 57.0, 47.0, 28.0, 23.0, 13.0, 16.0, 7.0, 8.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.039581298828125, -0.0382843017578125, -0.0369873046875, -0.0356903076171875, -0.034393310546875, -0.0330963134765625, -0.03179931640625, -0.0305023193359375, -0.029205322265625, -0.0279083251953125, -0.026611328125, -0.0253143310546875, -0.024017333984375, -0.0227203369140625, -0.02142333984375, -0.0201263427734375, -0.018829345703125, -0.0175323486328125, -0.0162353515625, -0.0149383544921875, -0.013641357421875, -0.0123443603515625, -0.01104736328125, -0.0097503662109375, -0.008453369140625, -0.0071563720703125, -0.005859375, -0.0045623779296875, -0.003265380859375, -0.0019683837890625, -0.00067138671875, 0.0006256103515625, 0.001922607421875, 0.0032196044921875, 0.0045166015625, 0.0058135986328125, 0.007110595703125, 0.0084075927734375, 0.00970458984375, 0.0110015869140625, 0.012298583984375, 0.0135955810546875, 0.014892578125, 0.0161895751953125, 0.017486572265625, 0.0187835693359375, 0.02008056640625, 0.0213775634765625, 0.022674560546875, 0.0239715576171875, 0.0252685546875, 0.0265655517578125, 0.027862548828125, 0.0291595458984375, 0.03045654296875, 0.0317535400390625, 0.033050537109375, 0.0343475341796875, 0.03564453125, 0.0369415283203125, 0.038238525390625, 0.0395355224609375, 0.04083251953125, 0.0421295166015625, 0.043426513671875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 5.0, 4.0, 1.0, 7.0, 4.0, 4.0, 10.0, 11.0, 6.0, 13.0, 10.0, 38.0, 259.0, 438.0, 84.0, 14.0, 13.0, 8.0, 9.0, 11.0, 7.0, 6.0, 4.0, 6.0, 4.0, 3.0, 3.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01080322265625, -0.010449647903442383, -0.010096073150634766, -0.009742498397827148, -0.009388923645019531, -0.009035348892211914, -0.008681774139404297, -0.00832819938659668, -0.007974624633789062, -0.007621049880981445, -0.007267475128173828, -0.006913900375366211, -0.006560325622558594, -0.0062067508697509766, -0.005853176116943359, -0.005499601364135742, -0.005146026611328125, -0.004792451858520508, -0.004438877105712891, -0.0040853023529052734, -0.0037317276000976562, -0.003378152847290039, -0.003024578094482422, -0.0026710033416748047, -0.0023174285888671875, -0.0019638538360595703, -0.0016102790832519531, -0.001256704330444336, -0.0009031295776367188, -0.0005495548248291016, -0.00019598007202148438, 0.0001575946807861328, 0.00051116943359375, 0.0008647441864013672, 0.0012183189392089844, 0.0015718936920166016, 0.0019254684448242188, 0.002279043197631836, 0.002632617950439453, 0.0029861927032470703, 0.0033397674560546875, 0.0036933422088623047, 0.004046916961669922, 0.004400491714477539, 0.004754066467285156, 0.0051076412200927734, 0.005461215972900391, 0.005814790725708008, 0.006168365478515625, 0.006521940231323242, 0.006875514984130859, 0.0072290897369384766, 0.007582664489746094, 0.007936239242553711, 0.008289813995361328, 0.008643388748168945, 0.008996963500976562, 0.00935053825378418, 0.009704113006591797, 0.010057687759399414, 0.010411262512207031, 0.010764837265014648, 0.011118412017822266, 0.011471986770629883, 0.0118255615234375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 9.0, 7.0, 10.0, 11.0, 13.0, 21.0, 24.0, 36.0, 34.0, 42.0, 46.0, 66.0, 70.0, 87.0, 97.0, 125.0, 175.0, 254.0, 539.0, 2198.0, 49141.0, 979576.0, 13276.0, 1228.0, 407.0, 223.0, 163.0, 134.0, 110.0, 81.0, 59.0, 57.0, 47.0, 31.0, 31.0, 25.0, 21.0, 19.0, 15.0, 11.0, 13.0, 7.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0966796875, -0.093780517578125, -0.09088134765625, -0.087982177734375, -0.0850830078125, -0.082183837890625, -0.07928466796875, -0.076385498046875, -0.073486328125, -0.070587158203125, -0.06768798828125, -0.064788818359375, -0.0618896484375, -0.058990478515625, -0.05609130859375, -0.053192138671875, -0.05029296875, -0.047393798828125, -0.04449462890625, -0.041595458984375, -0.0386962890625, -0.035797119140625, -0.03289794921875, -0.029998779296875, -0.027099609375, -0.024200439453125, -0.02130126953125, -0.018402099609375, -0.0155029296875, -0.012603759765625, -0.00970458984375, -0.006805419921875, -0.00390625, -0.001007080078125, 0.00189208984375, 0.004791259765625, 0.0076904296875, 0.010589599609375, 0.01348876953125, 0.016387939453125, 0.019287109375, 0.022186279296875, 0.02508544921875, 0.027984619140625, 0.0308837890625, 0.033782958984375, 0.03668212890625, 0.039581298828125, 0.04248046875, 0.045379638671875, 0.04827880859375, 0.051177978515625, 0.0540771484375, 0.056976318359375, 0.05987548828125, 0.062774658203125, 0.065673828125, 0.068572998046875, 0.07147216796875, 0.074371337890625, 0.0772705078125, 0.080169677734375, 0.08306884765625, 0.085968017578125, 0.0888671875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 4.0, 8.0, 5.0, 6.0, 9.0, 12.0, 17.0, 14.0, 24.0, 17.0, 27.0, 28.0, 28.0, 23.0, 27.0, 36.0, 44.0, 48.0, 50.0, 39.0, 56.0, 54.0, 38.0, 41.0, 35.0, 43.0, 44.0, 47.0, 21.0, 23.0, 15.0, 22.0, 14.0, 11.0, 9.0, 8.0, 9.0, 8.0, 7.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0308074951171875, -0.029883384704589844, -0.028959274291992188, -0.02803516387939453, -0.027111053466796875, -0.02618694305419922, -0.025262832641601562, -0.024338722229003906, -0.02341461181640625, -0.022490501403808594, -0.021566390991210938, -0.02064228057861328, -0.019718170166015625, -0.01879405975341797, -0.017869949340820312, -0.016945838928222656, -0.016021728515625, -0.015097618103027344, -0.014173507690429688, -0.013249397277832031, -0.012325286865234375, -0.011401176452636719, -0.010477066040039062, -0.009552955627441406, -0.00862884521484375, -0.007704734802246094, -0.0067806243896484375, -0.005856513977050781, -0.004932403564453125, -0.004008293151855469, -0.0030841827392578125, -0.0021600723266601562, -0.0012359619140625, -0.00031185150146484375, 0.0006122589111328125, 0.0015363693237304688, 0.002460479736328125, 0.0033845901489257812, 0.0043087005615234375, 0.005232810974121094, 0.00615692138671875, 0.007081031799316406, 0.008005142211914062, 0.008929252624511719, 0.009853363037109375, 0.010777473449707031, 0.011701583862304688, 0.012625694274902344, 0.0135498046875, 0.014473915100097656, 0.015398025512695312, 0.01632213592529297, 0.017246246337890625, 0.01817035675048828, 0.019094467163085938, 0.020018577575683594, 0.02094268798828125, 0.021866798400878906, 0.022790908813476562, 0.02371501922607422, 0.024639129638671875, 0.02556324005126953, 0.026487350463867188, 0.027411460876464844, 0.0283355712890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 10.0, 14.0, 23.0, 42.0, 42.0, 57.0, 85.0, 153.0, 200.0, 368.0, 828.0, 2850.0, 51927.0, 981696.0, 7426.0, 1506.0, 490.0, 271.0, 170.0, 107.0, 69.0, 53.0, 39.0, 31.0, 14.0, 14.0, 13.0, 11.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00019669532775878906, -0.00019059516489505768, -0.0001844950020313263, -0.0001783948391675949, -0.00017229467630386353, -0.00016619451344013214, -0.00016009435057640076, -0.00015399418771266937, -0.000147894024848938, -0.0001417938619852066, -0.00013569369912147522, -0.00012959353625774384, -0.00012349337339401245, -0.00011739321053028107, -0.00011129304766654968, -0.0001051928848028183, -9.909272193908691e-05, -9.299255907535553e-05, -8.689239621162415e-05, -8.079223334789276e-05, -7.469207048416138e-05, -6.859190762042999e-05, -6.249174475669861e-05, -5.6391581892967224e-05, -5.029141902923584e-05, -4.4191256165504456e-05, -3.809109330177307e-05, -3.199093043804169e-05, -2.5890767574310303e-05, -1.979060471057892e-05, -1.3690441846847534e-05, -7.59027898311615e-06, -1.4901161193847656e-06, 4.610046744346619e-06, 1.0710209608078003e-05, 1.6810372471809387e-05, 2.291053533554077e-05, 2.9010698199272156e-05, 3.511086106300354e-05, 4.1211023926734924e-05, 4.731118679046631e-05, 5.341134965419769e-05, 5.951151251792908e-05, 6.561167538166046e-05, 7.171183824539185e-05, 7.781200110912323e-05, 8.391216397285461e-05, 9.0012326836586e-05, 9.611248970031738e-05, 0.00010221265256404877, 0.00010831281542778015, 0.00011441297829151154, 0.00012051314115524292, 0.0001266133040189743, 0.0001327134668827057, 0.00013881362974643707, 0.00014491379261016846, 0.00015101395547389984, 0.00015711411833763123, 0.0001632142812013626, 0.000169314444065094, 0.00017541460692882538, 0.00018151476979255676, 0.00018761493265628815, 0.00019371509552001953]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 5.0, 9.0, 10.0, 14.0, 20.0, 33.0, 40.0, 65.0, 85.0, 61.0, 108.0, 81.0, 101.0, 76.0, 79.0, 43.0, 57.0, 23.0, 29.0, 19.0, 8.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.185604095458984e-06, -4.974193871021271e-06, -4.762783646583557e-06, -4.5513734221458435e-06, -4.33996319770813e-06, -4.128552973270416e-06, -3.917142748832703e-06, -3.705732524394989e-06, -3.4943222999572754e-06, -3.2829120755195618e-06, -3.071501851081848e-06, -2.8600916266441345e-06, -2.648681402206421e-06, -2.4372711777687073e-06, -2.2258609533309937e-06, -2.01445072889328e-06, -1.8030405044555664e-06, -1.5916302800178528e-06, -1.3802200555801392e-06, -1.1688098311424255e-06, -9.57399606704712e-07, -7.459893822669983e-07, -5.345791578292847e-07, -3.2316893339157104e-07, -1.1175870895385742e-07, 9.96515154838562e-08, 3.110617399215698e-07, 5.224719643592834e-07, 7.338821887969971e-07, 9.452924132347107e-07, 1.1567026376724243e-06, 1.368112862110138e-06, 1.5795230865478516e-06, 1.7909333109855652e-06, 2.002343535423279e-06, 2.2137537598609924e-06, 2.425163984298706e-06, 2.6365742087364197e-06, 2.8479844331741333e-06, 3.059394657611847e-06, 3.2708048820495605e-06, 3.482215106487274e-06, 3.693625330924988e-06, 3.905035555362701e-06, 4.116445779800415e-06, 4.327856004238129e-06, 4.539266228675842e-06, 4.750676453113556e-06, 4.9620866775512695e-06, 5.173496901988983e-06, 5.384907126426697e-06, 5.59631735086441e-06, 5.807727575302124e-06, 6.019137799739838e-06, 6.230548024177551e-06, 6.441958248615265e-06, 6.6533684730529785e-06, 6.864778697490692e-06, 7.076188921928406e-06, 7.287599146366119e-06, 7.499009370803833e-06, 7.710419595241547e-06, 7.92182981967926e-06, 8.133240044116974e-06, 8.344650268554688e-06]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 13.0, 19.0, 28.0, 27.0, 52.0, 94.0, 158.0, 367.0, 1885.0, 1031367.0, 13345.0, 654.0, 238.0, 107.0, 57.0, 43.0, 31.0, 26.0, 5.0, 9.0, 11.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002770423889160156, -0.0002666749060153961, -0.0002563074231147766, -0.0002459399402141571, -0.0002355724573135376, -0.0002252049744129181, -0.00021483749151229858, -0.00020447000861167908, -0.00019410252571105957, -0.00018373504281044006, -0.00017336755990982056, -0.00016300007700920105, -0.00015263259410858154, -0.00014226511120796204, -0.00013189762830734253, -0.00012153014540672302, -0.00011116266250610352, -0.00010079517960548401, -9.04276967048645e-05, -8.0060213804245e-05, -6.969273090362549e-05, -5.932524800300598e-05, -4.8957765102386475e-05, -3.859028220176697e-05, -2.822279930114746e-05, -1.7855316400527954e-05, -7.487833499908447e-06, 2.8796494007110596e-06, 1.3247132301330566e-05, 2.3614615201950073e-05, 3.398209810256958e-05, 4.434958100318909e-05, 5.4717063903808594e-05, 6.50845468044281e-05, 7.545202970504761e-05, 8.581951260566711e-05, 9.618699550628662e-05, 0.00010655447840690613, 0.00011692196130752563, 0.00012728944420814514, 0.00013765692710876465, 0.00014802441000938416, 0.00015839189291000366, 0.00016875937581062317, 0.00017912685871124268, 0.00018949434161186218, 0.0001998618245124817, 0.0002102293074131012, 0.0002205967903137207, 0.0002309642732143402, 0.00024133175611495972, 0.0002516992390155792, 0.00026206672191619873, 0.00027243420481681824, 0.00028280168771743774, 0.00029316917061805725, 0.00030353665351867676, 0.00031390413641929626, 0.00032427161931991577, 0.0003346391022205353, 0.0003450065851211548, 0.0003553740680217743, 0.0003657415509223938, 0.0003761090338230133, 0.0003864765167236328]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 11.0, 3.0, 11.0, 11.0, 12.0, 36.0, 35.0, 62.0, 106.0, 131.0, 165.0, 153.0, 94.0, 54.0, 40.0, 22.0, 18.0, 9.0, 11.0, 5.0, 4.0, 5.0, 7.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.641315460205078e-05, -7.329508662223816e-05, -7.017701864242554e-05, -6.705895066261292e-05, -6.394088268280029e-05, -6.082281470298767e-05, -5.770474672317505e-05, -5.458667874336243e-05, -5.1468610763549805e-05, -4.835054278373718e-05, -4.523247480392456e-05, -4.211440682411194e-05, -3.8996338844299316e-05, -3.5878270864486694e-05, -3.276020288467407e-05, -2.964213490486145e-05, -2.6524066925048828e-05, -2.3405998945236206e-05, -2.0287930965423584e-05, -1.7169862985610962e-05, -1.405179500579834e-05, -1.0933727025985718e-05, -7.815659046173096e-06, -4.697591066360474e-06, -1.5795230865478516e-06, 1.5385448932647705e-06, 4.656612873077393e-06, 7.774680852890015e-06, 1.0892748832702637e-05, 1.4010816812515259e-05, 1.712888479232788e-05, 2.0246952772140503e-05, 2.3365020751953125e-05, 2.6483088731765747e-05, 2.960115671157837e-05, 3.271922469139099e-05, 3.583729267120361e-05, 3.8955360651016235e-05, 4.207342863082886e-05, 4.519149661064148e-05, 4.83095645904541e-05, 5.1427632570266724e-05, 5.4545700550079346e-05, 5.766376852989197e-05, 6.078183650970459e-05, 6.389990448951721e-05, 6.701797246932983e-05, 7.013604044914246e-05, 7.325410842895508e-05, 7.63721764087677e-05, 7.949024438858032e-05, 8.260831236839294e-05, 8.572638034820557e-05, 8.884444832801819e-05, 9.196251630783081e-05, 9.508058428764343e-05, 9.819865226745605e-05, 0.00010131672024726868, 0.0001044347882270813, 0.00010755285620689392, 0.00011067092418670654, 0.00011378899216651917, 0.00011690706014633179, 0.00012002512812614441, 0.00012314319610595703]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 977.0, 35.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.464580774307251, -1.4350593090057373, -1.4055379629135132, -1.3760164976119995, -1.3464950323104858, -1.3169736862182617, -1.287452220916748, -1.2579307556152344, -1.2284094095230103, -1.1988879442214966, -1.1693665981292725, -1.1398451328277588, -1.1103236675262451, -1.080802321434021, -1.0512808561325073, -1.0217595100402832, -0.9922380447387695, -0.9627166390419006, -0.933195173740387, -0.9036737680435181, -0.8741523623466492, -0.8446309566497803, -0.8151094913482666, -0.7855880856513977, -0.756066620349884, -0.7265452146530151, -0.6970237493515015, -0.6675023436546326, -0.6379809379577637, -0.60845947265625, -0.5789380669593811, -0.5494166612625122, -0.5198952555656433, -0.490373820066452, -0.46085241436958313, -0.43133097887039185, -0.40180957317352295, -0.37228813767433167, -0.3427667021751404, -0.3132452964782715, -0.2837238907814026, -0.2542024552822113, -0.2246810495853424, -0.19515961408615112, -0.16563820838928223, -0.13611677289009094, -0.10659535229206085, -0.07707393169403076, -0.04755249619483948, -0.018031073734164238, 0.011490348726511002, 0.04101177304983139, 0.07053319364786148, 0.10005462169647217, 0.12957604229450226, 0.15909746289253235, 0.18861888349056244, 0.21814030408859253, 0.24766172468662262, 0.2771831452846527, 0.306704580783844, 0.3362259864807129, 0.3657474219799042, 0.39526885747909546, 0.42479026317596436]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 7.0, 4.0, 11.0, 11.0, 17.0, 19.0, 35.0, 31.0, 48.0, 44.0, 60.0, 69.0, 69.0, 67.0, 59.0, 77.0, 66.0, 65.0, 51.0, 43.0, 25.0, 37.0, 20.0, 17.0, 21.0, 10.0, 8.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.42555153369903564, -0.4158328175544739, -0.4061141014099121, -0.39639535546302795, -0.3866766393184662, -0.3769579231739044, -0.36723917722702026, -0.3575204610824585, -0.34780174493789673, -0.33808302879333496, -0.3283643126487732, -0.31864556670188904, -0.30892685055732727, -0.2992081344127655, -0.28948938846588135, -0.2797706723213196, -0.2700519561767578, -0.26033324003219604, -0.2506145238876343, -0.24089577794075012, -0.23117706179618835, -0.2214583456516266, -0.21173961460590363, -0.20202088356018066, -0.1923021674156189, -0.18258345127105713, -0.17286472022533417, -0.1631459891796112, -0.15342727303504944, -0.14370855689048767, -0.1339898258447647, -0.12427110224962234, -0.11455237865447998, -0.10483365505933762, -0.09511493146419525, -0.08539620786905289, -0.07567748427391052, -0.06595876067876816, -0.05624003708362579, -0.04652131348848343, -0.036802589893341064, -0.0270838662981987, -0.017365142703056335, -0.007646419107913971, 0.0020723044872283936, 0.011791028082370758, 0.021509751677513123, 0.031228475272655487, 0.04094719886779785, 0.050665922462940216, 0.06038464605808258, 0.07010336965322495, 0.07982209324836731, 0.08954081684350967, 0.09925954043865204, 0.1089782640337944, 0.11869698762893677, 0.12841570377349854, 0.1381344348192215, 0.14785316586494446, 0.15757188200950623, 0.167290598154068, 0.17700932919979095, 0.18672806024551392, 0.19644677639007568]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 5.0, 3.0, 6.0, 11.0, 8.0, 8.0, 23.0, 31.0, 59.0, 109.0, 273.0, 839.0, 4639.0, 4180180.0, 5912.0, 1271.0, 457.0, 189.0, 95.0, 52.0, 28.0, 18.0, 9.0, 13.0, 6.0, 9.0, 2.0, 6.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.156494140625, -0.1513671875, -0.146240234375, -0.14111328125, -0.135986328125, -0.130859375, -0.125732421875, -0.12060546875, -0.115478515625, -0.1103515625, -0.105224609375, -0.10009765625, -0.094970703125, -0.08984375, -0.084716796875, -0.07958984375, -0.074462890625, -0.0693359375, -0.064208984375, -0.05908203125, -0.053955078125, -0.048828125, -0.043701171875, -0.03857421875, -0.033447265625, -0.0283203125, -0.023193359375, -0.01806640625, -0.012939453125, -0.0078125, -0.002685546875, 0.00244140625, 0.007568359375, 0.0126953125, 0.017822265625, 0.02294921875, 0.028076171875, 0.033203125, 0.038330078125, 0.04345703125, 0.048583984375, 0.0537109375, 0.058837890625, 0.06396484375, 0.069091796875, 0.07421875, 0.079345703125, 0.08447265625, 0.089599609375, 0.0947265625, 0.099853515625, 0.10498046875, 0.110107421875, 0.115234375, 0.120361328125, 0.12548828125, 0.130615234375, 0.1357421875, 0.140869140625, 0.14599609375, 0.151123046875, 0.15625, 0.161376953125, 0.16650390625, 0.171630859375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 9.0, 4.0, 3.0, 13.0, 9.0, 7.0, 10.0, 11.0, 50.0, 282.0, 383.0, 98.0, 19.0, 12.0, 8.0, 10.0, 10.0, 8.0, 4.0, 4.0, 6.0, 4.0, 5.0, 2.0, 3.0, 7.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01043701171875, -0.01009523868560791, -0.00975346565246582, -0.00941169261932373, -0.00906991958618164, -0.00872814655303955, -0.008386373519897461, -0.008044600486755371, -0.007702827453613281, -0.007361054420471191, -0.0070192813873291016, -0.006677508354187012, -0.006335735321044922, -0.005993962287902832, -0.005652189254760742, -0.005310416221618652, -0.0049686431884765625, -0.004626870155334473, -0.004285097122192383, -0.003943324089050293, -0.003601551055908203, -0.0032597780227661133, -0.0029180049896240234, -0.0025762319564819336, -0.0022344589233398438, -0.001892685890197754, -0.001550912857055664, -0.0012091398239135742, -0.0008673667907714844, -0.0005255937576293945, -0.0001838207244873047, 0.00015795230865478516, 0.000499725341796875, 0.0008414983749389648, 0.0011832714080810547, 0.0015250444412231445, 0.0018668174743652344, 0.0022085905075073242, 0.002550363540649414, 0.002892136573791504, 0.0032339096069335938, 0.0035756826400756836, 0.0039174556732177734, 0.004259228706359863, 0.004601001739501953, 0.004942774772644043, 0.005284547805786133, 0.005626320838928223, 0.0059680938720703125, 0.006309866905212402, 0.006651639938354492, 0.006993412971496582, 0.007335186004638672, 0.007676959037780762, 0.008018732070922852, 0.008360505104064941, 0.008702278137207031, 0.009044051170349121, 0.009385824203491211, 0.0097275972366333, 0.01006937026977539, 0.01041114330291748, 0.01075291633605957, 0.01109468936920166, 0.01143646240234375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 3.0, 2.0, 13.0, 8.0, 11.0, 6.0, 18.0, 21.0, 23.0, 43.0, 51.0, 71.0, 96.0, 152.0, 421.0, 2049.0, 4070474.0, 118211.0, 1677.0, 421.0, 149.0, 102.0, 63.0, 47.0, 34.0, 26.0, 18.0, 15.0, 8.0, 13.0, 9.0, 8.0, 4.0, 2.0, 1.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.121826171875, -0.11730384826660156, -0.11278152465820312, -0.10825920104980469, -0.10373687744140625, -0.09921455383300781, -0.09469223022460938, -0.09016990661621094, -0.0856475830078125, -0.08112525939941406, -0.07660293579101562, -0.07208061218261719, -0.06755828857421875, -0.06303596496582031, -0.058513641357421875, -0.05399131774902344, -0.049468994140625, -0.04494667053222656, -0.040424346923828125, -0.03590202331542969, -0.03137969970703125, -0.026857376098632812, -0.022335052490234375, -0.017812728881835938, -0.0132904052734375, -0.008768081665039062, -0.004245758056640625, 0.0002765655517578125, 0.00479888916015625, 0.009321212768554688, 0.013843536376953125, 0.018365859985351562, 0.02288818359375, 0.027410507202148438, 0.031932830810546875, 0.03645515441894531, 0.04097747802734375, 0.04549980163574219, 0.050022125244140625, 0.05454444885253906, 0.0590667724609375, 0.06358909606933594, 0.06811141967773438, 0.07263374328613281, 0.07715606689453125, 0.08167839050292969, 0.08620071411132812, 0.09072303771972656, 0.095245361328125, 0.09976768493652344, 0.10429000854492188, 0.10881233215332031, 0.11333465576171875, 0.11785697937011719, 0.12237930297851562, 0.12690162658691406, 0.1314239501953125, 0.13594627380371094, 0.14046859741210938, 0.1449909210205078, 0.14951324462890625, 0.1540355682373047, 0.15855789184570312, 0.16308021545410156, 0.1676025390625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 9.0, 9.0, 10.0, 14.0, 21.0, 14.0, 14.0, 36.0, 58.0, 132.0, 3195.0, 327.0, 65.0, 39.0, 21.0, 19.0, 16.0, 12.0, 7.0, 8.0, 6.0, 4.0, 5.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.017974853515625, -0.017302513122558594, -0.016630172729492188, -0.01595783233642578, -0.015285491943359375, -0.014613151550292969, -0.013940811157226562, -0.013268470764160156, -0.01259613037109375, -0.011923789978027344, -0.011251449584960938, -0.010579109191894531, -0.009906768798828125, -0.009234428405761719, -0.008562088012695312, -0.007889747619628906, -0.0072174072265625, -0.006545066833496094, -0.0058727264404296875, -0.005200386047363281, -0.004528045654296875, -0.0038557052612304688, -0.0031833648681640625, -0.0025110244750976562, -0.00183868408203125, -0.0011663436889648438, -0.0004940032958984375, 0.00017833709716796875, 0.000850677490234375, 0.0015230178833007812, 0.0021953582763671875, 0.0028676986694335938, 0.0035400390625, 0.004212379455566406, 0.0048847198486328125, 0.005557060241699219, 0.006229400634765625, 0.006901741027832031, 0.0075740814208984375, 0.008246421813964844, 0.00891876220703125, 0.009591102600097656, 0.010263442993164062, 0.010935783386230469, 0.011608123779296875, 0.012280464172363281, 0.012952804565429688, 0.013625144958496094, 0.0142974853515625, 0.014969825744628906, 0.015642166137695312, 0.01631450653076172, 0.016986846923828125, 0.01765918731689453, 0.018331527709960938, 0.019003868103027344, 0.01967620849609375, 0.020348548889160156, 0.021020889282226562, 0.02169322967529297, 0.022365570068359375, 0.02303791046142578, 0.023710250854492188, 0.024382591247558594, 0.025054931640625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 996.0, 14.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16822035610675812, -0.15810665488243103, -0.14799295365810394, -0.13787925243377686, -0.12776553630828857, -0.11765184253454208, -0.1075381338596344, -0.09742443263530731, -0.08731073141098022, -0.07719703018665314, -0.06708332896232605, -0.056969620287418365, -0.04685591906309128, -0.03674221783876419, -0.026628512889146805, -0.01651480793952942, -0.0064011067152023315, 0.003712596371769905, 0.013826299458742142, 0.02394000254571438, 0.034053705632686615, 0.0441674068570137, 0.05428111180663109, 0.06439481675624847, 0.07450851798057556, 0.08462221920490265, 0.09473592042922974, 0.10484962910413742, 0.11496333032846451, 0.1250770390033722, 0.13519074022769928, 0.14530444145202637, 0.15541812777519226, 0.16553182899951935, 0.17564553022384644, 0.18575923144817352, 0.1958729326725006, 0.2059866487979889, 0.21610035002231598, 0.22621405124664307, 0.23632775247097015, 0.24644145369529724, 0.2565551698207855, 0.2666688561439514, 0.2767825722694397, 0.2868962585926056, 0.29700997471809387, 0.30712366104125977, 0.31723737716674805, 0.32735109329223633, 0.3374647796154022, 0.3475784957408905, 0.3576921820640564, 0.3678058981895447, 0.37791958451271057, 0.38803330063819885, 0.39814698696136475, 0.408260703086853, 0.4183743894100189, 0.4284881055355072, 0.4386017918586731, 0.4487155079841614, 0.45882919430732727, 0.46894291043281555, 0.47905662655830383]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 5.0, 5.0, 6.0, 9.0, 10.0, 10.0, 16.0, 26.0, 27.0, 19.0, 35.0, 46.0, 50.0, 68.0, 45.0, 60.0, 67.0, 54.0, 59.0, 55.0, 61.0, 52.0, 29.0, 37.0, 27.0, 27.0, 29.0, 10.0, 14.0, 11.0, 10.0, 4.0, 3.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0648425817489624, -0.06285306811332703, -0.06086354702711105, -0.05887402966618538, -0.056884512305259705, -0.05489499494433403, -0.052905477583408356, -0.05091596022248268, -0.04892644286155701, -0.04693692550063133, -0.04494740813970566, -0.042957890778779984, -0.04096837341785431, -0.038978856056928635, -0.03698933869600296, -0.034999821335077286, -0.03301030397415161, -0.031020786613225937, -0.029031269252300262, -0.027041751891374588, -0.025052234530448914, -0.02306271716952324, -0.021073199808597565, -0.01908368244767189, -0.017094165086746216, -0.015104647725820541, -0.013115130364894867, -0.011125613003969193, -0.009136095643043518, -0.007146578282117844, -0.005157060921192169, -0.0031675435602664948, -0.0011780261993408203, 0.0008114911615848541, 0.0028010085225105286, 0.004790525883436203, 0.0067800432443618774, 0.008769560605287552, 0.010759077966213226, 0.0127485953271389, 0.014738112688064575, 0.01672763004899025, 0.018717147409915924, 0.0207066647708416, 0.022696182131767273, 0.024685699492692947, 0.026675216853618622, 0.028664734214544296, 0.03065425157546997, 0.032643768936395645, 0.03463328629732132, 0.036622803658246994, 0.03861232101917267, 0.04060183838009834, 0.04259135574102402, 0.04458087310194969, 0.046570390462875366, 0.04855990782380104, 0.050549425184726715, 0.05253894254565239, 0.054528459906578064, 0.05651797726750374, 0.05850749462842941, 0.06049701198935509, 0.06248652935028076]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 12.0, 13.0, 28.0, 41.0, 45.0, 86.0, 100.0, 183.0, 251.0, 384.0, 633.0, 1037.0, 1693.0, 2928.0, 5493.0, 11463.0, 30096.0, 875360.0, 83938.0, 17357.0, 7603.0, 4057.0, 2208.0, 1287.0, 787.0, 506.0, 315.0, 224.0, 134.0, 93.0, 61.0, 40.0, 27.0, 20.0, 11.0, 9.0, 7.0, 3.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03668212890625, -0.035594940185546875, -0.03450775146484375, -0.033420562744140625, -0.0323333740234375, -0.031246185302734375, -0.03015899658203125, -0.029071807861328125, -0.027984619140625, -0.026897430419921875, -0.02581024169921875, -0.024723052978515625, -0.0236358642578125, -0.022548675537109375, -0.02146148681640625, -0.020374298095703125, -0.019287109375, -0.018199920654296875, -0.01711273193359375, -0.016025543212890625, -0.0149383544921875, -0.013851165771484375, -0.01276397705078125, -0.011676788330078125, -0.010589599609375, -0.009502410888671875, -0.00841522216796875, -0.007328033447265625, -0.0062408447265625, -0.005153656005859375, -0.00406646728515625, -0.002979278564453125, -0.00189208984375, -0.000804901123046875, 0.00028228759765625, 0.001369476318359375, 0.0024566650390625, 0.003543853759765625, 0.00463104248046875, 0.005718231201171875, 0.006805419921875, 0.007892608642578125, 0.00897979736328125, 0.010066986083984375, 0.0111541748046875, 0.012241363525390625, 0.01332855224609375, 0.014415740966796875, 0.0155029296875, 0.016590118408203125, 0.01767730712890625, 0.018764495849609375, 0.0198516845703125, 0.020938873291015625, 0.02202606201171875, 0.023113250732421875, 0.024200439453125, 0.025287628173828125, 0.02637481689453125, 0.027462005615234375, 0.0285491943359375, 0.029636383056640625, 0.03072357177734375, 0.031810760498046875, 0.03289794921875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 5.0, 7.0, 3.0, 8.0, 8.0, 12.0, 9.0, 8.0, 18.0, 92.0, 354.0, 295.0, 67.0, 18.0, 7.0, 7.0, 15.0, 10.0, 5.0, 6.0, 3.0, 5.0, 5.0, 4.0, 2.0, 3.0, 7.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0098876953125, -0.00956106185913086, -0.009234428405761719, -0.008907794952392578, -0.008581161499023438, -0.008254528045654297, -0.007927894592285156, -0.007601261138916016, -0.007274627685546875, -0.006947994232177734, -0.006621360778808594, -0.006294727325439453, -0.0059680938720703125, -0.005641460418701172, -0.005314826965332031, -0.004988193511962891, -0.00466156005859375, -0.004334926605224609, -0.004008293151855469, -0.003681659698486328, -0.0033550262451171875, -0.003028392791748047, -0.0027017593383789062, -0.0023751258850097656, -0.002048492431640625, -0.0017218589782714844, -0.0013952255249023438, -0.0010685920715332031, -0.0007419586181640625, -0.0004153251647949219, -8.869171142578125e-05, 0.00023794174194335938, 0.0005645751953125, 0.0008912086486816406, 0.0012178421020507812, 0.0015444755554199219, 0.0018711090087890625, 0.002197742462158203, 0.0025243759155273438, 0.0028510093688964844, 0.003177642822265625, 0.0035042762756347656, 0.0038309097290039062, 0.004157543182373047, 0.0044841766357421875, 0.004810810089111328, 0.005137443542480469, 0.005464076995849609, 0.00579071044921875, 0.006117343902587891, 0.006443977355957031, 0.006770610809326172, 0.0070972442626953125, 0.007423877716064453, 0.007750511169433594, 0.008077144622802734, 0.008403778076171875, 0.008730411529541016, 0.009057044982910156, 0.009383678436279297, 0.009710311889648438, 0.010036945343017578, 0.010363578796386719, 0.01069021224975586, 0.011016845703125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 8.0, 11.0, 7.0, 11.0, 14.0, 21.0, 27.0, 25.0, 33.0, 37.0, 39.0, 55.0, 69.0, 69.0, 98.0, 104.0, 121.0, 190.0, 288.0, 488.0, 1301.0, 9873.0, 942326.0, 88509.0, 2662.0, 732.0, 357.0, 220.0, 160.0, 127.0, 103.0, 70.0, 76.0, 52.0, 59.0, 50.0, 41.0, 29.0, 22.0, 19.0, 10.0, 12.0, 15.0, 8.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0859375, -0.08339118957519531, -0.08084487915039062, -0.07829856872558594, -0.07575225830078125, -0.07320594787597656, -0.07065963745117188, -0.06811332702636719, -0.0655670166015625, -0.06302070617675781, -0.060474395751953125, -0.05792808532714844, -0.05538177490234375, -0.05283546447753906, -0.050289154052734375, -0.04774284362792969, -0.045196533203125, -0.04265022277832031, -0.040103912353515625, -0.03755760192871094, -0.03501129150390625, -0.03246498107910156, -0.029918670654296875, -0.027372360229492188, -0.0248260498046875, -0.022279739379882812, -0.019733428955078125, -0.017187118530273438, -0.01464080810546875, -0.012094497680664062, -0.009548187255859375, -0.0070018768310546875, -0.00445556640625, -0.0019092559814453125, 0.000637054443359375, 0.0031833648681640625, 0.00572967529296875, 0.008275985717773438, 0.010822296142578125, 0.013368606567382812, 0.0159149169921875, 0.018461227416992188, 0.021007537841796875, 0.023553848266601562, 0.02610015869140625, 0.028646469116210938, 0.031192779541015625, 0.03373908996582031, 0.036285400390625, 0.03883171081542969, 0.041378021240234375, 0.04392433166503906, 0.04647064208984375, 0.04901695251464844, 0.051563262939453125, 0.05410957336425781, 0.0566558837890625, 0.05920219421386719, 0.061748504638671875, 0.06429481506347656, 0.06684112548828125, 0.06938743591308594, 0.07193374633789062, 0.07448005676269531, 0.0770263671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 4.0, 1.0, 5.0, 4.0, 10.0, 8.0, 8.0, 12.0, 14.0, 9.0, 15.0, 17.0, 15.0, 35.0, 23.0, 31.0, 26.0, 31.0, 33.0, 38.0, 46.0, 27.0, 61.0, 48.0, 57.0, 47.0, 45.0, 39.0, 41.0, 42.0, 30.0, 28.0, 20.0, 24.0, 18.0, 17.0, 20.0, 17.0, 8.0, 6.0, 5.0, 7.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.03399658203125, -0.03305482864379883, -0.032113075256347656, -0.031171321868896484, -0.030229568481445312, -0.02928781509399414, -0.02834606170654297, -0.027404308319091797, -0.026462554931640625, -0.025520801544189453, -0.02457904815673828, -0.02363729476928711, -0.022695541381835938, -0.021753787994384766, -0.020812034606933594, -0.019870281219482422, -0.01892852783203125, -0.017986774444580078, -0.017045021057128906, -0.016103267669677734, -0.015161514282226562, -0.01421976089477539, -0.013278007507324219, -0.012336254119873047, -0.011394500732421875, -0.010452747344970703, -0.009510993957519531, -0.00856924057006836, -0.0076274871826171875, -0.006685733795166016, -0.005743980407714844, -0.004802227020263672, -0.0038604736328125, -0.002918720245361328, -0.0019769668579101562, -0.0010352134704589844, -9.34600830078125e-05, 0.0008482933044433594, 0.0017900466918945312, 0.002731800079345703, 0.003673553466796875, 0.004615306854248047, 0.005557060241699219, 0.006498813629150391, 0.0074405670166015625, 0.008382320404052734, 0.009324073791503906, 0.010265827178955078, 0.01120758056640625, 0.012149333953857422, 0.013091087341308594, 0.014032840728759766, 0.014974594116210938, 0.01591634750366211, 0.01685810089111328, 0.017799854278564453, 0.018741607666015625, 0.019683361053466797, 0.02062511444091797, 0.02156686782836914, 0.022508621215820312, 0.023450374603271484, 0.024392127990722656, 0.025333881378173828, 0.026275634765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 7.0, 2.0, 3.0, 3.0, 16.0, 17.0, 22.0, 33.0, 39.0, 78.0, 106.0, 204.0, 460.0, 1008.0, 3883.0, 218102.0, 817524.0, 4806.0, 1170.0, 462.0, 226.0, 130.0, 88.0, 43.0, 35.0, 23.0, 26.0, 9.0, 13.0, 9.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00015401840209960938, -0.00014974642544984818, -0.00014547444880008698, -0.00014120247215032578, -0.00013693049550056458, -0.00013265851885080338, -0.00012838654220104218, -0.00012411456555128098, -0.00011984258890151978, -0.00011557061225175858, -0.00011129863560199738, -0.00010702665895223618, -0.00010275468230247498, -9.848270565271378e-05, -9.421072900295258e-05, -8.993875235319138e-05, -8.566677570343018e-05, -8.139479905366898e-05, -7.712282240390778e-05, -7.285084575414658e-05, -6.857886910438538e-05, -6.430689245462418e-05, -6.0034915804862976e-05, -5.5762939155101776e-05, -5.1490962505340576e-05, -4.7218985855579376e-05, -4.2947009205818176e-05, -3.8675032556056976e-05, -3.4403055906295776e-05, -3.0131079256534576e-05, -2.5859102606773376e-05, -2.1587125957012177e-05, -1.7315149307250977e-05, -1.3043172657489777e-05, -8.771196007728577e-06, -4.499219357967377e-06, -2.2724270820617676e-07, 4.044733941555023e-06, 8.316710591316223e-06, 1.2588687241077423e-05, 1.6860663890838623e-05, 2.1132640540599823e-05, 2.5404617190361023e-05, 2.9676593840122223e-05, 3.394857048988342e-05, 3.822054713964462e-05, 4.249252378940582e-05, 4.676450043916702e-05, 5.103647708892822e-05, 5.530845373868942e-05, 5.958043038845062e-05, 6.385240703821182e-05, 6.812438368797302e-05, 7.239636033773422e-05, 7.666833698749542e-05, 8.094031363725662e-05, 8.521229028701782e-05, 8.948426693677902e-05, 9.375624358654022e-05, 9.802822023630142e-05, 0.00010230019688606262, 0.00010657217353582382, 0.00011084415018558502, 0.00011511612683534622, 0.00011938810348510742]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 4.0, 6.0, 7.0, 5.0, 11.0, 11.0, 29.0, 22.0, 21.0, 35.0, 41.0, 43.0, 42.0, 68.0, 63.0, 67.0, 74.0, 80.0, 75.0, 54.0, 47.0, 22.0, 36.0, 29.0, 18.0, 21.0, 14.0, 11.0, 10.0, 12.0, 6.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.874301910400391e-06, -3.702007234096527e-06, -3.5297125577926636e-06, -3.3574178814888e-06, -3.1851232051849365e-06, -3.012828528881073e-06, -2.8405338525772095e-06, -2.668239176273346e-06, -2.4959444999694824e-06, -2.323649823665619e-06, -2.1513551473617554e-06, -1.979060471057892e-06, -1.8067657947540283e-06, -1.6344711184501648e-06, -1.4621764421463013e-06, -1.2898817658424377e-06, -1.1175870895385742e-06, -9.452924132347107e-07, -7.729977369308472e-07, -6.007030606269836e-07, -4.284083843231201e-07, -2.561137080192566e-07, -8.381903171539307e-08, 8.847564458847046e-08, 2.60770320892334e-07, 4.330649971961975e-07, 6.05359673500061e-07, 7.776543498039246e-07, 9.499490261077881e-07, 1.1222437024116516e-06, 1.2945383787155151e-06, 1.4668330550193787e-06, 1.6391277313232422e-06, 1.8114224076271057e-06, 1.9837170839309692e-06, 2.1560117602348328e-06, 2.3283064365386963e-06, 2.50060111284256e-06, 2.6728957891464233e-06, 2.845190465450287e-06, 3.0174851417541504e-06, 3.189779818058014e-06, 3.3620744943618774e-06, 3.534369170665741e-06, 3.7066638469696045e-06, 3.878958523273468e-06, 4.0512531995773315e-06, 4.223547875881195e-06, 4.395842552185059e-06, 4.568137228488922e-06, 4.740431904792786e-06, 4.912726581096649e-06, 5.085021257400513e-06, 5.257315933704376e-06, 5.42961061000824e-06, 5.601905286312103e-06, 5.774199962615967e-06, 5.94649463891983e-06, 6.118789315223694e-06, 6.291083991527557e-06, 6.463378667831421e-06, 6.6356733441352844e-06, 6.807968020439148e-06, 6.9802626967430115e-06, 7.152557373046875e-06]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 6.0, 4.0, 12.0, 22.0, 26.0, 37.0, 62.0, 127.0, 203.0, 441.0, 2022.0, 1026259.0, 17815.0, 820.0, 285.0, 152.0, 92.0, 64.0, 32.0, 29.0, 11.0, 4.0, 5.0, 3.0, 4.0, 5.0, 8.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00019228458404541016, -0.0001865886151790619, -0.00018089264631271362, -0.00017519667744636536, -0.0001695007085800171, -0.00016380473971366882, -0.00015810877084732056, -0.0001524128019809723, -0.00014671683311462402, -0.00014102086424827576, -0.0001353248953819275, -0.00012962892651557922, -0.00012393295764923096, -0.00011823698878288269, -0.00011254101991653442, -0.00010684505105018616, -0.00010114908218383789, -9.545311331748962e-05, -8.975714445114136e-05, -8.406117558479309e-05, -7.836520671844482e-05, -7.266923785209656e-05, -6.697326898574829e-05, -6.127730011940002e-05, -5.558133125305176e-05, -4.988536238670349e-05, -4.4189393520355225e-05, -3.849342465400696e-05, -3.279745578765869e-05, -2.7101486921310425e-05, -2.1405518054962158e-05, -1.570954918861389e-05, -1.0013580322265625e-05, -4.317611455917358e-06, 1.3783574104309082e-06, 7.074326276779175e-06, 1.2770295143127441e-05, 1.8466264009475708e-05, 2.4162232875823975e-05, 2.985820174217224e-05, 3.555417060852051e-05, 4.1250139474868774e-05, 4.694610834121704e-05, 5.264207720756531e-05, 5.8338046073913574e-05, 6.403401494026184e-05, 6.972998380661011e-05, 7.542595267295837e-05, 8.112192153930664e-05, 8.681789040565491e-05, 9.251385927200317e-05, 9.820982813835144e-05, 0.00010390579700469971, 0.00010960176587104797, 0.00011529773473739624, 0.00012099370360374451, 0.00012668967247009277, 0.00013238564133644104, 0.0001380816102027893, 0.00014377757906913757, 0.00014947354793548584, 0.0001551695168018341, 0.00016086548566818237, 0.00016656145453453064, 0.0001722574234008789]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 8.0, 10.0, 10.0, 19.0, 41.0, 56.0, 96.0, 142.0, 167.0, 160.0, 97.0, 72.0, 36.0, 32.0, 22.0, 11.0, 10.0, 4.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.617473602294922e-05, -7.397308945655823e-05, -7.177144289016724e-05, -6.956979632377625e-05, -6.736814975738525e-05, -6.516650319099426e-05, -6.296485662460327e-05, -6.076321005821228e-05, -5.856156349182129e-05, -5.63599169254303e-05, -5.415827035903931e-05, -5.1956623792648315e-05, -4.9754977226257324e-05, -4.755333065986633e-05, -4.535168409347534e-05, -4.315003752708435e-05, -4.094839096069336e-05, -3.874674439430237e-05, -3.654509782791138e-05, -3.4343451261520386e-05, -3.2141804695129395e-05, -2.9940158128738403e-05, -2.7738511562347412e-05, -2.553686499595642e-05, -2.333521842956543e-05, -2.113357186317444e-05, -1.8931925296783447e-05, -1.6730278730392456e-05, -1.4528632164001465e-05, -1.2326985597610474e-05, -1.0125339031219482e-05, -7.923692464828491e-06, -5.7220458984375e-06, -3.520399332046509e-06, -1.3187527656555176e-06, 8.828938007354736e-07, 3.084540367126465e-06, 5.286186933517456e-06, 7.487833499908447e-06, 9.689480066299438e-06, 1.189112663269043e-05, 1.4092773199081421e-05, 1.6294419765472412e-05, 1.8496066331863403e-05, 2.0697712898254395e-05, 2.2899359464645386e-05, 2.5101006031036377e-05, 2.7302652597427368e-05, 2.950429916381836e-05, 3.170594573020935e-05, 3.390759229660034e-05, 3.610923886299133e-05, 3.8310885429382324e-05, 4.0512531995773315e-05, 4.271417856216431e-05, 4.49158251285553e-05, 4.711747169494629e-05, 4.931911826133728e-05, 5.152076482772827e-05, 5.372241139411926e-05, 5.5924057960510254e-05, 5.8125704526901245e-05, 6.0327351093292236e-05, 6.252899765968323e-05, 6.473064422607422e-05]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 6.0, 27.0, 774.0, 193.0, 14.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04335526376962662, -0.031961411237716675, -0.020567556843161583, -0.009173702448606491, 0.0022201500833034515, 0.013614002615213394, 0.025007858872413635, 0.03640171140432358, 0.04779556393623352, 0.05918941646814346, 0.0705832690000534, 0.08197712898254395, 0.09337097406387329, 0.10476483404636383, 0.11615868657827377, 0.12755253911018372, 0.13894638419151306, 0.1503402441740036, 0.16173408925533295, 0.1731279492378235, 0.18452179431915283, 0.19591565430164337, 0.2073095142841339, 0.21870335936546326, 0.2300972193479538, 0.24149107933044434, 0.2528849244117737, 0.264278769493103, 0.27567264437675476, 0.2870664894580841, 0.29846033453941345, 0.3098542094230652, 0.32124802470207214, 0.3326418697834015, 0.3440357446670532, 0.35542958974838257, 0.3668234348297119, 0.37821727991104126, 0.389611154794693, 0.40100499987602234, 0.4123988449573517, 0.42379269003868103, 0.43518656492233276, 0.4465804100036621, 0.45797425508499146, 0.4693681001663208, 0.48076197504997253, 0.4921558201313019, 0.5035496950149536, 0.514943540096283, 0.5263373851776123, 0.5377312302589417, 0.5491251349449158, 0.5605189800262451, 0.5719128251075745, 0.5833066701889038, 0.5947005152702332, 0.6060943603515625, 0.6174882054328918, 0.6288820505142212, 0.6402759552001953, 0.6516698002815247, 0.663063645362854, 0.6744574904441833, 0.6858513355255127]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 5.0, 1.0, 3.0, 8.0, 7.0, 11.0, 13.0, 8.0, 20.0, 23.0, 33.0, 27.0, 35.0, 27.0, 45.0, 54.0, 49.0, 47.0, 44.0, 58.0, 42.0, 52.0, 60.0, 53.0, 47.0, 40.0, 43.0, 35.0, 28.0, 24.0, 15.0, 9.0, 14.0, 6.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2533220052719116, -0.24554792046546936, -0.2377738356590271, -0.22999975085258484, -0.22222565114498138, -0.21445156633853912, -0.20667748153209686, -0.1989033967256546, -0.19112929701805115, -0.1833552122116089, -0.17558112740516663, -0.16780704259872437, -0.1600329428911209, -0.15225885808467865, -0.1444847732782364, -0.13671068847179413, -0.12893660366535187, -0.1211625188589096, -0.11338842660188675, -0.10561434179544449, -0.09784024953842163, -0.09006616473197937, -0.08229207992553711, -0.07451799511909485, -0.06674390286207199, -0.05896981433033943, -0.05119572579860687, -0.04342164099216461, -0.03564755246043205, -0.027873463928699493, -0.020099379122257233, -0.012325290590524673, -0.004551202058792114, 0.0032228855416178703, 0.010996973142027855, 0.018771059811115265, 0.026545148342847824, 0.03431923687458038, 0.042093321681022644, 0.0498674102127552, 0.05764149874448776, 0.06541558355093002, 0.07318967580795288, 0.08096376061439514, 0.0887378454208374, 0.09651193767786026, 0.10428602248430252, 0.11206011474132538, 0.11983419954776764, 0.1276082843542099, 0.13538236916065216, 0.14315646886825562, 0.15093055367469788, 0.15870463848114014, 0.1664787232875824, 0.17425280809402466, 0.18202689290046692, 0.18980097770690918, 0.19757506251335144, 0.2053491473197937, 0.21312324702739716, 0.22089733183383942, 0.22867141664028168, 0.23644550144672394, 0.2442196011543274]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 7.0, 3.0, 9.0, 6.0, 14.0, 12.0, 33.0, 28.0, 52.0, 66.0, 115.0, 128.0, 219.0, 325.0, 624.0, 1298.0, 18874.0, 4156866.0, 11910.0, 1524.0, 690.0, 401.0, 305.0, 207.0, 153.0, 107.0, 74.0, 60.0, 44.0, 35.0, 17.0, 21.0, 10.0, 19.0, 5.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.037506103515625, -0.03627634048461914, -0.03504657745361328, -0.03381681442260742, -0.03258705139160156, -0.0313572883605957, -0.030127525329589844, -0.028897762298583984, -0.027667999267578125, -0.026438236236572266, -0.025208473205566406, -0.023978710174560547, -0.022748947143554688, -0.021519184112548828, -0.02028942108154297, -0.01905965805053711, -0.01782989501953125, -0.01660013198852539, -0.015370368957519531, -0.014140605926513672, -0.012910842895507812, -0.011681079864501953, -0.010451316833496094, -0.009221553802490234, -0.007991790771484375, -0.006762027740478516, -0.005532264709472656, -0.004302501678466797, -0.0030727386474609375, -0.0018429756164550781, -0.0006132125854492188, 0.0006165504455566406, 0.0018463134765625, 0.0030760765075683594, 0.004305839538574219, 0.005535602569580078, 0.0067653656005859375, 0.007995128631591797, 0.009224891662597656, 0.010454654693603516, 0.011684417724609375, 0.012914180755615234, 0.014143943786621094, 0.015373706817626953, 0.016603469848632812, 0.017833232879638672, 0.01906299591064453, 0.02029275894165039, 0.02152252197265625, 0.02275228500366211, 0.02398204803466797, 0.025211811065673828, 0.026441574096679688, 0.027671337127685547, 0.028901100158691406, 0.030130863189697266, 0.031360626220703125, 0.032590389251708984, 0.033820152282714844, 0.0350499153137207, 0.03627967834472656, 0.03750944137573242, 0.03873920440673828, 0.03996896743774414, 0.04119873046875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 4.0, 4.0, 13.0, 10.0, 6.0, 9.0, 17.0, 51.0, 243.0, 369.0, 128.0, 28.0, 14.0, 9.0, 12.0, 12.0, 8.0, 4.0, 4.0, 5.0, 4.0, 4.0, 2.0, 3.0, 4.0, 9.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00970458984375, -0.009387731552124023, -0.009070873260498047, -0.00875401496887207, -0.008437156677246094, -0.008120298385620117, -0.007803440093994141, -0.007486581802368164, -0.0071697235107421875, -0.006852865219116211, -0.006536006927490234, -0.006219148635864258, -0.005902290344238281, -0.005585432052612305, -0.005268573760986328, -0.0049517154693603516, -0.004634857177734375, -0.0043179988861083984, -0.004001140594482422, -0.0036842823028564453, -0.0033674240112304688, -0.003050565719604492, -0.0027337074279785156, -0.002416849136352539, -0.0020999908447265625, -0.001783132553100586, -0.0014662742614746094, -0.0011494159698486328, -0.0008325576782226562, -0.0005156993865966797, -0.00019884109497070312, 0.00011801719665527344, 0.00043487548828125, 0.0007517337799072266, 0.0010685920715332031, 0.0013854503631591797, 0.0017023086547851562, 0.002019166946411133, 0.0023360252380371094, 0.002652883529663086, 0.0029697418212890625, 0.003286600112915039, 0.0036034584045410156, 0.003920316696166992, 0.004237174987792969, 0.004554033279418945, 0.004870891571044922, 0.0051877498626708984, 0.005504608154296875, 0.0058214664459228516, 0.006138324737548828, 0.006455183029174805, 0.006772041320800781, 0.007088899612426758, 0.007405757904052734, 0.007722616195678711, 0.008039474487304688, 0.008356332778930664, 0.00867319107055664, 0.008990049362182617, 0.009306907653808594, 0.00962376594543457, 0.009940624237060547, 0.010257482528686523, 0.0105743408203125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 6.0, 5.0, 3.0, 6.0, 10.0, 7.0, 9.0, 12.0, 7.0, 15.0, 14.0, 21.0, 37.0, 53.0, 88.0, 154.0, 463.0, 2731.0, 4061645.0, 126088.0, 2112.0, 356.0, 174.0, 59.0, 39.0, 42.0, 24.0, 16.0, 19.0, 12.0, 15.0, 3.0, 10.0, 5.0, 3.0, 3.0, 6.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0826416015625, -0.0799713134765625, -0.077301025390625, -0.0746307373046875, -0.07196044921875, -0.0692901611328125, -0.066619873046875, -0.0639495849609375, -0.061279296875, -0.0586090087890625, -0.055938720703125, -0.0532684326171875, -0.05059814453125, -0.0479278564453125, -0.045257568359375, -0.0425872802734375, -0.0399169921875, -0.0372467041015625, -0.034576416015625, -0.0319061279296875, -0.02923583984375, -0.0265655517578125, -0.023895263671875, -0.0212249755859375, -0.0185546875, -0.0158843994140625, -0.013214111328125, -0.0105438232421875, -0.00787353515625, -0.0052032470703125, -0.002532958984375, 0.0001373291015625, 0.0028076171875, 0.0054779052734375, 0.008148193359375, 0.0108184814453125, 0.01348876953125, 0.0161590576171875, 0.018829345703125, 0.0214996337890625, 0.024169921875, 0.0268402099609375, 0.029510498046875, 0.0321807861328125, 0.03485107421875, 0.0375213623046875, 0.040191650390625, 0.0428619384765625, 0.0455322265625, 0.0482025146484375, 0.050872802734375, 0.0535430908203125, 0.05621337890625, 0.0588836669921875, 0.061553955078125, 0.0642242431640625, 0.06689453125, 0.0695648193359375, 0.072235107421875, 0.0749053955078125, 0.07757568359375, 0.0802459716796875, 0.082916259765625, 0.0855865478515625, 0.0882568359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 13.0, 11.0, 7.0, 21.0, 50.0, 73.0, 457.0, 3149.0, 135.0, 58.0, 20.0, 12.0, 5.0, 5.0, 6.0, 7.0, 5.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.016998291015625, -0.01648545265197754, -0.015972614288330078, -0.015459775924682617, -0.014946937561035156, -0.014434099197387695, -0.013921260833740234, -0.013408422470092773, -0.012895584106445312, -0.012382745742797852, -0.01186990737915039, -0.01135706901550293, -0.010844230651855469, -0.010331392288208008, -0.009818553924560547, -0.009305715560913086, -0.008792877197265625, -0.008280038833618164, -0.007767200469970703, -0.007254362106323242, -0.006741523742675781, -0.00622868537902832, -0.005715847015380859, -0.0052030086517333984, -0.0046901702880859375, -0.0041773319244384766, -0.0036644935607910156, -0.0031516551971435547, -0.0026388168334960938, -0.002125978469848633, -0.0016131401062011719, -0.001100301742553711, -0.00058746337890625, -7.462501525878906e-05, 0.0004382133483886719, 0.0009510517120361328, 0.0014638900756835938, 0.0019767284393310547, 0.0024895668029785156, 0.0030024051666259766, 0.0035152435302734375, 0.0040280818939208984, 0.004540920257568359, 0.00505375862121582, 0.005566596984863281, 0.006079435348510742, 0.006592273712158203, 0.007105112075805664, 0.007617950439453125, 0.008130788803100586, 0.008643627166748047, 0.009156465530395508, 0.009669303894042969, 0.01018214225769043, 0.01069498062133789, 0.011207818984985352, 0.011720657348632812, 0.012233495712280273, 0.012746334075927734, 0.013259172439575195, 0.013772010803222656, 0.014284849166870117, 0.014797687530517578, 0.015310525894165039, 0.0158233642578125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 960.0, 50.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.26537030935287476, -0.2606084942817688, -0.25584667921066284, -0.2510848939418793, -0.24632307887077332, -0.24156126379966736, -0.2367994636297226, -0.23203766345977783, -0.22727584838867188, -0.22251403331756592, -0.21775223314762115, -0.2129904329776764, -0.20822861790657043, -0.20346680283546448, -0.19870500266551971, -0.19394320249557495, -0.189181387424469, -0.18441957235336304, -0.17965777218341827, -0.1748959720134735, -0.17013415694236755, -0.1653723418712616, -0.16061054170131683, -0.15584874153137207, -0.1510869264602661, -0.14632511138916016, -0.1415633112192154, -0.13680151104927063, -0.13203969597816467, -0.12727788090705872, -0.12251608073711395, -0.11775427311658859, -0.11299246549606323, -0.10823065787553787, -0.10346885025501251, -0.09870704263448715, -0.09394523501396179, -0.08918342739343643, -0.08442161977291107, -0.07965981215238571, -0.07489800453186035, -0.07013619691133499, -0.06537438929080963, -0.06061258167028427, -0.05585077404975891, -0.05108896642923355, -0.04632715880870819, -0.04156535118818283, -0.03680354356765747, -0.03204173594713211, -0.02727992832660675, -0.02251812070608139, -0.01775631308555603, -0.01299450546503067, -0.00823269784450531, -0.00347089022397995, 0.0012909173965454102, 0.00605272501707077, 0.01081453263759613, 0.01557634025812149, 0.02033814787864685, 0.02509995549917221, 0.02986176311969757, 0.03462357074022293, 0.03938537836074829]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 9.0, 5.0, 12.0, 12.0, 18.0, 21.0, 24.0, 25.0, 36.0, 37.0, 39.0, 41.0, 50.0, 56.0, 64.0, 54.0, 70.0, 67.0, 57.0, 45.0, 37.0, 38.0, 44.0, 30.0, 24.0, 23.0, 12.0, 13.0, 18.0, 8.0, 5.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0466805100440979, -0.04540916532278061, -0.04413782060146332, -0.042866479605436325, -0.041595134884119034, -0.04032379016280174, -0.03905244916677475, -0.03778110444545746, -0.03650975972414017, -0.035238415002822876, -0.033967070281505585, -0.03269572928547859, -0.0314243845641613, -0.03015303984284401, -0.028881696984171867, -0.027610354125499725, -0.026339009404182434, -0.025067664682865143, -0.023796321824193, -0.02252497896552086, -0.021253634244203568, -0.019982289522886276, -0.018710946664214134, -0.017439603805541992, -0.0161682590842247, -0.014896915294229984, -0.013625571504235268, -0.012354227714240551, -0.011082883924245834, -0.009811540134251118, -0.008540196344256401, -0.007268852554261684, -0.005997508764266968, -0.004726164974272251, -0.0034548211842775345, -0.002183477394282818, -0.0009121336042881012, 0.00035921018570661545, 0.001630553975701332, 0.0029018977656960487, 0.004173241555690765, 0.005444585345685482, 0.006715929135680199, 0.007987272925674915, 0.009258616715669632, 0.010529960505664349, 0.011801304295659065, 0.013072648085653782, 0.014343991875648499, 0.015615335665643215, 0.016886679455637932, 0.018158022314310074, 0.019429367035627365, 0.020700711756944656, 0.0219720546156168, 0.02324339747428894, 0.02451474219560623, 0.025786086916923523, 0.027057429775595665, 0.028328772634267807, 0.0296001173555851, 0.03087146207690239, 0.03214280307292938, 0.033414147794246674, 0.034685492515563965]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 10.0, 8.0, 12.0, 16.0, 20.0, 32.0, 37.0, 54.0, 64.0, 109.0, 135.0, 172.0, 275.0, 382.0, 546.0, 817.0, 1203.0, 1854.0, 3010.0, 5184.0, 9521.0, 21327.0, 190503.0, 759489.0, 27116.0, 11110.0, 5805.0, 3389.0, 2099.0, 1396.0, 862.0, 580.0, 422.0, 272.0, 205.0, 153.0, 95.0, 71.0, 53.0, 43.0, 27.0, 19.0, 15.0, 13.0, 9.0, 5.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0216217041015625, -0.020926713943481445, -0.02023172378540039, -0.019536733627319336, -0.01884174346923828, -0.018146753311157227, -0.017451763153076172, -0.016756772994995117, -0.016061782836914062, -0.015366792678833008, -0.014671802520751953, -0.013976812362670898, -0.013281822204589844, -0.012586832046508789, -0.011891841888427734, -0.01119685173034668, -0.010501861572265625, -0.00980687141418457, -0.009111881256103516, -0.008416891098022461, -0.007721900939941406, -0.0070269107818603516, -0.006331920623779297, -0.005636930465698242, -0.0049419403076171875, -0.004246950149536133, -0.003551959991455078, -0.0028569698333740234, -0.0021619796752929688, -0.001466989517211914, -0.0007719993591308594, -7.700920104980469e-05, 0.00061798095703125, 0.0013129711151123047, 0.0020079612731933594, 0.002702951431274414, 0.0033979415893554688, 0.0040929317474365234, 0.004787921905517578, 0.005482912063598633, 0.0061779022216796875, 0.006872892379760742, 0.007567882537841797, 0.008262872695922852, 0.008957862854003906, 0.009652853012084961, 0.010347843170166016, 0.01104283332824707, 0.011737823486328125, 0.01243281364440918, 0.013127803802490234, 0.013822793960571289, 0.014517784118652344, 0.015212774276733398, 0.015907764434814453, 0.016602754592895508, 0.017297744750976562, 0.017992734909057617, 0.018687725067138672, 0.019382715225219727, 0.02007770538330078, 0.020772695541381836, 0.02146768569946289, 0.022162675857543945, 0.022857666015625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 0.0, 7.0, 5.0, 4.0, 5.0, 14.0, 6.0, 8.0, 9.0, 20.0, 61.0, 253.0, 357.0, 117.0, 27.0, 14.0, 9.0, 9.0, 14.0, 8.0, 6.0, 2.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 9.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00946807861328125, -0.009158492088317871, -0.008848905563354492, -0.008539319038391113, -0.008229732513427734, -0.007920145988464355, -0.0076105594635009766, -0.007300972938537598, -0.006991386413574219, -0.00668179988861084, -0.006372213363647461, -0.006062626838684082, -0.005753040313720703, -0.005443453788757324, -0.005133867263793945, -0.004824280738830566, -0.0045146942138671875, -0.004205107688903809, -0.0038955211639404297, -0.0035859346389770508, -0.003276348114013672, -0.002966761589050293, -0.002657175064086914, -0.002347588539123535, -0.0020380020141601562, -0.0017284154891967773, -0.0014188289642333984, -0.0011092424392700195, -0.0007996559143066406, -0.0004900693893432617, -0.0001804828643798828, 0.0001291036605834961, 0.000438690185546875, 0.0007482767105102539, 0.0010578632354736328, 0.0013674497604370117, 0.0016770362854003906, 0.0019866228103637695, 0.0022962093353271484, 0.0026057958602905273, 0.0029153823852539062, 0.003224968910217285, 0.003534555435180664, 0.003844141960144043, 0.004153728485107422, 0.004463315010070801, 0.00477290153503418, 0.005082488059997559, 0.0053920745849609375, 0.005701661109924316, 0.006011247634887695, 0.006320834159851074, 0.006630420684814453, 0.006940007209777832, 0.007249593734741211, 0.00755918025970459, 0.007868766784667969, 0.008178353309631348, 0.008487939834594727, 0.008797526359558105, 0.009107112884521484, 0.009416699409484863, 0.009726285934448242, 0.010035872459411621, 0.010345458984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 2.0, 6.0, 5.0, 7.0, 14.0, 12.0, 15.0, 25.0, 25.0, 21.0, 28.0, 46.0, 40.0, 64.0, 73.0, 92.0, 92.0, 146.0, 191.0, 254.0, 362.0, 668.0, 1702.0, 11452.0, 927394.0, 99224.0, 3734.0, 1054.0, 499.0, 295.0, 207.0, 155.0, 119.0, 91.0, 90.0, 61.0, 54.0, 54.0, 30.0, 23.0, 27.0, 23.0, 18.0, 15.0, 14.0, 8.0, 4.0, 9.0, 3.0, 8.0, 1.0, 2.0, 0.0, 0.0, 5.0], "bins": [-0.0621337890625, -0.06029367446899414, -0.05845355987548828, -0.05661344528198242, -0.05477333068847656, -0.0529332160949707, -0.051093101501464844, -0.049252986907958984, -0.047412872314453125, -0.045572757720947266, -0.043732643127441406, -0.04189252853393555, -0.04005241394042969, -0.03821229934692383, -0.03637218475341797, -0.03453207015991211, -0.03269195556640625, -0.03085184097290039, -0.02901172637939453, -0.027171611785888672, -0.025331497192382812, -0.023491382598876953, -0.021651268005371094, -0.019811153411865234, -0.017971038818359375, -0.016130924224853516, -0.014290809631347656, -0.012450695037841797, -0.010610580444335938, -0.008770465850830078, -0.006930351257324219, -0.005090236663818359, -0.0032501220703125, -0.0014100074768066406, 0.00043010711669921875, 0.002270221710205078, 0.0041103363037109375, 0.005950450897216797, 0.007790565490722656, 0.009630680084228516, 0.011470794677734375, 0.013310909271240234, 0.015151023864746094, 0.016991138458251953, 0.018831253051757812, 0.020671367645263672, 0.02251148223876953, 0.02435159683227539, 0.02619171142578125, 0.02803182601928711, 0.02987194061279297, 0.03171205520629883, 0.03355216979980469, 0.03539228439331055, 0.037232398986816406, 0.039072513580322266, 0.040912628173828125, 0.042752742767333984, 0.044592857360839844, 0.0464329719543457, 0.04827308654785156, 0.05011320114135742, 0.05195331573486328, 0.05379343032836914, 0.055633544921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 7.0, 5.0, 8.0, 9.0, 9.0, 9.0, 18.0, 11.0, 24.0, 20.0, 22.0, 37.0, 38.0, 36.0, 54.0, 31.0, 38.0, 57.0, 45.0, 47.0, 30.0, 43.0, 35.0, 48.0, 27.0, 40.0, 28.0, 36.0, 24.0, 21.0, 21.0, 22.0, 17.0, 15.0, 9.0, 13.0, 3.0, 6.0, 7.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.030426025390625, -0.029525041580200195, -0.02862405776977539, -0.027723073959350586, -0.02682209014892578, -0.025921106338500977, -0.025020122528076172, -0.024119138717651367, -0.023218154907226562, -0.022317171096801758, -0.021416187286376953, -0.02051520347595215, -0.019614219665527344, -0.01871323585510254, -0.017812252044677734, -0.01691126823425293, -0.016010284423828125, -0.01510930061340332, -0.014208316802978516, -0.013307332992553711, -0.012406349182128906, -0.011505365371704102, -0.010604381561279297, -0.009703397750854492, -0.008802413940429688, -0.007901430130004883, -0.007000446319580078, -0.0060994625091552734, -0.005198478698730469, -0.004297494888305664, -0.0033965110778808594, -0.0024955272674560547, -0.00159454345703125, -0.0006935596466064453, 0.00020742416381835938, 0.001108407974243164, 0.0020093917846679688, 0.0029103755950927734, 0.003811359405517578, 0.004712343215942383, 0.0056133270263671875, 0.006514310836791992, 0.007415294647216797, 0.008316278457641602, 0.009217262268066406, 0.010118246078491211, 0.011019229888916016, 0.01192021369934082, 0.012821197509765625, 0.01372218132019043, 0.014623165130615234, 0.015524148941040039, 0.016425132751464844, 0.01732611656188965, 0.018227100372314453, 0.019128084182739258, 0.020029067993164062, 0.020930051803588867, 0.021831035614013672, 0.022732019424438477, 0.02363300323486328, 0.024533987045288086, 0.02543497085571289, 0.026335954666137695, 0.0272369384765625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 2.0, 6.0, 9.0, 2.0, 12.0, 10.0, 18.0, 29.0, 37.0, 52.0, 69.0, 130.0, 157.0, 258.0, 462.0, 897.0, 2644.0, 13507.0, 881742.0, 137882.0, 6927.0, 1820.0, 779.0, 401.0, 219.0, 146.0, 95.0, 73.0, 45.0, 24.0, 24.0, 11.0, 23.0, 9.0, 9.0, 2.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0471553802490234e-05, -3.9159320294857025e-05, -3.7847086787223816e-05, -3.653485327959061e-05, -3.52226197719574e-05, -3.391038626432419e-05, -3.259815275669098e-05, -3.128591924905777e-05, -2.997368574142456e-05, -2.866145223379135e-05, -2.7349218726158142e-05, -2.6036985218524933e-05, -2.4724751710891724e-05, -2.3412518203258514e-05, -2.2100284695625305e-05, -2.0788051187992096e-05, -1.9475817680358887e-05, -1.8163584172725677e-05, -1.6851350665092468e-05, -1.553911715745926e-05, -1.422688364982605e-05, -1.291465014219284e-05, -1.1602416634559631e-05, -1.0290183126926422e-05, -8.977949619293213e-06, -7.665716111660004e-06, -6.3534826040267944e-06, -5.041249096393585e-06, -3.729015588760376e-06, -2.4167820811271667e-06, -1.1045485734939575e-06, 2.076849341392517e-07, 1.519918441772461e-06, 2.83215194940567e-06, 4.144385457038879e-06, 5.456618964672089e-06, 6.768852472305298e-06, 8.081085979938507e-06, 9.393319487571716e-06, 1.0705552995204926e-05, 1.2017786502838135e-05, 1.3330020010471344e-05, 1.4642253518104553e-05, 1.5954487025737762e-05, 1.726672053337097e-05, 1.857895404100418e-05, 1.989118754863739e-05, 2.12034210562706e-05, 2.251565456390381e-05, 2.3827888071537018e-05, 2.5140121579170227e-05, 2.6452355086803436e-05, 2.7764588594436646e-05, 2.9076822102069855e-05, 3.0389055609703064e-05, 3.170128911733627e-05, 3.301352262496948e-05, 3.432575613260269e-05, 3.56379896402359e-05, 3.695022314786911e-05, 3.826245665550232e-05, 3.957469016313553e-05, 4.088692367076874e-05, 4.219915717840195e-05, 4.3511390686035156e-05]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 8.0, 9.0, 15.0, 13.0, 10.0, 26.0, 35.0, 36.0, 31.0, 46.0, 47.0, 73.0, 60.0, 50.0, 76.0, 76.0, 59.0, 34.0, 45.0, 51.0, 46.0, 38.0, 23.0, 21.0, 16.0, 11.0, 5.0, 11.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.649162292480469e-06, -4.4833868741989136e-06, -4.317611455917358e-06, -4.151836037635803e-06, -3.986060619354248e-06, -3.820285201072693e-06, -3.6545097827911377e-06, -3.4887343645095825e-06, -3.3229589462280273e-06, -3.157183527946472e-06, -2.991408109664917e-06, -2.825632691383362e-06, -2.6598572731018066e-06, -2.4940818548202515e-06, -2.3283064365386963e-06, -2.162531018257141e-06, -1.996755599975586e-06, -1.8309801816940308e-06, -1.6652047634124756e-06, -1.4994293451309204e-06, -1.3336539268493652e-06, -1.16787850856781e-06, -1.0021030902862549e-06, -8.363276720046997e-07, -6.705522537231445e-07, -5.047768354415894e-07, -3.390014171600342e-07, -1.73225998878479e-07, -7.450580596923828e-09, 1.5832483768463135e-07, 3.241002559661865e-07, 4.898756742477417e-07, 6.556510925292969e-07, 8.21426510810852e-07, 9.872019290924072e-07, 1.1529773473739624e-06, 1.3187527656555176e-06, 1.4845281839370728e-06, 1.650303602218628e-06, 1.816079020500183e-06, 1.9818544387817383e-06, 2.1476298570632935e-06, 2.3134052753448486e-06, 2.479180693626404e-06, 2.644956111907959e-06, 2.810731530189514e-06, 2.9765069484710693e-06, 3.1422823667526245e-06, 3.3080577850341797e-06, 3.473833203315735e-06, 3.63960862159729e-06, 3.8053840398788452e-06, 3.9711594581604e-06, 4.1369348764419556e-06, 4.302710294723511e-06, 4.468485713005066e-06, 4.634261131286621e-06, 4.800036549568176e-06, 4.9658119678497314e-06, 5.131587386131287e-06, 5.297362804412842e-06, 5.463138222694397e-06, 5.628913640975952e-06, 5.794689059257507e-06, 5.9604644775390625e-06]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 9.0, 10.0, 15.0, 13.0, 26.0, 18.0, 41.0, 55.0, 105.0, 151.0, 252.0, 427.0, 1531.0, 65986.0, 975765.0, 2771.0, 577.0, 288.0, 169.0, 112.0, 72.0, 34.0, 33.0, 21.0, 18.0, 10.0, 9.0, 7.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.927417755126953e-05, -7.695145905017853e-05, -7.462874054908752e-05, -7.230602204799652e-05, -6.998330354690552e-05, -6.766058504581451e-05, -6.533786654472351e-05, -6.301514804363251e-05, -6.0692429542541504e-05, -5.83697110414505e-05, -5.60469925403595e-05, -5.3724274039268494e-05, -5.140155553817749e-05, -4.907883703708649e-05, -4.6756118535995483e-05, -4.443340003490448e-05, -4.2110681533813477e-05, -3.978796303272247e-05, -3.746524453163147e-05, -3.5142526030540466e-05, -3.281980752944946e-05, -3.049708902835846e-05, -2.8174370527267456e-05, -2.5851652026176453e-05, -2.352893352508545e-05, -2.1206215023994446e-05, -1.8883496522903442e-05, -1.656077802181244e-05, -1.4238059520721436e-05, -1.1915341019630432e-05, -9.592622518539429e-06, -7.269904017448425e-06, -4.947185516357422e-06, -2.6244670152664185e-06, -3.0174851417541504e-07, 2.0209699869155884e-06, 4.343688488006592e-06, 6.666406989097595e-06, 8.989125490188599e-06, 1.1311843991279602e-05, 1.3634562492370605e-05, 1.595728099346161e-05, 1.8279999494552612e-05, 2.0602717995643616e-05, 2.292543649673462e-05, 2.5248154997825623e-05, 2.7570873498916626e-05, 2.989359200000763e-05, 3.221631050109863e-05, 3.4539029002189636e-05, 3.686174750328064e-05, 3.918446600437164e-05, 4.1507184505462646e-05, 4.382990300655365e-05, 4.615262150764465e-05, 4.847534000873566e-05, 5.079805850982666e-05, 5.3120777010917664e-05, 5.544349551200867e-05, 5.776621401309967e-05, 6.0088932514190674e-05, 6.241165101528168e-05, 6.473436951637268e-05, 6.705708801746368e-05, 6.937980651855469e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 5.0, 11.0, 4.0, 13.0, 22.0, 27.0, 41.0, 46.0, 52.0, 96.0, 118.0, 148.0, 114.0, 74.0, 48.0, 51.0, 40.0, 18.0, 21.0, 12.0, 8.0, 5.0, 6.0, 2.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8743019104003906e-05, -3.764685243368149e-05, -3.655068576335907e-05, -3.545451909303665e-05, -3.4358352422714233e-05, -3.3262185752391815e-05, -3.21660190820694e-05, -3.106985241174698e-05, -2.997368574142456e-05, -2.8877519071102142e-05, -2.7781352400779724e-05, -2.6685185730457306e-05, -2.5589019060134888e-05, -2.449285238981247e-05, -2.339668571949005e-05, -2.2300519049167633e-05, -2.1204352378845215e-05, -2.0108185708522797e-05, -1.901201903820038e-05, -1.791585236787796e-05, -1.6819685697555542e-05, -1.5723519027233124e-05, -1.4627352356910706e-05, -1.3531185686588287e-05, -1.2435019016265869e-05, -1.1338852345943451e-05, -1.0242685675621033e-05, -9.146519005298615e-06, -8.050352334976196e-06, -6.954185664653778e-06, -5.85801899433136e-06, -4.761852324008942e-06, -3.6656856536865234e-06, -2.5695189833641052e-06, -1.473352313041687e-06, -3.771856427192688e-07, 7.189810276031494e-07, 1.8151476979255676e-06, 2.911314368247986e-06, 4.007481038570404e-06, 5.103647708892822e-06, 6.1998143792152405e-06, 7.295981049537659e-06, 8.392147719860077e-06, 9.488314390182495e-06, 1.0584481060504913e-05, 1.1680647730827332e-05, 1.277681440114975e-05, 1.3872981071472168e-05, 1.4969147741794586e-05, 1.6065314412117004e-05, 1.7161481082439423e-05, 1.825764775276184e-05, 1.935381442308426e-05, 2.0449981093406677e-05, 2.1546147763729095e-05, 2.2642314434051514e-05, 2.3738481104373932e-05, 2.483464777469635e-05, 2.593081444501877e-05, 2.7026981115341187e-05, 2.8123147785663605e-05, 2.9219314455986023e-05, 3.031548112630844e-05, 3.141164779663086e-05]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [12.0, 938.0, 64.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03425495699048042, -0.014300649985671043, 0.005653657019138336, 0.025607962161302567, 0.045562271028757095, 0.06551657617092133, 0.08547088503837585, 0.10542519390583038, 0.1253795027732849, 0.14533381164073944, 0.16528812050819397, 0.1852424144744873, 0.20519673824310303, 0.22515103220939636, 0.2451053410768509, 0.2650596499443054, 0.28501394391059875, 0.3049682378768921, 0.3249225616455078, 0.34487685561180115, 0.36483117938041687, 0.3847854733467102, 0.4047397971153259, 0.42469409108161926, 0.444648414850235, 0.4646027088165283, 0.48455703258514404, 0.5045113563537598, 0.5244656205177307, 0.5444199442863464, 0.5643742680549622, 0.5843285322189331, 0.6042829155921936, 0.6242372393608093, 0.6441915035247803, 0.664145827293396, 0.6841001510620117, 0.7040544748306274, 0.7240087389945984, 0.7439630627632141, 0.7639173865318298, 0.7838717103004456, 0.8038259744644165, 0.8237802982330322, 0.843734622001648, 0.8636889457702637, 0.8836432099342346, 0.9035975337028503, 0.9235517978668213, 0.943506121635437, 0.963460385799408, 0.9834147095680237, 1.0033689737319946, 1.0233232975006104, 1.043277621269226, 1.0632319450378418, 1.0831862688064575, 1.1031405925750732, 1.123094916343689, 1.1430492401123047, 1.1630034446716309, 1.1829577684402466, 1.2029120922088623, 1.222866415977478, 1.2428207397460938]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 6.0, 9.0, 12.0, 11.0, 14.0, 26.0, 31.0, 35.0, 50.0, 54.0, 42.0, 65.0, 76.0, 64.0, 77.0, 60.0, 67.0, 60.0, 55.0, 52.0, 36.0, 23.0, 20.0, 17.0, 16.0, 10.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2950636148452759, -0.2866082191467285, -0.27815282344818115, -0.2696973979473114, -0.26124200224876404, -0.2527866065502167, -0.24433119595050812, -0.23587578535079956, -0.2274203896522522, -0.21896499395370483, -0.21050958335399628, -0.20205417275428772, -0.19359877705574036, -0.185143381357193, -0.17668797075748444, -0.16823256015777588, -0.15977716445922852, -0.15132176876068115, -0.1428663581609726, -0.13441094756126404, -0.12595555186271667, -0.11750014871358871, -0.10904474556446075, -0.1005893424153328, -0.09213393926620483, -0.08367853611707687, -0.07522313296794891, -0.06676772981882095, -0.05831232666969299, -0.04985692352056503, -0.04140152037143707, -0.03294611722230911, -0.024490714073181152, -0.016035310924053192, -0.007579907774925232, 0.0008754953742027283, 0.009330898523330688, 0.01778630167245865, 0.02624170482158661, 0.03469710797071457, 0.04315251111984253, 0.05160791426897049, 0.06006331741809845, 0.06851872056722641, 0.07697412371635437, 0.08542952686548233, 0.09388493001461029, 0.10234033316373825, 0.11079573631286621, 0.11925113946199417, 0.12770654261112213, 0.1361619532108307, 0.14461734890937805, 0.15307274460792542, 0.16152815520763397, 0.16998356580734253, 0.1784389615058899, 0.18689435720443726, 0.1953497678041458, 0.20380517840385437, 0.21226057410240173, 0.2207159698009491, 0.22917138040065765, 0.2376267910003662, 0.24608218669891357]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 4.0, 7.0, 6.0, 5.0, 11.0, 10.0, 15.0, 15.0, 25.0, 26.0, 35.0, 52.0, 64.0, 84.0, 138.0, 220.0, 644.0, 11736.0, 4171602.0, 8169.0, 492.0, 257.0, 159.0, 98.0, 80.0, 64.0, 39.0, 39.0, 23.0, 29.0, 23.0, 20.0, 15.0, 13.0, 15.0, 10.0, 4.0, 9.0, 2.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.031219482421875, -0.03016185760498047, -0.029104232788085938, -0.028046607971191406, -0.026988983154296875, -0.025931358337402344, -0.024873733520507812, -0.02381610870361328, -0.02275848388671875, -0.02170085906982422, -0.020643234252929688, -0.019585609436035156, -0.018527984619140625, -0.017470359802246094, -0.016412734985351562, -0.015355110168457031, -0.0142974853515625, -0.013239860534667969, -0.012182235717773438, -0.011124610900878906, -0.010066986083984375, -0.009009361267089844, -0.007951736450195312, -0.006894111633300781, -0.00583648681640625, -0.004778861999511719, -0.0037212371826171875, -0.0026636123657226562, -0.001605987548828125, -0.0005483627319335938, 0.0005092620849609375, 0.0015668869018554688, 0.00262451171875, 0.0036821365356445312, 0.0047397613525390625, 0.005797386169433594, 0.006855010986328125, 0.007912635803222656, 0.008970260620117188, 0.010027885437011719, 0.01108551025390625, 0.012143135070800781, 0.013200759887695312, 0.014258384704589844, 0.015316009521484375, 0.016373634338378906, 0.017431259155273438, 0.01848888397216797, 0.0195465087890625, 0.02060413360595703, 0.021661758422851562, 0.022719383239746094, 0.023777008056640625, 0.024834632873535156, 0.025892257690429688, 0.02694988250732422, 0.02800750732421875, 0.02906513214111328, 0.030122756958007812, 0.031180381774902344, 0.032238006591796875, 0.033295631408691406, 0.03435325622558594, 0.03541088104248047, 0.036468505859375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 5.0, 4.0, 7.0, 10.0, 10.0, 7.0, 14.0, 15.0, 69.0, 238.0, 326.0, 139.0, 44.0, 9.0, 12.0, 9.0, 11.0, 10.0, 7.0, 2.0, 3.0, 6.0, 4.0, 2.0, 2.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0087127685546875, -0.008418679237365723, -0.008124589920043945, -0.007830500602722168, -0.007536411285400391, -0.007242321968078613, -0.006948232650756836, -0.006654143333435059, -0.006360054016113281, -0.006065964698791504, -0.0057718753814697266, -0.005477786064147949, -0.005183696746826172, -0.0048896074295043945, -0.004595518112182617, -0.00430142879486084, -0.0040073394775390625, -0.003713250160217285, -0.003419160842895508, -0.0031250715255737305, -0.002830982208251953, -0.0025368928909301758, -0.0022428035736083984, -0.001948714256286621, -0.0016546249389648438, -0.0013605356216430664, -0.001066446304321289, -0.0007723569869995117, -0.0004782676696777344, -0.00018417835235595703, 0.00010991096496582031, 0.00040400028228759766, 0.000698089599609375, 0.0009921789169311523, 0.0012862682342529297, 0.001580357551574707, 0.0018744468688964844, 0.0021685361862182617, 0.002462625503540039, 0.0027567148208618164, 0.0030508041381835938, 0.003344893455505371, 0.0036389827728271484, 0.003933072090148926, 0.004227161407470703, 0.0045212507247924805, 0.004815340042114258, 0.005109429359436035, 0.0054035186767578125, 0.00569760799407959, 0.005991697311401367, 0.0062857866287231445, 0.006579875946044922, 0.006873965263366699, 0.0071680545806884766, 0.007462143898010254, 0.007756233215332031, 0.008050322532653809, 0.008344411849975586, 0.008638501167297363, 0.00893259048461914, 0.009226679801940918, 0.009520769119262695, 0.009814858436584473, 0.01010894775390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 1.0, 8.0, 6.0, 14.0, 12.0, 21.0, 42.0, 98.0, 376.0, 3730.0, 4184109.0, 5113.0, 494.0, 116.0, 55.0, 22.0, 31.0, 6.0, 14.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0845947265625, -0.08234071731567383, -0.08008670806884766, -0.07783269882202148, -0.07557868957519531, -0.07332468032836914, -0.07107067108154297, -0.0688166618347168, -0.06656265258789062, -0.06430864334106445, -0.06205463409423828, -0.05980062484741211, -0.05754661560058594, -0.055292606353759766, -0.053038597106933594, -0.05078458786010742, -0.04853057861328125, -0.04627656936645508, -0.044022560119628906, -0.041768550872802734, -0.03951454162597656, -0.03726053237915039, -0.03500652313232422, -0.03275251388549805, -0.030498504638671875, -0.028244495391845703, -0.02599048614501953, -0.02373647689819336, -0.021482467651367188, -0.019228458404541016, -0.016974449157714844, -0.014720439910888672, -0.0124664306640625, -0.010212421417236328, -0.007958412170410156, -0.005704402923583984, -0.0034503936767578125, -0.0011963844299316406, 0.0010576248168945312, 0.003311634063720703, 0.005565643310546875, 0.007819652557373047, 0.010073661804199219, 0.01232767105102539, 0.014581680297851562, 0.016835689544677734, 0.019089698791503906, 0.021343708038330078, 0.02359771728515625, 0.025851726531982422, 0.028105735778808594, 0.030359745025634766, 0.03261375427246094, 0.03486776351928711, 0.03712177276611328, 0.03937578201293945, 0.041629791259765625, 0.0438838005065918, 0.04613780975341797, 0.04839181900024414, 0.05064582824707031, 0.052899837493896484, 0.055153846740722656, 0.05740785598754883, 0.059661865234375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 5.0, 5.0, 6.0, 19.0, 47.0, 163.0, 3591.0, 150.0, 41.0, 14.0, 8.0, 5.0, 6.0, 4.0, 2.0, 8.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01169586181640625, -0.011237263679504395, -0.010778665542602539, -0.010320067405700684, -0.009861469268798828, -0.009402871131896973, -0.008944272994995117, -0.008485674858093262, -0.008027076721191406, -0.007568478584289551, -0.007109880447387695, -0.00665128231048584, -0.006192684173583984, -0.005734086036682129, -0.0052754878997802734, -0.004816889762878418, -0.0043582916259765625, -0.003899693489074707, -0.0034410953521728516, -0.002982497215270996, -0.0025238990783691406, -0.002065300941467285, -0.0016067028045654297, -0.0011481046676635742, -0.0006895065307617188, -0.00023090839385986328, 0.0002276897430419922, 0.0006862878799438477, 0.0011448860168457031, 0.0016034841537475586, 0.002062082290649414, 0.0025206804275512695, 0.002979278564453125, 0.0034378767013549805, 0.003896474838256836, 0.004355072975158691, 0.004813671112060547, 0.005272269248962402, 0.005730867385864258, 0.006189465522766113, 0.006648063659667969, 0.007106661796569824, 0.00756525993347168, 0.008023858070373535, 0.00848245620727539, 0.008941054344177246, 0.009399652481079102, 0.009858250617980957, 0.010316848754882812, 0.010775446891784668, 0.011234045028686523, 0.011692643165588379, 0.012151241302490234, 0.01260983943939209, 0.013068437576293945, 0.0135270357131958, 0.013985633850097656, 0.014444231986999512, 0.014902830123901367, 0.015361428260803223, 0.015820026397705078, 0.016278624534606934, 0.01673722267150879, 0.017195820808410645, 0.0176544189453125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 1001.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21490637958049774, -0.2060028314590454, -0.19709926843643188, -0.18819572031497955, -0.17929217219352722, -0.1703886240720749, -0.16148507595062256, -0.15258151292800903, -0.1436779648065567, -0.13477441668510437, -0.12587085366249084, -0.11696730554103851, -0.10806375741958618, -0.09916020929813385, -0.09025665372610092, -0.081353098154068, -0.07244955003261566, -0.06354600191116333, -0.0546424463391304, -0.04573889449238777, -0.03683534264564514, -0.02793179079890251, -0.01902823895215988, -0.010124687105417252, -0.0012211352586746216, 0.007682416588068008, 0.01658596843481064, 0.02548952028155327, 0.0343930721282959, 0.04329662397503853, 0.05220017582178116, 0.06110372766852379, 0.07000729441642761, 0.07891084253787994, 0.08781439810991287, 0.0967179536819458, 0.10562150180339813, 0.11452504992485046, 0.12342860549688339, 0.13233216106891632, 0.14123570919036865, 0.15013925731182098, 0.15904280543327332, 0.16794636845588684, 0.17684991657733917, 0.1857534646987915, 0.19465702772140503, 0.20356057584285736, 0.2124641239643097, 0.22136767208576202, 0.23027122020721436, 0.23917478322982788, 0.2480783313512802, 0.25698187947273254, 0.26588544249534607, 0.2747889757156372, 0.28369253873825073, 0.29259610176086426, 0.3014996349811554, 0.3104031980037689, 0.31930673122406006, 0.3282102942466736, 0.3371138572692871, 0.34601739048957825, 0.3549209535121918]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 8.0, 8.0, 17.0, 17.0, 14.0, 24.0, 29.0, 37.0, 40.0, 46.0, 56.0, 72.0, 59.0, 43.0, 58.0, 54.0, 64.0, 60.0, 45.0, 44.0, 35.0, 28.0, 31.0, 25.0, 31.0, 19.0, 6.0, 8.0, 8.0, 5.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.025498926639556885, -0.02464284375309944, -0.023786762729287148, -0.022930681705474854, -0.02207459881901741, -0.021218515932559967, -0.020362434908747673, -0.01950635388493538, -0.018650270998477936, -0.017794188112020493, -0.0169381070882082, -0.016082026064395905, -0.015225943177938461, -0.014369861222803593, -0.013513779267668724, -0.012657697312533855, -0.011801615357398987, -0.010945533402264118, -0.01008945144712925, -0.009233369491994381, -0.008377287536859512, -0.007521205581724644, -0.006665123626589775, -0.0058090416714549065, -0.004952959716320038, -0.004096877761185169, -0.0032407958060503006, -0.002384713850915432, -0.0015286318957805634, -0.0006725499406456947, 0.0001835320144891739, 0.0010396139696240425, 0.0018956959247589111, 0.0027517778798937798, 0.0036078598350286484, 0.004463941790163517, 0.005320023745298386, 0.006176105700433254, 0.007032187655568123, 0.007888269610702991, 0.00874435156583786, 0.009600433520972729, 0.010456515476107597, 0.011312597431242466, 0.012168679386377335, 0.013024761341512203, 0.013880843296647072, 0.01473692525178194, 0.015593007206916809, 0.016449090093374252, 0.017305171117186546, 0.01816125214099884, 0.019017335027456284, 0.019873417913913727, 0.02072949893772602, 0.021585579961538315, 0.022441662847995758, 0.0232977457344532, 0.024153826758265495, 0.02500990778207779, 0.025865990668535233, 0.026722073554992676, 0.02757815457880497, 0.028434235602617264, 0.029290318489074707]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 7.0, 9.0, 4.0, 15.0, 18.0, 20.0, 25.0, 37.0, 52.0, 60.0, 98.0, 108.0, 180.0, 203.0, 284.0, 367.0, 553.0, 767.0, 1087.0, 1496.0, 2229.0, 3269.0, 5013.0, 8655.0, 16295.0, 54671.0, 839653.0, 70187.0, 17540.0, 9166.0, 5302.0, 3383.0, 2296.0, 1520.0, 1087.0, 749.0, 545.0, 411.0, 294.0, 231.0, 180.0, 129.0, 90.0, 60.0, 44.0, 45.0, 26.0, 19.0, 22.0, 15.0, 10.0, 11.0, 8.0, 9.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.01184844970703125, -0.011460661888122559, -0.011072874069213867, -0.010685086250305176, -0.010297298431396484, -0.009909510612487793, -0.009521722793579102, -0.00913393497467041, -0.008746147155761719, -0.008358359336853027, -0.007970571517944336, -0.0075827836990356445, -0.007194995880126953, -0.006807208061218262, -0.00641942024230957, -0.006031632423400879, -0.0056438446044921875, -0.005256056785583496, -0.004868268966674805, -0.004480481147766113, -0.004092693328857422, -0.0037049055099487305, -0.003317117691040039, -0.0029293298721313477, -0.0025415420532226562, -0.002153754234313965, -0.0017659664154052734, -0.001378178596496582, -0.0009903907775878906, -0.0006026029586791992, -0.0002148151397705078, 0.0001729726791381836, 0.000560760498046875, 0.0009485483169555664, 0.0013363361358642578, 0.0017241239547729492, 0.0021119117736816406, 0.002499699592590332, 0.0028874874114990234, 0.003275275230407715, 0.0036630630493164062, 0.004050850868225098, 0.004438638687133789, 0.0048264265060424805, 0.005214214324951172, 0.005602002143859863, 0.005989789962768555, 0.006377577781677246, 0.0067653656005859375, 0.007153153419494629, 0.00754094123840332, 0.007928729057312012, 0.008316516876220703, 0.008704304695129395, 0.009092092514038086, 0.009479880332946777, 0.009867668151855469, 0.01025545597076416, 0.010643243789672852, 0.011031031608581543, 0.011418819427490234, 0.011806607246398926, 0.012194395065307617, 0.012582182884216309, 0.012969970703125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 4.0, 4.0, 13.0, 8.0, 9.0, 8.0, 20.0, 57.0, 215.0, 331.0, 162.0, 49.0, 12.0, 12.0, 8.0, 11.0, 11.0, 6.0, 3.0, 3.0, 6.0, 4.0, 1.0, 3.0, 4.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0087432861328125, -0.008449196815490723, -0.008155107498168945, -0.007861018180847168, -0.007566928863525391, -0.007272839546203613, -0.006978750228881836, -0.006684660911560059, -0.006390571594238281, -0.006096482276916504, -0.0058023929595947266, -0.005508303642272949, -0.005214214324951172, -0.0049201250076293945, -0.004626035690307617, -0.00433194637298584, -0.0040378570556640625, -0.003743767738342285, -0.003449678421020508, -0.0031555891036987305, -0.002861499786376953, -0.0025674104690551758, -0.0022733211517333984, -0.001979231834411621, -0.0016851425170898438, -0.0013910531997680664, -0.001096963882446289, -0.0008028745651245117, -0.0005087852478027344, -0.00021469593048095703, 7.939338684082031e-05, 0.00037348270416259766, 0.000667572021484375, 0.0009616613388061523, 0.0012557506561279297, 0.001549839973449707, 0.0018439292907714844, 0.0021380186080932617, 0.002432107925415039, 0.0027261972427368164, 0.0030202865600585938, 0.003314375877380371, 0.0036084651947021484, 0.0039025545120239258, 0.004196643829345703, 0.0044907331466674805, 0.004784822463989258, 0.005078911781311035, 0.0053730010986328125, 0.00566709041595459, 0.005961179733276367, 0.0062552690505981445, 0.006549358367919922, 0.006843447685241699, 0.0071375370025634766, 0.007431626319885254, 0.007725715637207031, 0.008019804954528809, 0.008313894271850586, 0.008607983589172363, 0.00890207290649414, 0.009196162223815918, 0.009490251541137695, 0.009784340858459473, 0.01007843017578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 3.0, 6.0, 14.0, 9.0, 10.0, 16.0, 22.0, 31.0, 36.0, 49.0, 50.0, 58.0, 73.0, 78.0, 116.0, 164.0, 213.0, 343.0, 583.0, 1034.0, 2825.0, 31626.0, 967953.0, 37388.0, 2842.0, 1105.0, 579.0, 315.0, 236.0, 167.0, 136.0, 100.0, 70.0, 55.0, 42.0, 42.0, 35.0, 23.0, 20.0, 17.0, 16.0, 9.0, 8.0, 4.0, 2.0, 9.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0408935546875, -0.03950834274291992, -0.038123130798339844, -0.036737918853759766, -0.03535270690917969, -0.03396749496459961, -0.03258228302001953, -0.031197071075439453, -0.029811859130859375, -0.028426647186279297, -0.02704143524169922, -0.02565622329711914, -0.024271011352539062, -0.022885799407958984, -0.021500587463378906, -0.020115375518798828, -0.01873016357421875, -0.017344951629638672, -0.015959739685058594, -0.014574527740478516, -0.013189315795898438, -0.01180410385131836, -0.010418891906738281, -0.009033679962158203, -0.007648468017578125, -0.006263256072998047, -0.004878044128417969, -0.0034928321838378906, -0.0021076202392578125, -0.0007224082946777344, 0.0006628036499023438, 0.002048015594482422, 0.0034332275390625, 0.004818439483642578, 0.006203651428222656, 0.007588863372802734, 0.008974075317382812, 0.01035928726196289, 0.011744499206542969, 0.013129711151123047, 0.014514923095703125, 0.015900135040283203, 0.01728534698486328, 0.01867055892944336, 0.020055770874023438, 0.021440982818603516, 0.022826194763183594, 0.024211406707763672, 0.02559661865234375, 0.026981830596923828, 0.028367042541503906, 0.029752254486083984, 0.031137466430664062, 0.03252267837524414, 0.03390789031982422, 0.0352931022644043, 0.036678314208984375, 0.03806352615356445, 0.03944873809814453, 0.04083395004272461, 0.04221916198730469, 0.043604373931884766, 0.044989585876464844, 0.04637479782104492, 0.047760009765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 5.0, 4.0, 9.0, 9.0, 14.0, 21.0, 20.0, 20.0, 31.0, 26.0, 29.0, 28.0, 36.0, 32.0, 35.0, 46.0, 26.0, 48.0, 55.0, 32.0, 43.0, 31.0, 35.0, 41.0, 39.0, 32.0, 31.0, 30.0, 28.0, 22.0, 10.0, 13.0, 16.0, 18.0, 14.0, 9.0, 12.0, 11.0, 6.0, 4.0, 4.0, 2.0, 8.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0235137939453125, -0.022716522216796875, -0.02191925048828125, -0.021121978759765625, -0.02032470703125, -0.019527435302734375, -0.01873016357421875, -0.017932891845703125, -0.0171356201171875, -0.016338348388671875, -0.01554107666015625, -0.014743804931640625, -0.013946533203125, -0.013149261474609375, -0.01235198974609375, -0.011554718017578125, -0.0107574462890625, -0.009960174560546875, -0.00916290283203125, -0.008365631103515625, -0.007568359375, -0.006771087646484375, -0.00597381591796875, -0.005176544189453125, -0.0043792724609375, -0.003582000732421875, -0.00278472900390625, -0.001987457275390625, -0.001190185546875, -0.000392913818359375, 0.00040435791015625, 0.001201629638671875, 0.0019989013671875, 0.002796173095703125, 0.00359344482421875, 0.004390716552734375, 0.00518798828125, 0.005985260009765625, 0.00678253173828125, 0.007579803466796875, 0.0083770751953125, 0.009174346923828125, 0.00997161865234375, 0.010768890380859375, 0.011566162109375, 0.012363433837890625, 0.01316070556640625, 0.013957977294921875, 0.0147552490234375, 0.015552520751953125, 0.01634979248046875, 0.017147064208984375, 0.0179443359375, 0.018741607666015625, 0.01953887939453125, 0.020336151123046875, 0.0211334228515625, 0.021930694580078125, 0.02272796630859375, 0.023525238037109375, 0.024322509765625, 0.025119781494140625, 0.02591705322265625, 0.026714324951171875, 0.0275115966796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 10.0, 7.0, 10.0, 14.0, 15.0, 24.0, 32.0, 58.0, 82.0, 125.0, 248.0, 524.0, 1407.0, 7119.0, 875579.0, 157216.0, 4158.0, 1008.0, 386.0, 179.0, 111.0, 68.0, 36.0, 34.0, 22.0, 10.0, 16.0, 6.0, 8.0, 8.0, 8.0, 2.0, 3.0, 5.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.445148468017578e-05, -3.311969339847565e-05, -3.178790211677551e-05, -3.045611083507538e-05, -2.9124319553375244e-05, -2.779252827167511e-05, -2.6460736989974976e-05, -2.512894570827484e-05, -2.3797154426574707e-05, -2.2465363144874573e-05, -2.113357186317444e-05, -1.9801780581474304e-05, -1.846998929977417e-05, -1.7138198018074036e-05, -1.58064067363739e-05, -1.4474615454673767e-05, -1.3142824172973633e-05, -1.1811032891273499e-05, -1.0479241609573364e-05, -9.14745032787323e-06, -7.815659046173096e-06, -6.4838677644729614e-06, -5.152076482772827e-06, -3.820285201072693e-06, -2.4884939193725586e-06, -1.1567026376724243e-06, 1.7508864402770996e-07, 1.5068799257278442e-06, 2.8386712074279785e-06, 4.170462489128113e-06, 5.502253770828247e-06, 6.834045052528381e-06, 8.165836334228516e-06, 9.49762761592865e-06, 1.0829418897628784e-05, 1.2161210179328918e-05, 1.3493001461029053e-05, 1.4824792742729187e-05, 1.615658402442932e-05, 1.7488375306129456e-05, 1.882016658782959e-05, 2.0151957869529724e-05, 2.148374915122986e-05, 2.2815540432929993e-05, 2.4147331714630127e-05, 2.547912299633026e-05, 2.6810914278030396e-05, 2.814270555973053e-05, 2.9474496841430664e-05, 3.08062881231308e-05, 3.213807940483093e-05, 3.346987068653107e-05, 3.48016619682312e-05, 3.6133453249931335e-05, 3.746524453163147e-05, 3.8797035813331604e-05, 4.012882709503174e-05, 4.146061837673187e-05, 4.279240965843201e-05, 4.412420094013214e-05, 4.5455992221832275e-05, 4.678778350353241e-05, 4.8119574785232544e-05, 4.945136606693268e-05, 5.078315734863281e-05]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 6.0, 12.0, 6.0, 17.0, 8.0, 17.0, 33.0, 22.0, 39.0, 25.0, 74.0, 67.0, 63.0, 88.0, 73.0, 93.0, 58.0, 43.0, 52.0, 19.0, 52.0, 19.0, 19.0, 18.0, 11.0, 13.0, 13.0, 9.0, 7.0, 4.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.602836608886719e-06, -5.448237061500549e-06, -5.29363751411438e-06, -5.1390379667282104e-06, -4.984438419342041e-06, -4.829838871955872e-06, -4.675239324569702e-06, -4.520639777183533e-06, -4.366040229797363e-06, -4.211440682411194e-06, -4.056841135025024e-06, -3.902241587638855e-06, -3.7476420402526855e-06, -3.593042492866516e-06, -3.4384429454803467e-06, -3.2838433980941772e-06, -3.129243850708008e-06, -2.9746443033218384e-06, -2.820044755935669e-06, -2.6654452085494995e-06, -2.51084566116333e-06, -2.3562461137771606e-06, -2.201646566390991e-06, -2.0470470190048218e-06, -1.8924474716186523e-06, -1.737847924232483e-06, -1.5832483768463135e-06, -1.428648829460144e-06, -1.2740492820739746e-06, -1.1194497346878052e-06, -9.648501873016357e-07, -8.102506399154663e-07, -6.556510925292969e-07, -5.010515451431274e-07, -3.46451997756958e-07, -1.9185245037078857e-07, -3.725290298461914e-08, 1.1734664440155029e-07, 2.7194619178771973e-07, 4.2654573917388916e-07, 5.811452865600586e-07, 7.35744833946228e-07, 8.903443813323975e-07, 1.044943928718567e-06, 1.1995434761047363e-06, 1.3541430234909058e-06, 1.5087425708770752e-06, 1.6633421182632446e-06, 1.817941665649414e-06, 1.9725412130355835e-06, 2.127140760421753e-06, 2.2817403078079224e-06, 2.436339855194092e-06, 2.5909394025802612e-06, 2.7455389499664307e-06, 2.9001384973526e-06, 3.0547380447387695e-06, 3.209337592124939e-06, 3.3639371395111084e-06, 3.518536686897278e-06, 3.6731362342834473e-06, 3.827735781669617e-06, 3.982335329055786e-06, 4.1369348764419556e-06, 4.291534423828125e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 10.0, 8.0, 8.0, 22.0, 27.0, 36.0, 89.0, 121.0, 229.0, 711.0, 4777.0, 1033941.0, 7206.0, 748.0, 266.0, 141.0, 79.0, 41.0, 29.0, 18.0, 10.0, 12.0, 5.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.16908073425293e-05, -5.960371345281601e-05, -5.751661956310272e-05, -5.5429525673389435e-05, -5.334243178367615e-05, -5.125533789396286e-05, -4.916824400424957e-05, -4.7081150114536285e-05, -4.4994056224823e-05, -4.290696233510971e-05, -4.081986844539642e-05, -3.8732774555683136e-05, -3.664568066596985e-05, -3.455858677625656e-05, -3.2471492886543274e-05, -3.0384398996829987e-05, -2.82973051071167e-05, -2.6210211217403412e-05, -2.4123117327690125e-05, -2.2036023437976837e-05, -1.994892954826355e-05, -1.7861835658550262e-05, -1.5774741768836975e-05, -1.3687647879123688e-05, -1.16005539894104e-05, -9.513460099697113e-06, -7.426366209983826e-06, -5.339272320270538e-06, -3.252178430557251e-06, -1.1650845408439636e-06, 9.220093488693237e-07, 3.009103238582611e-06, 5.0961971282958984e-06, 7.183291018009186e-06, 9.270384907722473e-06, 1.135747879743576e-05, 1.3444572687149048e-05, 1.5531666576862335e-05, 1.7618760466575623e-05, 1.970585435628891e-05, 2.1792948246002197e-05, 2.3880042135715485e-05, 2.5967136025428772e-05, 2.805422991514206e-05, 3.0141323804855347e-05, 3.2228417694568634e-05, 3.431551158428192e-05, 3.640260547399521e-05, 3.8489699363708496e-05, 4.0576793253421783e-05, 4.266388714313507e-05, 4.475098103284836e-05, 4.6838074922561646e-05, 4.892516881227493e-05, 5.101226270198822e-05, 5.309935659170151e-05, 5.5186450481414795e-05, 5.727354437112808e-05, 5.936063826084137e-05, 6.144773215055466e-05, 6.353482604026794e-05, 6.562191992998123e-05, 6.770901381969452e-05, 6.97961077094078e-05, 7.18832015991211e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 8.0, 26.0, 26.0, 20.0, 44.0, 78.0, 118.0, 207.0, 153.0, 102.0, 58.0, 39.0, 37.0, 20.0, 12.0, 11.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.759695053100586e-05, -2.6520341634750366e-05, -2.5443732738494873e-05, -2.436712384223938e-05, -2.3290514945983887e-05, -2.2213906049728394e-05, -2.11372971534729e-05, -2.0060688257217407e-05, -1.8984079360961914e-05, -1.790747046470642e-05, -1.6830861568450928e-05, -1.5754252672195435e-05, -1.4677643775939941e-05, -1.3601034879684448e-05, -1.2524425983428955e-05, -1.1447817087173462e-05, -1.0371208190917969e-05, -9.294599294662476e-06, -8.217990398406982e-06, -7.141381502151489e-06, -6.064772605895996e-06, -4.988163709640503e-06, -3.91155481338501e-06, -2.8349459171295166e-06, -1.7583370208740234e-06, -6.817281246185303e-07, 3.948807716369629e-07, 1.471489667892456e-06, 2.5480985641479492e-06, 3.6247074604034424e-06, 4.7013163566589355e-06, 5.777925252914429e-06, 6.854534149169922e-06, 7.931143045425415e-06, 9.007751941680908e-06, 1.0084360837936401e-05, 1.1160969734191895e-05, 1.2237578630447388e-05, 1.3314187526702881e-05, 1.4390796422958374e-05, 1.5467405319213867e-05, 1.654401421546936e-05, 1.7620623111724854e-05, 1.8697232007980347e-05, 1.977384090423584e-05, 2.0850449800491333e-05, 2.1927058696746826e-05, 2.300366759300232e-05, 2.4080276489257812e-05, 2.5156885385513306e-05, 2.62334942817688e-05, 2.7310103178024292e-05, 2.8386712074279785e-05, 2.946332097053528e-05, 3.053992986679077e-05, 3.1616538763046265e-05, 3.269314765930176e-05, 3.376975655555725e-05, 3.4846365451812744e-05, 3.592297434806824e-05, 3.699958324432373e-05, 3.8076192140579224e-05, 3.915280103683472e-05, 4.022940993309021e-05, 4.13060188293457e-05]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 23.0, 79.0, 574.0, 241.0, 59.0, 17.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12260283529758453, -0.11834025382995605, -0.11407766491174698, -0.1098150759935379, -0.10555249452590942, -0.10128991305828094, -0.09702732414007187, -0.09276473522186279, -0.08850215375423431, -0.08423957228660583, -0.07997698336839676, -0.07571439445018768, -0.0714518129825592, -0.06718923151493073, -0.06292664259672165, -0.05866405740380287, -0.054401472210884094, -0.05013888701796532, -0.04587630182504654, -0.04161371663212776, -0.037351131439208984, -0.03308854624629021, -0.02882596105337143, -0.024563375860452652, -0.020300790667533875, -0.016038205474615097, -0.01177562028169632, -0.007513035088777542, -0.0032504498958587646, 0.0010121352970600128, 0.00527472048997879, 0.009537305682897568, 0.013799875974655151, 0.01806246116757393, 0.022325046360492706, 0.026587631553411484, 0.03085021674633026, 0.03511280193924904, 0.039375387132167816, 0.043637972325086594, 0.04790055751800537, 0.05216314271092415, 0.056425727903842926, 0.060688313096761703, 0.06495089828968048, 0.06921347975730896, 0.07347606867551804, 0.07773865759372711, 0.08200123906135559, 0.08626382052898407, 0.09052640944719315, 0.09478899836540222, 0.0990515798330307, 0.10331416130065918, 0.10757675021886826, 0.11183933913707733, 0.11610192060470581, 0.12036450207233429, 0.12462709099054337, 0.12888967990875244, 0.13315226137638092, 0.1374148428440094, 0.14167743921279907, 0.14594002068042755, 0.15020260214805603]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 10.0, 14.0, 17.0, 13.0, 21.0, 35.0, 36.0, 57.0, 58.0, 76.0, 86.0, 85.0, 80.0, 101.0, 47.0, 53.0, 49.0, 39.0, 31.0, 24.0, 17.0, 19.0, 10.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3054198622703552, -0.2963999807834625, -0.28738006949424744, -0.27836018800735474, -0.26934030652046204, -0.26032042503356934, -0.25130051374435425, -0.24228063225746155, -0.23326073586940765, -0.22424083948135376, -0.21522095799446106, -0.20620106160640717, -0.19718116521835327, -0.18816128373146057, -0.17914138734340668, -0.17012149095535278, -0.16110160946846008, -0.1520817130804062, -0.1430618315935135, -0.1340419352054596, -0.1250220537185669, -0.116002157330513, -0.1069822609424591, -0.09796237200498581, -0.08894248306751251, -0.07992259413003922, -0.07090270519256592, -0.061882808804512024, -0.05286291986703873, -0.04384303092956543, -0.034823138266801834, -0.02580324560403824, -0.01678335666656494, -0.007763465866446495, 0.0012564249336719513, 0.010276315733790398, 0.019296206533908844, 0.02831609547138214, 0.03733598813414574, 0.04635588079690933, 0.05537576973438263, 0.06439565867185593, 0.07341554760932922, 0.08243544399738312, 0.09145533293485641, 0.10047522187232971, 0.1094951182603836, 0.1185150071978569, 0.1275348961353302, 0.1365547925233841, 0.1455746740102768, 0.1545945703983307, 0.1636144518852234, 0.17263434827327728, 0.18165424466133118, 0.19067412614822388, 0.19969402253627777, 0.20871391892433167, 0.21773380041122437, 0.22675369679927826, 0.23577359318733215, 0.24479347467422485, 0.25381335616111755, 0.26283326745033264, 0.27185314893722534]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 12.0, 7.0, 12.0, 23.0, 27.0, 31.0, 41.0, 70.0, 93.0, 131.0, 203.0, 371.0, 1133.0, 18583.0, 3843278.0, 320433.0, 7921.0, 607.0, 381.0, 248.0, 176.0, 122.0, 83.0, 70.0, 50.0, 41.0, 29.0, 19.0, 18.0, 9.0, 11.0, 10.0, 10.0, 4.0, 7.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0211639404296875, -0.020406246185302734, -0.01964855194091797, -0.018890857696533203, -0.018133163452148438, -0.017375469207763672, -0.016617774963378906, -0.01586008071899414, -0.015102386474609375, -0.01434469223022461, -0.013586997985839844, -0.012829303741455078, -0.012071609497070312, -0.011313915252685547, -0.010556221008300781, -0.009798526763916016, -0.00904083251953125, -0.008283138275146484, -0.007525444030761719, -0.006767749786376953, -0.0060100555419921875, -0.005252361297607422, -0.004494667053222656, -0.0037369728088378906, -0.002979278564453125, -0.0022215843200683594, -0.0014638900756835938, -0.0007061958312988281, 5.14984130859375e-05, 0.0008091926574707031, 0.0015668869018554688, 0.0023245811462402344, 0.003082275390625, 0.0038399696350097656, 0.004597663879394531, 0.005355358123779297, 0.0061130523681640625, 0.006870746612548828, 0.007628440856933594, 0.00838613510131836, 0.009143829345703125, 0.00990152359008789, 0.010659217834472656, 0.011416912078857422, 0.012174606323242188, 0.012932300567626953, 0.013689994812011719, 0.014447689056396484, 0.01520538330078125, 0.015963077545166016, 0.01672077178955078, 0.017478466033935547, 0.018236160278320312, 0.018993854522705078, 0.019751548767089844, 0.02050924301147461, 0.021266937255859375, 0.02202463150024414, 0.022782325744628906, 0.023540019989013672, 0.024297714233398438, 0.025055408477783203, 0.02581310272216797, 0.026570796966552734, 0.0273284912109375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 5.0, 2.0, 6.0, 11.0, 11.0, 7.0, 5.0, 17.0, 51.0, 147.0, 307.0, 216.0, 90.0, 20.0, 7.0, 10.0, 10.0, 8.0, 10.0, 5.0, 2.0, 4.0, 5.0, 3.0, 3.0, 2.0, 4.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00777435302734375, -0.007497429847717285, -0.00722050666809082, -0.0069435834884643555, -0.006666660308837891, -0.006389737129211426, -0.006112813949584961, -0.005835890769958496, -0.005558967590332031, -0.005282044410705566, -0.0050051212310791016, -0.004728198051452637, -0.004451274871826172, -0.004174351692199707, -0.003897428512573242, -0.0036205053329467773, -0.0033435821533203125, -0.0030666589736938477, -0.002789735794067383, -0.002512812614440918, -0.002235889434814453, -0.0019589662551879883, -0.0016820430755615234, -0.0014051198959350586, -0.0011281967163085938, -0.0008512735366821289, -0.0005743503570556641, -0.0002974271774291992, -2.0503997802734375e-05, 0.00025641918182373047, 0.0005333423614501953, 0.0008102655410766602, 0.001087188720703125, 0.0013641119003295898, 0.0016410350799560547, 0.0019179582595825195, 0.0021948814392089844, 0.0024718046188354492, 0.002748727798461914, 0.003025650978088379, 0.0033025741577148438, 0.0035794973373413086, 0.0038564205169677734, 0.004133343696594238, 0.004410266876220703, 0.004687190055847168, 0.004964113235473633, 0.005241036415100098, 0.0055179595947265625, 0.005794882774353027, 0.006071805953979492, 0.006348729133605957, 0.006625652313232422, 0.006902575492858887, 0.0071794986724853516, 0.007456421852111816, 0.007733345031738281, 0.008010268211364746, 0.008287191390991211, 0.008564114570617676, 0.00884103775024414, 0.009117960929870605, 0.00939488410949707, 0.009671807289123535, 0.00994873046875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 10.0, 12.0, 15.0, 31.0, 29.0, 75.0, 150.0, 411.0, 1848.0, 37173.0, 4148994.0, 4413.0, 662.0, 188.0, 102.0, 38.0, 35.0, 17.0, 11.0, 4.0, 10.0, 12.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043914794921875, -0.04246091842651367, -0.041007041931152344, -0.039553165435791016, -0.03809928894042969, -0.03664541244506836, -0.03519153594970703, -0.0337376594543457, -0.032283782958984375, -0.030829906463623047, -0.02937602996826172, -0.02792215347290039, -0.026468276977539062, -0.025014400482177734, -0.023560523986816406, -0.022106647491455078, -0.02065277099609375, -0.019198894500732422, -0.017745018005371094, -0.016291141510009766, -0.014837265014648438, -0.01338338851928711, -0.011929512023925781, -0.010475635528564453, -0.009021759033203125, -0.007567882537841797, -0.006114006042480469, -0.004660129547119141, -0.0032062530517578125, -0.0017523765563964844, -0.00029850006103515625, 0.0011553764343261719, 0.0026092529296875, 0.004063129425048828, 0.005517005920410156, 0.006970882415771484, 0.008424758911132812, 0.00987863540649414, 0.011332511901855469, 0.012786388397216797, 0.014240264892578125, 0.015694141387939453, 0.01714801788330078, 0.01860189437866211, 0.020055770874023438, 0.021509647369384766, 0.022963523864746094, 0.024417400360107422, 0.02587127685546875, 0.027325153350830078, 0.028779029846191406, 0.030232906341552734, 0.03168678283691406, 0.03314065933227539, 0.03459453582763672, 0.03604841232299805, 0.037502288818359375, 0.0389561653137207, 0.04041004180908203, 0.04186391830444336, 0.04331779479980469, 0.044771671295166016, 0.046225547790527344, 0.04767942428588867, 0.04913330078125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 21.0, 49.0, 101.0, 293.0, 1532.0, 1495.0, 319.0, 115.0, 61.0, 21.0, 11.0, 7.0, 8.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.016082763671875, -0.015659451484680176, -0.015236139297485352, -0.014812827110290527, -0.014389514923095703, -0.013966202735900879, -0.013542890548706055, -0.01311957836151123, -0.012696266174316406, -0.012272953987121582, -0.011849641799926758, -0.011426329612731934, -0.01100301742553711, -0.010579705238342285, -0.010156393051147461, -0.009733080863952637, -0.009309768676757812, -0.008886456489562988, -0.008463144302368164, -0.00803983211517334, -0.007616519927978516, -0.007193207740783691, -0.006769895553588867, -0.006346583366394043, -0.005923271179199219, -0.0054999589920043945, -0.00507664680480957, -0.004653334617614746, -0.004230022430419922, -0.0038067102432250977, -0.0033833980560302734, -0.0029600858688354492, -0.002536773681640625, -0.0021134614944458008, -0.0016901493072509766, -0.0012668371200561523, -0.0008435249328613281, -0.0004202127456665039, 3.0994415283203125e-06, 0.00042641162872314453, 0.0008497238159179688, 0.001273036003112793, 0.0016963481903076172, 0.0021196603775024414, 0.0025429725646972656, 0.00296628475189209, 0.003389596939086914, 0.0038129091262817383, 0.0042362213134765625, 0.004659533500671387, 0.005082845687866211, 0.005506157875061035, 0.005929470062255859, 0.006352782249450684, 0.006776094436645508, 0.007199406623840332, 0.007622718811035156, 0.00804603099822998, 0.008469343185424805, 0.008892655372619629, 0.009315967559814453, 0.009739279747009277, 0.010162591934204102, 0.010585904121398926, 0.01100921630859375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 970.0, 34.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15761198103427887, -0.153827503323555, -0.15004302561283112, -0.14625854790210724, -0.14247405529022217, -0.1386895775794983, -0.13490509986877441, -0.13112062215805054, -0.12733614444732666, -0.12355166673660278, -0.1197671890258789, -0.11598270386457443, -0.11219822615385056, -0.10841374844312668, -0.1046292632818222, -0.10084478557109833, -0.09706030786037445, -0.09327583014965057, -0.0894913524389267, -0.08570686727762222, -0.08192238956689835, -0.07813791185617447, -0.07435342669487, -0.07056894898414612, -0.06678447127342224, -0.06299999356269836, -0.05921551212668419, -0.05543103069067001, -0.051646552979946136, -0.04786207526922226, -0.044077593833208084, -0.04029311239719391, -0.03650863468647003, -0.032724156975746155, -0.02893967553973198, -0.025155195966362953, -0.021370716392993927, -0.0175862368196249, -0.013801757246255875, -0.010017277672886848, -0.006232798099517822, -0.002448318526148796, 0.00133616104722023, 0.005120640620589256, 0.008905120193958282, 0.012689599767327309, 0.016474079340696335, 0.02025855891406536, 0.024043038487434387, 0.027827518060803413, 0.03161199763417244, 0.035396479070186615, 0.03918095678091049, 0.04296543449163437, 0.046749915927648544, 0.05053439736366272, 0.0543188750743866, 0.058103352785110474, 0.06188783422112465, 0.06567231565713882, 0.0694567933678627, 0.07324127107858658, 0.07702575623989105, 0.08081023395061493, 0.0845947116613388]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 8.0, 10.0, 12.0, 20.0, 20.0, 23.0, 30.0, 40.0, 51.0, 43.0, 48.0, 57.0, 41.0, 61.0, 56.0, 45.0, 39.0, 41.0, 46.0, 33.0, 44.0, 27.0, 23.0, 28.0, 33.0, 22.0, 17.0, 12.0, 12.0, 10.0, 9.0, 11.0, 5.0, 5.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.03274601697921753, -0.03188027814030647, -0.031014541164040565, -0.030148804187774658, -0.0292830653488636, -0.028417326509952545, -0.027551589533686638, -0.02668585255742073, -0.025820113718509674, -0.024954374879598618, -0.02408863790333271, -0.023222900927066803, -0.022357162088155746, -0.02149142324924469, -0.020625686272978783, -0.019759949296712875, -0.01889421045780182, -0.018028471618890762, -0.017162734642624855, -0.016296997666358948, -0.015431258827447891, -0.01456552091985941, -0.013699783012270927, -0.012834045104682446, -0.011968307197093964, -0.011102569289505482, -0.010236831381917, -0.009371093474328518, -0.008505355566740036, -0.007639617659151554, -0.006773879751563072, -0.00590814184397459, -0.005042403936386108, -0.0041766660287976265, -0.0033109281212091446, -0.0024451902136206627, -0.0015794523060321808, -0.0007137143984436989, 0.00015202350914478302, 0.001017761416733265, 0.0018834993243217468, 0.0027492372319102287, 0.0036149751394987106, 0.0044807130470871925, 0.0053464509546756744, 0.006212188862264156, 0.007077926769852638, 0.00794366467744112, 0.008809402585029602, 0.009675140492618084, 0.010540878400206566, 0.011406616307795048, 0.01227235421538353, 0.013138092122972012, 0.014003830030560493, 0.014869567938148975, 0.015735305845737457, 0.016601044684648514, 0.01746678166091442, 0.01833251863718033, 0.019198257476091385, 0.02006399631500244, 0.02092973329126835, 0.021795470267534256, 0.022661209106445312]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 8.0, 5.0, 9.0, 10.0, 11.0, 21.0, 19.0, 34.0, 42.0, 70.0, 100.0, 129.0, 173.0, 232.0, 356.0, 519.0, 810.0, 1174.0, 1791.0, 2821.0, 4616.0, 8240.0, 17087.0, 68515.0, 858691.0, 48504.0, 14967.0, 7562.0, 4177.0, 2668.0, 1672.0, 1153.0, 743.0, 491.0, 344.0, 245.0, 143.0, 125.0, 81.0, 55.0, 40.0, 28.0, 24.0, 11.0, 5.0, 12.0, 5.0, 8.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.01500701904296875, -0.014571070671081543, -0.014135122299194336, -0.013699173927307129, -0.013263225555419922, -0.012827277183532715, -0.012391328811645508, -0.0119553804397583, -0.011519432067871094, -0.011083483695983887, -0.01064753532409668, -0.010211586952209473, -0.009775638580322266, -0.009339690208435059, -0.008903741836547852, -0.008467793464660645, -0.008031845092773438, -0.0075958967208862305, -0.0071599483489990234, -0.006723999977111816, -0.006288051605224609, -0.005852103233337402, -0.005416154861450195, -0.004980206489562988, -0.004544258117675781, -0.004108309745788574, -0.003672361373901367, -0.00323641300201416, -0.002800464630126953, -0.002364516258239746, -0.001928567886352539, -0.001492619514465332, -0.001056671142578125, -0.000620722770690918, -0.00018477439880371094, 0.0002511739730834961, 0.0006871223449707031, 0.0011230707168579102, 0.0015590190887451172, 0.0019949674606323242, 0.0024309158325195312, 0.0028668642044067383, 0.0033028125762939453, 0.0037387609481811523, 0.004174709320068359, 0.004610657691955566, 0.0050466060638427734, 0.0054825544357299805, 0.0059185028076171875, 0.0063544511795043945, 0.0067903995513916016, 0.007226347923278809, 0.007662296295166016, 0.008098244667053223, 0.00853419303894043, 0.008970141410827637, 0.009406089782714844, 0.00984203815460205, 0.010277986526489258, 0.010713934898376465, 0.011149883270263672, 0.011585831642150879, 0.012021780014038086, 0.012457728385925293, 0.0128936767578125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 7.0, 6.0, 1.0, 4.0, 13.0, 11.0, 8.0, 4.0, 16.0, 48.0, 146.0, 309.0, 219.0, 85.0, 25.0, 6.0, 10.0, 11.0, 8.0, 9.0, 6.0, 2.0, 4.0, 5.0, 2.0, 4.0, 2.0, 4.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0077667236328125, -0.0074901580810546875, -0.007213592529296875, -0.0069370269775390625, -0.00666046142578125, -0.0063838958740234375, -0.006107330322265625, -0.0058307647705078125, -0.00555419921875, -0.0052776336669921875, -0.005001068115234375, -0.0047245025634765625, -0.00444793701171875, -0.0041713714599609375, -0.003894805908203125, -0.0036182403564453125, -0.0033416748046875, -0.0030651092529296875, -0.002788543701171875, -0.0025119781494140625, -0.00223541259765625, -0.0019588470458984375, -0.001682281494140625, -0.0014057159423828125, -0.001129150390625, -0.0008525848388671875, -0.000576019287109375, -0.0002994537353515625, -2.288818359375e-05, 0.0002536773681640625, 0.000530242919921875, 0.0008068084716796875, 0.0010833740234375, 0.0013599395751953125, 0.001636505126953125, 0.0019130706787109375, 0.00218963623046875, 0.0024662017822265625, 0.002742767333984375, 0.0030193328857421875, 0.0032958984375, 0.0035724639892578125, 0.003849029541015625, 0.0041255950927734375, 0.00440216064453125, 0.0046787261962890625, 0.004955291748046875, 0.0052318572998046875, 0.0055084228515625, 0.0057849884033203125, 0.006061553955078125, 0.0063381195068359375, 0.00661468505859375, 0.0068912506103515625, 0.007167816162109375, 0.0074443817138671875, 0.007720947265625, 0.007997512817382812, 0.008274078369140625, 0.008550643920898438, 0.00882720947265625, 0.009103775024414062, 0.009380340576171875, 0.009656906127929688, 0.0099334716796875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 8.0, 5.0, 11.0, 14.0, 14.0, 14.0, 19.0, 28.0, 31.0, 37.0, 46.0, 63.0, 67.0, 66.0, 118.0, 142.0, 191.0, 250.0, 437.0, 661.0, 1510.0, 8531.0, 821542.0, 206649.0, 4836.0, 1209.0, 634.0, 348.0, 260.0, 162.0, 116.0, 96.0, 100.0, 56.0, 34.0, 43.0, 37.0, 28.0, 36.0, 22.0, 16.0, 20.0, 10.0, 4.0, 7.0, 6.0, 7.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.03973388671875, -0.03852558135986328, -0.03731727600097656, -0.036108970642089844, -0.034900665283203125, -0.033692359924316406, -0.03248405456542969, -0.03127574920654297, -0.03006744384765625, -0.02885913848876953, -0.027650833129882812, -0.026442527770996094, -0.025234222412109375, -0.024025917053222656, -0.022817611694335938, -0.02160930633544922, -0.0204010009765625, -0.01919269561767578, -0.017984390258789062, -0.016776084899902344, -0.015567779541015625, -0.014359474182128906, -0.013151168823242188, -0.011942863464355469, -0.01073455810546875, -0.009526252746582031, -0.008317947387695312, -0.007109642028808594, -0.005901336669921875, -0.004693031311035156, -0.0034847259521484375, -0.0022764205932617188, -0.001068115234375, 0.00014019012451171875, 0.0013484954833984375, 0.0025568008422851562, 0.003765106201171875, 0.004973411560058594, 0.0061817169189453125, 0.007390022277832031, 0.00859832763671875, 0.009806632995605469, 0.011014938354492188, 0.012223243713378906, 0.013431549072265625, 0.014639854431152344, 0.015848159790039062, 0.01705646514892578, 0.0182647705078125, 0.01947307586669922, 0.020681381225585938, 0.021889686584472656, 0.023097991943359375, 0.024306297302246094, 0.025514602661132812, 0.02672290802001953, 0.02793121337890625, 0.02913951873779297, 0.030347824096679688, 0.031556129455566406, 0.032764434814453125, 0.033972740173339844, 0.03518104553222656, 0.03638935089111328, 0.03759765625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 7.0, 9.0, 9.0, 7.0, 10.0, 13.0, 14.0, 12.0, 21.0, 28.0, 21.0, 23.0, 24.0, 33.0, 33.0, 27.0, 52.0, 39.0, 30.0, 45.0, 38.0, 32.0, 32.0, 33.0, 32.0, 31.0, 24.0, 33.0, 30.0, 33.0, 36.0, 26.0, 10.0, 28.0, 20.0, 14.0, 20.0, 13.0, 11.0, 13.0, 7.0, 4.0, 5.0, 4.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0235443115234375, -0.02282881736755371, -0.022113323211669922, -0.021397829055786133, -0.020682334899902344, -0.019966840744018555, -0.019251346588134766, -0.018535852432250977, -0.017820358276367188, -0.0171048641204834, -0.01638936996459961, -0.01567387580871582, -0.014958381652832031, -0.014242887496948242, -0.013527393341064453, -0.012811899185180664, -0.012096405029296875, -0.011380910873413086, -0.010665416717529297, -0.009949922561645508, -0.009234428405761719, -0.00851893424987793, -0.007803440093994141, -0.0070879459381103516, -0.0063724517822265625, -0.0056569576263427734, -0.004941463470458984, -0.004225969314575195, -0.0035104751586914062, -0.002794981002807617, -0.002079486846923828, -0.001363992691040039, -0.00064849853515625, 6.699562072753906e-05, 0.0007824897766113281, 0.0014979839324951172, 0.0022134780883789062, 0.0029289722442626953, 0.0036444664001464844, 0.0043599605560302734, 0.0050754547119140625, 0.0057909488677978516, 0.006506443023681641, 0.00722193717956543, 0.007937431335449219, 0.008652925491333008, 0.009368419647216797, 0.010083913803100586, 0.010799407958984375, 0.011514902114868164, 0.012230396270751953, 0.012945890426635742, 0.013661384582519531, 0.01437687873840332, 0.01509237289428711, 0.0158078670501709, 0.016523361206054688, 0.017238855361938477, 0.017954349517822266, 0.018669843673706055, 0.019385337829589844, 0.020100831985473633, 0.020816326141357422, 0.02153182029724121, 0.022247314453125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 8.0, 15.0, 15.0, 23.0, 28.0, 45.0, 57.0, 91.0, 179.0, 306.0, 711.0, 2035.0, 9988.0, 169467.0, 844383.0, 16650.0, 2806.0, 839.0, 348.0, 238.0, 120.0, 69.0, 41.0, 30.0, 22.0, 5.0, 9.0, 8.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5497207641601562e-05, -1.5014782547950745e-05, -1.4532357454299927e-05, -1.4049932360649109e-05, -1.3567507266998291e-05, -1.3085082173347473e-05, -1.2602657079696655e-05, -1.2120231986045837e-05, -1.163780689239502e-05, -1.1155381798744202e-05, -1.0672956705093384e-05, -1.0190531611442566e-05, -9.708106517791748e-06, -9.22568142414093e-06, -8.743256330490112e-06, -8.260831236839294e-06, -7.778406143188477e-06, -7.295981049537659e-06, -6.813555955886841e-06, -6.331130862236023e-06, -5.848705768585205e-06, -5.366280674934387e-06, -4.883855581283569e-06, -4.4014304876327515e-06, -3.919005393981934e-06, -3.4365803003311157e-06, -2.954155206680298e-06, -2.47173011302948e-06, -1.989305019378662e-06, -1.5068799257278442e-06, -1.0244548320770264e-06, -5.420297384262085e-07, -5.960464477539063e-08, 4.2282044887542725e-07, 9.052455425262451e-07, 1.387670636177063e-06, 1.8700957298278809e-06, 2.3525208234786987e-06, 2.8349459171295166e-06, 3.3173710107803345e-06, 3.7997961044311523e-06, 4.28222119808197e-06, 4.764646291732788e-06, 5.247071385383606e-06, 5.729496479034424e-06, 6.211921572685242e-06, 6.6943466663360596e-06, 7.1767717599868774e-06, 7.659196853637695e-06, 8.141621947288513e-06, 8.624047040939331e-06, 9.106472134590149e-06, 9.588897228240967e-06, 1.0071322321891785e-05, 1.0553747415542603e-05, 1.103617250919342e-05, 1.1518597602844238e-05, 1.2001022696495056e-05, 1.2483447790145874e-05, 1.2965872883796692e-05, 1.344829797744751e-05, 1.3930723071098328e-05, 1.4413148164749146e-05, 1.4895573258399963e-05, 1.537799835205078e-05]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 10.0, 12.0, 19.0, 26.0, 24.0, 44.0, 40.0, 86.0, 63.0, 65.0, 124.0, 76.0, 87.0, 91.0, 44.0, 49.0, 29.0, 25.0, 13.0, 22.0, 13.0, 5.0, 10.0, 7.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.066394805908203e-06, -4.852190613746643e-06, -4.637986421585083e-06, -4.423782229423523e-06, -4.209578037261963e-06, -3.995373845100403e-06, -3.7811696529388428e-06, -3.5669654607772827e-06, -3.3527612686157227e-06, -3.1385570764541626e-06, -2.9243528842926025e-06, -2.7101486921310425e-06, -2.4959444999694824e-06, -2.2817403078079224e-06, -2.0675361156463623e-06, -1.8533319234848022e-06, -1.6391277313232422e-06, -1.4249235391616821e-06, -1.210719347000122e-06, -9.96515154838562e-07, -7.82310962677002e-07, -5.681067705154419e-07, -3.5390257835388184e-07, -1.3969838619232178e-07, 7.450580596923828e-08, 2.8870999813079834e-07, 5.029141902923584e-07, 7.171183824539185e-07, 9.313225746154785e-07, 1.1455267667770386e-06, 1.3597309589385986e-06, 1.5739351511001587e-06, 1.7881393432617188e-06, 2.002343535423279e-06, 2.216547727584839e-06, 2.430751919746399e-06, 2.644956111907959e-06, 2.859160304069519e-06, 3.073364496231079e-06, 3.287568688392639e-06, 3.5017728805541992e-06, 3.7159770727157593e-06, 3.930181264877319e-06, 4.144385457038879e-06, 4.3585896492004395e-06, 4.5727938413619995e-06, 4.7869980335235596e-06, 5.00120222568512e-06, 5.21540641784668e-06, 5.42961061000824e-06, 5.6438148021698e-06, 5.85801899433136e-06, 6.07222318649292e-06, 6.28642737865448e-06, 6.50063157081604e-06, 6.7148357629776e-06, 6.92903995513916e-06, 7.14324414730072e-06, 7.35744833946228e-06, 7.57165253162384e-06, 7.7858567237854e-06, 8.00006091594696e-06, 8.21426510810852e-06, 8.42846930027008e-06, 8.64267349243164e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 9.0, 9.0, 12.0, 11.0, 18.0, 29.0, 47.0, 109.0, 308.0, 1712.0, 1036926.0, 8449.0, 568.0, 164.0, 84.0, 31.0, 19.0, 15.0, 10.0, 7.0, 4.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.039308547973633e-05, -6.836559623479843e-05, -6.633810698986053e-05, -6.431061774492264e-05, -6.228312849998474e-05, -6.0255639255046844e-05, -5.822815001010895e-05, -5.620066076517105e-05, -5.4173171520233154e-05, -5.214568227529526e-05, -5.011819303035736e-05, -4.8090703785419464e-05, -4.606321454048157e-05, -4.403572529554367e-05, -4.2008236050605774e-05, -3.998074680566788e-05, -3.795325756072998e-05, -3.5925768315792084e-05, -3.389827907085419e-05, -3.187078982591629e-05, -2.9843300580978394e-05, -2.7815811336040497e-05, -2.57883220911026e-05, -2.3760832846164703e-05, -2.1733343601226807e-05, -1.970585435628891e-05, -1.7678365111351013e-05, -1.5650875866413116e-05, -1.362338662147522e-05, -1.1595897376537323e-05, -9.568408131599426e-06, -7.5409188866615295e-06, -5.513429641723633e-06, -3.485940396785736e-06, -1.4584511518478394e-06, 5.690380930900574e-07, 2.596527338027954e-06, 4.624016582965851e-06, 6.6515058279037476e-06, 8.678995072841644e-06, 1.0706484317779541e-05, 1.2733973562717438e-05, 1.4761462807655334e-05, 1.678895205259323e-05, 1.8816441297531128e-05, 2.0843930542469025e-05, 2.287141978740692e-05, 2.4898909032344818e-05, 2.6926398277282715e-05, 2.895388752222061e-05, 3.098137676715851e-05, 3.3008866012096405e-05, 3.50363552570343e-05, 3.70638445019722e-05, 3.9091333746910095e-05, 4.111882299184799e-05, 4.314631223678589e-05, 4.5173801481723785e-05, 4.720129072666168e-05, 4.922877997159958e-05, 5.1256269216537476e-05, 5.328375846147537e-05, 5.531124770641327e-05, 5.7338736951351166e-05, 5.936622619628906e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 6.0, 6.0, 2.0, 5.0, 16.0, 15.0, 42.0, 75.0, 144.0, 306.0, 177.0, 106.0, 48.0, 17.0, 14.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-05, -4.0617771446704865e-05, -3.951229155063629e-05, -3.840681165456772e-05, -3.7301331758499146e-05, -3.619585186243057e-05, -3.5090371966362e-05, -3.3984892070293427e-05, -3.2879412174224854e-05, -3.177393227815628e-05, -3.066845238208771e-05, -2.9562972486019135e-05, -2.845749258995056e-05, -2.735201269388199e-05, -2.6246532797813416e-05, -2.5141052901744843e-05, -2.403557300567627e-05, -2.2930093109607697e-05, -2.1824613213539124e-05, -2.071913331747055e-05, -1.9613653421401978e-05, -1.8508173525333405e-05, -1.740269362926483e-05, -1.629721373319626e-05, -1.5191733837127686e-05, -1.4086253941059113e-05, -1.298077404499054e-05, -1.1875294148921967e-05, -1.0769814252853394e-05, -9.66433435678482e-06, -8.558854460716248e-06, -7.4533745646476746e-06, -6.3478946685791016e-06, -5.2424147725105286e-06, -4.1369348764419556e-06, -3.0314549803733826e-06, -1.9259750843048096e-06, -8.204951882362366e-07, 2.849847078323364e-07, 1.3904646039009094e-06, 2.4959444999694824e-06, 3.6014243960380554e-06, 4.706904292106628e-06, 5.812384188175201e-06, 6.917864084243774e-06, 8.023343980312347e-06, 9.12882387638092e-06, 1.0234303772449493e-05, 1.1339783668518066e-05, 1.244526356458664e-05, 1.3550743460655212e-05, 1.4656223356723785e-05, 1.576170325279236e-05, 1.686718314886093e-05, 1.7972663044929504e-05, 1.9078142940998077e-05, 2.018362283706665e-05, 2.1289102733135223e-05, 2.2394582629203796e-05, 2.350006252527237e-05, 2.4605542421340942e-05, 2.5711022317409515e-05, 2.681650221347809e-05, 2.792198210954666e-05, 2.9027462005615234e-05]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 10.0, 21.0, 34.0, 137.0, 496.0, 199.0, 68.0, 16.0, 10.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06408916413784027, -0.06138811260461807, -0.058687061071395874, -0.055986013263463974, -0.053284961730241776, -0.05058391019701958, -0.04788286238908768, -0.04518181085586548, -0.04248075932264328, -0.03977970778942108, -0.03707865625619888, -0.03437760844826698, -0.031676556915044785, -0.028975505381822586, -0.026274455711245537, -0.023573406040668488, -0.02087235450744629, -0.01817130297422409, -0.015470253303647041, -0.012769202701747417, -0.010068152099847794, -0.00736710149794817, -0.004666050896048546, -0.0019650012254714966, 0.0007360503077507019, 0.0034371009096503258, 0.00613815151154995, 0.008839202113449574, 0.011540252715349197, 0.014241303317248821, 0.016942353919148445, 0.019643403589725494, 0.022344455122947693, 0.02504550665616989, 0.02774655632674694, 0.03044760599732399, 0.03314865753054619, 0.03584970906376839, 0.03855075687170029, 0.041251808404922485, 0.043952859938144684, 0.04665391147136688, 0.04935496300458908, 0.05205601081252098, 0.05475706234574318, 0.05745811387896538, 0.06015916168689728, 0.06286021322011948, 0.06556126475334167, 0.06826231628656387, 0.07096336781978607, 0.07366441935300827, 0.07636547088623047, 0.07906651496887207, 0.08176756650209427, 0.08446861803531647, 0.08716966956853867, 0.08987072110176086, 0.09257177263498306, 0.09527282416820526, 0.09797386825084686, 0.10067491978406906, 0.10337597131729126, 0.10607702285051346, 0.10877807438373566]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 7.0, 5.0, 5.0, 6.0, 11.0, 8.0, 14.0, 15.0, 12.0, 16.0, 15.0, 24.0, 34.0, 20.0, 22.0, 44.0, 33.0, 46.0, 45.0, 45.0, 43.0, 52.0, 43.0, 55.0, 42.0, 38.0, 35.0, 42.0, 28.0, 29.0, 18.0, 20.0, 16.0, 17.0, 18.0, 16.0, 11.0, 14.0, 4.0, 7.0, 4.0, 6.0, 5.0, 3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.15168660879135132, -0.14716698229312897, -0.14264734089374542, -0.13812771439552307, -0.13360807299613953, -0.12908844649791718, -0.12456881999969482, -0.12004918605089188, -0.11552955210208893, -0.11100991815328598, -0.10649028420448303, -0.10197065770626068, -0.09745102375745773, -0.09293138980865479, -0.08841176331043243, -0.08389212936162949, -0.07937249541282654, -0.07485286146402359, -0.07033322751522064, -0.06581360101699829, -0.06129396706819534, -0.056774333119392395, -0.052254702895879745, -0.047735072672367096, -0.04321543872356415, -0.0386958047747612, -0.03417617455124855, -0.02965654246509075, -0.025136910378932953, -0.020617278292775154, -0.016097646206617355, -0.011578015983104706, -0.007058382034301758, -0.002538749948143959, 0.0019808821380138397, 0.0065005142241716385, 0.011020146310329437, 0.015539778396487236, 0.020059410482645035, 0.024579040706157684, 0.029098674654960632, 0.03361830860376358, 0.03813793882727623, 0.04265756905078888, 0.04717720299959183, 0.051696836948394775, 0.056216467171907425, 0.060736097395420074, 0.06525573134422302, 0.06977536529302597, 0.07429499924182892, 0.07881462574005127, 0.08333425968885422, 0.08785389363765717, 0.09237352013587952, 0.09689315408468246, 0.10141278803348541, 0.10593242198228836, 0.11045205593109131, 0.11497168242931366, 0.11949131637811661, 0.12401095032691956, 0.1285305768251419, 0.13305020332336426, 0.1375698447227478]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 9.0, 7.0, 18.0, 20.0, 27.0, 23.0, 32.0, 68.0, 556.0, 4603.0, 4161182.0, 25990.0, 1408.0, 80.0, 38.0, 38.0, 41.0, 35.0, 16.0, 15.0, 12.0, 6.0, 10.0, 4.0, 4.0, 1.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0185394287109375, -0.017873287200927734, -0.01720714569091797, -0.016541004180908203, -0.015874862670898438, -0.015208721160888672, -0.014542579650878906, -0.01387643814086914, -0.013210296630859375, -0.01254415512084961, -0.011878013610839844, -0.011211872100830078, -0.010545730590820312, -0.009879589080810547, -0.009213447570800781, -0.008547306060791016, -0.00788116455078125, -0.007215023040771484, -0.006548881530761719, -0.005882740020751953, -0.0052165985107421875, -0.004550457000732422, -0.0038843154907226562, -0.0032181739807128906, -0.002552032470703125, -0.0018858909606933594, -0.0012197494506835938, -0.0005536079406738281, 0.0001125335693359375, 0.0007786750793457031, 0.0014448165893554688, 0.0021109580993652344, 0.002777099609375, 0.0034432411193847656, 0.004109382629394531, 0.004775524139404297, 0.0054416656494140625, 0.006107807159423828, 0.006773948669433594, 0.007440090179443359, 0.008106231689453125, 0.00877237319946289, 0.009438514709472656, 0.010104656219482422, 0.010770797729492188, 0.011436939239501953, 0.012103080749511719, 0.012769222259521484, 0.01343536376953125, 0.014101505279541016, 0.014767646789550781, 0.015433788299560547, 0.016099929809570312, 0.016766071319580078, 0.017432212829589844, 0.01809835433959961, 0.018764495849609375, 0.01943063735961914, 0.020096778869628906, 0.020762920379638672, 0.021429061889648438, 0.022095203399658203, 0.02276134490966797, 0.023427486419677734, 0.0240936279296875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 3.0, 5.0, 13.0, 10.0, 6.0, 6.0, 15.0, 64.0, 139.0, 278.0, 228.0, 95.0, 26.0, 9.0, 8.0, 12.0, 9.0, 9.0, 4.0, 4.0, 3.0, 5.0, 3.0, 4.0, 1.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00760650634765625, -0.007335662841796875, -0.0070648193359375, -0.006793975830078125, -0.00652313232421875, -0.006252288818359375, -0.0059814453125, -0.005710601806640625, -0.00543975830078125, -0.005168914794921875, -0.0048980712890625, -0.004627227783203125, -0.00435638427734375, -0.004085540771484375, -0.003814697265625, -0.003543853759765625, -0.00327301025390625, -0.003002166748046875, -0.0027313232421875, -0.002460479736328125, -0.00218963623046875, -0.001918792724609375, -0.00164794921875, -0.001377105712890625, -0.00110626220703125, -0.000835418701171875, -0.0005645751953125, -0.000293731689453125, -2.288818359375e-05, 0.000247955322265625, 0.000518798828125, 0.000789642333984375, 0.00106048583984375, 0.001331329345703125, 0.0016021728515625, 0.001873016357421875, 0.00214385986328125, 0.002414703369140625, 0.002685546875, 0.002956390380859375, 0.00322723388671875, 0.003498077392578125, 0.0037689208984375, 0.004039764404296875, 0.00431060791015625, 0.004581451416015625, 0.004852294921875, 0.005123138427734375, 0.00539398193359375, 0.005664825439453125, 0.0059356689453125, 0.006206512451171875, 0.00647735595703125, 0.006748199462890625, 0.00701904296875, 0.007289886474609375, 0.00756072998046875, 0.007831573486328125, 0.0081024169921875, 0.008373260498046875, 0.00864410400390625, 0.008914947509765625, 0.009185791015625, 0.009456634521484375, 0.00972747802734375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 14.0, 9.0, 22.0, 38.0, 109.0, 313.0, 1561.0, 70134.0, 4118719.0, 2561.0, 496.0, 159.0, 62.0, 22.0, 15.0, 12.0, 4.0, 5.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02703857421875, -0.02628946304321289, -0.02554035186767578, -0.024791240692138672, -0.024042129516601562, -0.023293018341064453, -0.022543907165527344, -0.021794795989990234, -0.021045684814453125, -0.020296573638916016, -0.019547462463378906, -0.018798351287841797, -0.018049240112304688, -0.017300128936767578, -0.01655101776123047, -0.01580190658569336, -0.01505279541015625, -0.01430368423461914, -0.013554573059082031, -0.012805461883544922, -0.012056350708007812, -0.011307239532470703, -0.010558128356933594, -0.009809017181396484, -0.009059906005859375, -0.008310794830322266, -0.007561683654785156, -0.006812572479248047, -0.0060634613037109375, -0.005314350128173828, -0.004565238952636719, -0.0038161277770996094, -0.0030670166015625, -0.0023179054260253906, -0.0015687942504882812, -0.0008196830749511719, -7.05718994140625e-05, 0.0006785392761230469, 0.0014276504516601562, 0.0021767616271972656, 0.002925872802734375, 0.0036749839782714844, 0.004424095153808594, 0.005173206329345703, 0.0059223175048828125, 0.006671428680419922, 0.007420539855957031, 0.00816965103149414, 0.00891876220703125, 0.00966787338256836, 0.010416984558105469, 0.011166095733642578, 0.011915206909179688, 0.012664318084716797, 0.013413429260253906, 0.014162540435791016, 0.014911651611328125, 0.015660762786865234, 0.016409873962402344, 0.017158985137939453, 0.017908096313476562, 0.018657207489013672, 0.01940631866455078, 0.02015542984008789, 0.020904541015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 11.0, 27.0, 42.0, 108.0, 3207.0, 506.0, 86.0, 40.0, 18.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005298614501953125, -0.005076348781585693, -0.004854083061218262, -0.00463181734085083, -0.0044095516204833984, -0.004187285900115967, -0.003965020179748535, -0.0037427544593811035, -0.003520488739013672, -0.0032982230186462402, -0.0030759572982788086, -0.002853691577911377, -0.0026314258575439453, -0.0024091601371765137, -0.002186894416809082, -0.0019646286964416504, -0.0017423629760742188, -0.0015200972557067871, -0.0012978315353393555, -0.0010755658149719238, -0.0008533000946044922, -0.0006310343742370605, -0.0004087686538696289, -0.00018650293350219727, 3.5762786865234375e-05, 0.000258028507232666, 0.00048029422760009766, 0.0007025599479675293, 0.0009248256683349609, 0.0011470913887023926, 0.0013693571090698242, 0.0015916228294372559, 0.0018138885498046875, 0.002036154270172119, 0.0022584199905395508, 0.0024806857109069824, 0.002702951431274414, 0.0029252171516418457, 0.0031474828720092773, 0.003369748592376709, 0.0035920143127441406, 0.0038142800331115723, 0.004036545753479004, 0.0042588114738464355, 0.004481077194213867, 0.004703342914581299, 0.0049256086349487305, 0.005147874355316162, 0.005370140075683594, 0.005592405796051025, 0.005814671516418457, 0.006036937236785889, 0.00625920295715332, 0.006481468677520752, 0.006703734397888184, 0.006926000118255615, 0.007148265838623047, 0.0073705315589904785, 0.00759279727935791, 0.007815062999725342, 0.008037328720092773, 0.008259594440460205, 0.008481860160827637, 0.008704125881195068, 0.0089263916015625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 6.0, 724.0, 287.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012417360208928585, -0.01033632643520832, -0.008255291730165482, -0.006174257956445217, -0.004093224182724953, -0.0020121904090046883, 6.884429603815079e-05, 0.0021498780697584152, 0.00423091184347868, 0.006311945617198944, 0.008392980322241783, 0.010474014095962048, 0.012555047869682312, 0.014636081643402576, 0.01671711727976799, 0.01879815012216568, 0.02087918296456337, 0.02296021766960621, 0.0250412505120039, 0.027122285217046738, 0.029203318059444427, 0.031284354627132416, 0.033365387469530106, 0.035446420311927795, 0.037527456879615784, 0.039608489722013474, 0.04168952628970146, 0.04377055913209915, 0.04585159197449684, 0.04793262481689453, 0.05001366138458252, 0.05209469422698021, 0.054175734519958496, 0.056256767362356186, 0.058337803930044174, 0.060418836772441864, 0.062499869614839554, 0.06458090245723724, 0.06666193902492523, 0.06874297559261322, 0.07082400470972061, 0.0729050412774086, 0.07498607039451599, 0.07706710696220398, 0.07914814352989197, 0.08122917264699936, 0.08331020921468735, 0.08539124578237534, 0.08747227489948273, 0.08955331146717072, 0.0916343405842781, 0.0937153771519661, 0.09579641371965408, 0.09787744283676147, 0.09995847940444946, 0.10203951597213745, 0.10412055253982544, 0.10620158910751343, 0.10828261822462082, 0.11036365479230881, 0.1124446913599968, 0.11452572047710419, 0.11660675704479218, 0.11868779361248016, 0.12076882272958755]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 13.0, 18.0, 26.0, 29.0, 41.0, 66.0, 66.0, 82.0, 74.0, 75.0, 90.0, 63.0, 68.0, 70.0, 66.0, 35.0, 37.0, 31.0, 21.0, 9.0, 6.0, 9.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.019170522689819336, -0.018626732751727104, -0.018082942813634872, -0.01753915287554264, -0.01699536293745041, -0.016451572999358177, -0.015907783061265945, -0.015363993123173714, -0.014820203185081482, -0.01427641324698925, -0.013732623308897018, -0.013188833370804787, -0.012645043432712555, -0.012101253494620323, -0.011557463556528091, -0.01101367361843586, -0.010469883680343628, -0.009926093742251396, -0.009382303804159164, -0.008838513866066933, -0.008294723927974701, -0.007750933989882469, -0.007207144051790237, -0.006663354113698006, -0.006119564175605774, -0.005575774237513542, -0.00503198429942131, -0.004488194361329079, -0.003944404423236847, -0.003400614485144615, -0.0028568245470523834, -0.0023130346089601517, -0.00176924467086792, -0.0012254547327756882, -0.0006816647946834564, -0.00013787485659122467, 0.0004059150815010071, 0.0009497050195932388, 0.0014934949576854706, 0.0020372848957777023, 0.002581074833869934, 0.003124864771962166, 0.0036686547100543976, 0.004212444648146629, 0.004756234586238861, 0.005300024524331093, 0.005843814462423325, 0.006387604400515556, 0.006931394338607788, 0.00747518427670002, 0.008018974214792252, 0.008562764152884483, 0.009106554090976715, 0.009650344029068947, 0.010194133967161179, 0.01073792390525341, 0.011281713843345642, 0.011825503781437874, 0.012369293719530106, 0.012913083657622337, 0.013456873595714569, 0.0140006635338068, 0.014544453471899033, 0.015088243409991264, 0.015632033348083496]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 8.0, 11.0, 8.0, 12.0, 15.0, 17.0, 14.0, 24.0, 24.0, 41.0, 46.0, 62.0, 81.0, 91.0, 147.0, 174.0, 277.0, 482.0, 905.0, 1729.0, 3570.0, 7843.0, 21900.0, 704514.0, 273239.0, 19255.0, 6944.0, 3187.0, 1637.0, 867.0, 458.0, 276.0, 188.0, 114.0, 75.0, 69.0, 43.0, 42.0, 42.0, 28.0, 27.0, 16.0, 16.0, 14.0, 5.0, 3.0, 6.0, 2.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.015716552734375, -0.015191793441772461, -0.014667034149169922, -0.014142274856567383, -0.013617515563964844, -0.013092756271362305, -0.012567996978759766, -0.012043237686157227, -0.011518478393554688, -0.010993719100952148, -0.01046895980834961, -0.00994420051574707, -0.009419441223144531, -0.008894681930541992, -0.008369922637939453, -0.007845163345336914, -0.007320404052734375, -0.006795644760131836, -0.006270885467529297, -0.005746126174926758, -0.005221366882324219, -0.00469660758972168, -0.004171848297119141, -0.0036470890045166016, -0.0031223297119140625, -0.0025975704193115234, -0.0020728111267089844, -0.0015480518341064453, -0.0010232925415039062, -0.0004985332489013672, 2.6226043701171875e-05, 0.0005509853363037109, 0.00107574462890625, 0.001600503921508789, 0.002125263214111328, 0.002650022506713867, 0.0031747817993164062, 0.0036995410919189453, 0.004224300384521484, 0.0047490596771240234, 0.0052738189697265625, 0.0057985782623291016, 0.006323337554931641, 0.00684809684753418, 0.007372856140136719, 0.007897615432739258, 0.008422374725341797, 0.008947134017944336, 0.009471893310546875, 0.009996652603149414, 0.010521411895751953, 0.011046171188354492, 0.011570930480957031, 0.01209568977355957, 0.01262044906616211, 0.013145208358764648, 0.013669967651367188, 0.014194726943969727, 0.014719486236572266, 0.015244245529174805, 0.015769004821777344, 0.016293764114379883, 0.016818523406982422, 0.01734328269958496, 0.0178680419921875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 2.0, 5.0, 15.0, 9.0, 6.0, 6.0, 18.0, 67.0, 156.0, 287.0, 209.0, 84.0, 23.0, 10.0, 7.0, 14.0, 8.0, 8.0, 4.0, 5.0, 2.0, 6.0, 2.0, 4.0, 1.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0075836181640625, -0.007312655448913574, -0.0070416927337646484, -0.006770730018615723, -0.006499767303466797, -0.006228804588317871, -0.005957841873168945, -0.0056868791580200195, -0.005415916442871094, -0.005144953727722168, -0.004873991012573242, -0.004603028297424316, -0.004332065582275391, -0.004061102867126465, -0.003790140151977539, -0.0035191774368286133, -0.0032482147216796875, -0.0029772520065307617, -0.002706289291381836, -0.00243532657623291, -0.0021643638610839844, -0.0018934011459350586, -0.0016224384307861328, -0.001351475715637207, -0.0010805130004882812, -0.0008095502853393555, -0.0005385875701904297, -0.0002676248550415039, 3.337860107421875e-06, 0.00027430057525634766, 0.0005452632904052734, 0.0008162260055541992, 0.001087188720703125, 0.0013581514358520508, 0.0016291141510009766, 0.0019000768661499023, 0.002171039581298828, 0.002442002296447754, 0.0027129650115966797, 0.0029839277267456055, 0.0032548904418945312, 0.003525853157043457, 0.003796815872192383, 0.004067778587341309, 0.004338741302490234, 0.00460970401763916, 0.004880666732788086, 0.005151629447937012, 0.0054225921630859375, 0.005693554878234863, 0.005964517593383789, 0.006235480308532715, 0.006506443023681641, 0.006777405738830566, 0.007048368453979492, 0.007319331169128418, 0.007590293884277344, 0.00786125659942627, 0.008132219314575195, 0.008403182029724121, 0.008674144744873047, 0.008945107460021973, 0.009216070175170898, 0.009487032890319824, 0.00975799560546875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 4.0, 2.0, 13.0, 14.0, 17.0, 13.0, 20.0, 23.0, 24.0, 43.0, 58.0, 46.0, 62.0, 78.0, 110.0, 135.0, 180.0, 274.0, 450.0, 787.0, 1824.0, 11462.0, 990311.0, 37465.0, 2469.0, 919.0, 517.0, 311.0, 212.0, 159.0, 110.0, 82.0, 65.0, 52.0, 39.0, 40.0, 32.0, 35.0, 17.0, 24.0, 13.0, 8.0, 10.0, 7.0, 11.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0352783203125, -0.03412675857543945, -0.032975196838378906, -0.03182363510131836, -0.030672073364257812, -0.029520511627197266, -0.02836894989013672, -0.027217388153076172, -0.026065826416015625, -0.024914264678955078, -0.02376270294189453, -0.022611141204833984, -0.021459579467773438, -0.02030801773071289, -0.019156455993652344, -0.018004894256591797, -0.01685333251953125, -0.015701770782470703, -0.014550209045410156, -0.01339864730834961, -0.012247085571289062, -0.011095523834228516, -0.009943962097167969, -0.008792400360107422, -0.007640838623046875, -0.006489276885986328, -0.005337715148925781, -0.004186153411865234, -0.0030345916748046875, -0.0018830299377441406, -0.0007314682006835938, 0.0004200935363769531, 0.0015716552734375, 0.002723217010498047, 0.0038747787475585938, 0.005026340484619141, 0.0061779022216796875, 0.007329463958740234, 0.008481025695800781, 0.009632587432861328, 0.010784149169921875, 0.011935710906982422, 0.013087272644042969, 0.014238834381103516, 0.015390396118164062, 0.01654195785522461, 0.017693519592285156, 0.018845081329345703, 0.01999664306640625, 0.021148204803466797, 0.022299766540527344, 0.02345132827758789, 0.024602890014648438, 0.025754451751708984, 0.02690601348876953, 0.028057575225830078, 0.029209136962890625, 0.030360698699951172, 0.03151226043701172, 0.032663822174072266, 0.03381538391113281, 0.03496694564819336, 0.036118507385253906, 0.03727006912231445, 0.038421630859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 7.0, 5.0, 13.0, 7.0, 10.0, 14.0, 12.0, 15.0, 30.0, 17.0, 23.0, 30.0, 40.0, 37.0, 37.0, 35.0, 26.0, 44.0, 38.0, 46.0, 31.0, 44.0, 33.0, 24.0, 48.0, 37.0, 33.0, 37.0, 38.0, 25.0, 21.0, 15.0, 19.0, 16.0, 15.0, 24.0, 3.0, 14.0, 10.0, 5.0, 6.0, 4.0, 7.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0212554931640625, -0.020560741424560547, -0.019865989685058594, -0.01917123794555664, -0.018476486206054688, -0.017781734466552734, -0.01708698272705078, -0.016392230987548828, -0.015697479248046875, -0.015002727508544922, -0.014307975769042969, -0.013613224029541016, -0.012918472290039062, -0.01222372055053711, -0.011528968811035156, -0.010834217071533203, -0.01013946533203125, -0.009444713592529297, -0.008749961853027344, -0.00805521011352539, -0.0073604583740234375, -0.006665706634521484, -0.005970954895019531, -0.005276203155517578, -0.004581451416015625, -0.003886699676513672, -0.0031919479370117188, -0.0024971961975097656, -0.0018024444580078125, -0.0011076927185058594, -0.00041294097900390625, 0.0002818107604980469, 0.0009765625, 0.0016713142395019531, 0.0023660659790039062, 0.0030608177185058594, 0.0037555694580078125, 0.004450321197509766, 0.005145072937011719, 0.005839824676513672, 0.006534576416015625, 0.007229328155517578, 0.007924079895019531, 0.008618831634521484, 0.009313583374023438, 0.01000833511352539, 0.010703086853027344, 0.011397838592529297, 0.01209259033203125, 0.012787342071533203, 0.013482093811035156, 0.01417684555053711, 0.014871597290039062, 0.015566349029541016, 0.01626110076904297, 0.016955852508544922, 0.017650604248046875, 0.018345355987548828, 0.01904010772705078, 0.019734859466552734, 0.020429611206054688, 0.02112436294555664, 0.021819114685058594, 0.022513866424560547, 0.0232086181640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 2.0, 4.0, 8.0, 10.0, 9.0, 17.0, 20.0, 25.0, 43.0, 46.0, 62.0, 139.0, 244.0, 427.0, 753.0, 2751.0, 13727.0, 133467.0, 860111.0, 29893.0, 4464.0, 1067.0, 534.0, 273.0, 125.0, 119.0, 58.0, 38.0, 25.0, 33.0, 18.0, 3.0, 8.0, 6.0, 2.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.1622905731201172e-05, -1.1282972991466522e-05, -1.0943040251731873e-05, -1.0603107511997223e-05, -1.0263174772262573e-05, -9.923242032527924e-06, -9.583309292793274e-06, -9.243376553058624e-06, -8.903443813323975e-06, -8.563511073589325e-06, -8.223578333854675e-06, -7.883645594120026e-06, -7.543712854385376e-06, -7.203780114650726e-06, -6.863847374916077e-06, -6.523914635181427e-06, -6.183981895446777e-06, -5.844049155712128e-06, -5.504116415977478e-06, -5.164183676242828e-06, -4.824250936508179e-06, -4.484318196773529e-06, -4.144385457038879e-06, -3.8044527173042297e-06, -3.46451997756958e-06, -3.1245872378349304e-06, -2.7846544981002808e-06, -2.444721758365631e-06, -2.1047890186309814e-06, -1.7648562788963318e-06, -1.4249235391616821e-06, -1.0849907994270325e-06, -7.450580596923828e-07, -4.0512531995773315e-07, -6.51925802230835e-08, 2.7474015951156616e-07, 6.146728992462158e-07, 9.546056389808655e-07, 1.2945383787155151e-06, 1.6344711184501648e-06, 1.9744038581848145e-06, 2.314336597919464e-06, 2.6542693376541138e-06, 2.9942020773887634e-06, 3.334134817123413e-06, 3.6740675568580627e-06, 4.014000296592712e-06, 4.353933036327362e-06, 4.693865776062012e-06, 5.033798515796661e-06, 5.373731255531311e-06, 5.713663995265961e-06, 6.05359673500061e-06, 6.39352947473526e-06, 6.73346221446991e-06, 7.073394954204559e-06, 7.413327693939209e-06, 7.753260433673859e-06, 8.093193173408508e-06, 8.433125913143158e-06, 8.773058652877808e-06, 9.112991392612457e-06, 9.452924132347107e-06, 9.792856872081757e-06, 1.0132789611816406e-05]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 7.0, 11.0, 9.0, 13.0, 14.0, 46.0, 31.0, 37.0, 82.0, 68.0, 99.0, 105.0, 117.0, 62.0, 69.0, 73.0, 39.0, 47.0, 18.0, 10.0, 12.0, 11.0, 6.0, 4.0, 2.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.271766662597656e-06, -7.068738341331482e-06, -6.865710020065308e-06, -6.662681698799133e-06, -6.459653377532959e-06, -6.256625056266785e-06, -6.05359673500061e-06, -5.850568413734436e-06, -5.647540092468262e-06, -5.444511771202087e-06, -5.241483449935913e-06, -5.038455128669739e-06, -4.8354268074035645e-06, -4.63239848613739e-06, -4.429370164871216e-06, -4.2263418436050415e-06, -4.023313522338867e-06, -3.820285201072693e-06, -3.6172568798065186e-06, -3.4142285585403442e-06, -3.21120023727417e-06, -3.0081719160079956e-06, -2.8051435947418213e-06, -2.602115273475647e-06, -2.3990869522094727e-06, -2.1960586309432983e-06, -1.993030309677124e-06, -1.7900019884109497e-06, -1.5869736671447754e-06, -1.383945345878601e-06, -1.1809170246124268e-06, -9.778887033462524e-07, -7.748603820800781e-07, -5.718320608139038e-07, -3.688037395477295e-07, -1.6577541828155518e-07, 3.725290298461914e-08, 2.4028122425079346e-07, 4.4330954551696777e-07, 6.463378667831421e-07, 8.493661880493164e-07, 1.0523945093154907e-06, 1.255422830581665e-06, 1.4584511518478394e-06, 1.6614794731140137e-06, 1.864507794380188e-06, 2.0675361156463623e-06, 2.2705644369125366e-06, 2.473592758178711e-06, 2.6766210794448853e-06, 2.8796494007110596e-06, 3.082677721977234e-06, 3.285706043243408e-06, 3.4887343645095825e-06, 3.691762685775757e-06, 3.894791007041931e-06, 4.0978193283081055e-06, 4.30084764957428e-06, 4.503875970840454e-06, 4.706904292106628e-06, 4.909932613372803e-06, 5.112960934638977e-06, 5.315989255905151e-06, 5.519017577171326e-06, 5.7220458984375e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 9.0, 21.0, 19.0, 43.0, 57.0, 94.0, 184.0, 594.0, 3890.0, 1039782.0, 2927.0, 484.0, 193.0, 102.0, 46.0, 27.0, 36.0, 13.0, 8.0, 9.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6835670471191406e-05, -3.5585835576057434e-05, -3.433600068092346e-05, -3.308616578578949e-05, -3.183633089065552e-05, -3.0586495995521545e-05, -2.9336661100387573e-05, -2.80868262052536e-05, -2.683699131011963e-05, -2.5587156414985657e-05, -2.4337321519851685e-05, -2.3087486624717712e-05, -2.183765172958374e-05, -2.0587816834449768e-05, -1.9337981939315796e-05, -1.8088147044181824e-05, -1.683831214904785e-05, -1.558847725391388e-05, -1.4338642358779907e-05, -1.3088807463645935e-05, -1.1838972568511963e-05, -1.058913767337799e-05, -9.339302778244019e-06, -8.089467883110046e-06, -6.839632987976074e-06, -5.589798092842102e-06, -4.33996319770813e-06, -3.0901283025741577e-06, -1.8402934074401855e-06, -5.904585123062134e-07, 6.593763828277588e-07, 1.909211277961731e-06, 3.159046173095703e-06, 4.408881068229675e-06, 5.6587159633636475e-06, 6.90855085849762e-06, 8.158385753631592e-06, 9.408220648765564e-06, 1.0658055543899536e-05, 1.1907890439033508e-05, 1.315772533416748e-05, 1.4407560229301453e-05, 1.5657395124435425e-05, 1.6907230019569397e-05, 1.815706491470337e-05, 1.940689980983734e-05, 2.0656734704971313e-05, 2.1906569600105286e-05, 2.3156404495239258e-05, 2.440623939037323e-05, 2.5656074285507202e-05, 2.6905909180641174e-05, 2.8155744075775146e-05, 2.940557897090912e-05, 3.065541386604309e-05, 3.190524876117706e-05, 3.3155083656311035e-05, 3.440491855144501e-05, 3.565475344657898e-05, 3.690458834171295e-05, 3.8154423236846924e-05, 3.9404258131980896e-05, 4.065409302711487e-05, 4.190392792224884e-05, 4.315376281738281e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 11.0, 7.0, 9.0, 18.0, 31.0, 31.0, 58.0, 124.0, 138.0, 267.0, 118.0, 71.0, 41.0, 21.0, 14.0, 13.0, 15.0, 4.0, 8.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0384788513183594e-05, -1.965835690498352e-05, -1.8931925296783447e-05, -1.8205493688583374e-05, -1.74790620803833e-05, -1.6752630472183228e-05, -1.6026198863983154e-05, -1.529976725578308e-05, -1.4573335647583008e-05, -1.3846904039382935e-05, -1.3120472431182861e-05, -1.2394040822982788e-05, -1.1667609214782715e-05, -1.0941177606582642e-05, -1.0214745998382568e-05, -9.488314390182495e-06, -8.761882781982422e-06, -8.035451173782349e-06, -7.309019565582275e-06, -6.582587957382202e-06, -5.856156349182129e-06, -5.129724740982056e-06, -4.403293132781982e-06, -3.676861524581909e-06, -2.950429916381836e-06, -2.2239983081817627e-06, -1.4975666999816895e-06, -7.711350917816162e-07, -4.470348358154297e-08, 6.817281246185303e-07, 1.4081597328186035e-06, 2.1345913410186768e-06, 2.86102294921875e-06, 3.5874545574188232e-06, 4.3138861656188965e-06, 5.04031777381897e-06, 5.766749382019043e-06, 6.493180990219116e-06, 7.2196125984191895e-06, 7.946044206619263e-06, 8.672475814819336e-06, 9.39890742301941e-06, 1.0125339031219482e-05, 1.0851770639419556e-05, 1.1578202247619629e-05, 1.2304633855819702e-05, 1.3031065464019775e-05, 1.3757497072219849e-05, 1.4483928680419922e-05, 1.5210360288619995e-05, 1.593679189682007e-05, 1.666322350502014e-05, 1.7389655113220215e-05, 1.8116086721420288e-05, 1.884251832962036e-05, 1.9568949937820435e-05, 2.0295381546020508e-05, 2.102181315422058e-05, 2.1748244762420654e-05, 2.2474676370620728e-05, 2.32011079788208e-05, 2.3927539587020874e-05, 2.4653971195220947e-05, 2.538040280342102e-05, 2.6106834411621094e-05]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 8.0, 48.0, 735.0, 200.0, 20.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27395039796829224, -0.2670600414276123, -0.26016965508461, -0.25327929854393005, -0.24638892710208893, -0.2394985556602478, -0.23260819911956787, -0.22571782767772675, -0.21882745623588562, -0.2119370847940445, -0.20504672825336456, -0.19815635681152344, -0.1912659853696823, -0.1843756139278412, -0.17748525738716125, -0.17059488594532013, -0.163704514503479, -0.15681414306163788, -0.14992378652095795, -0.14303341507911682, -0.1361430436372757, -0.12925267219543457, -0.12236231565475464, -0.11547194421291351, -0.10858158767223358, -0.10169122368097305, -0.09480085223913193, -0.0879104882478714, -0.08102011680603027, -0.07412975281476974, -0.06723938882350922, -0.06034901738166809, -0.053458645939826965, -0.04656827822327614, -0.03967791050672531, -0.03278754651546478, -0.025897176936268806, -0.01900681108236313, -0.012116443365812302, -0.005226075649261475, 0.0016642920672893524, 0.00855465978384018, 0.015445026569068432, 0.022335393354296684, 0.02922576107084751, 0.03611612692475319, 0.043006494641304016, 0.04989686235785484, 0.05678723007440567, 0.0636775940656662, 0.07056796550750732, 0.07745832949876785, 0.08434870094060898, 0.0912390649318695, 0.09812943637371063, 0.10501980036497116, 0.11191016435623169, 0.11880052834749222, 0.12569089233875275, 0.13258126378059387, 0.139471635222435, 0.14636200666427612, 0.15325236320495605, 0.16014273464679718, 0.1670331060886383]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 7.0, 3.0, 8.0, 6.0, 5.0, 11.0, 10.0, 13.0, 14.0, 19.0, 28.0, 29.0, 37.0, 42.0, 45.0, 50.0, 57.0, 56.0, 62.0, 51.0, 43.0, 48.0, 40.0, 46.0, 35.0, 41.0, 33.0, 38.0, 23.0, 19.0, 20.0, 15.0, 14.0, 8.0, 6.0, 5.0, 3.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16866850852966309, -0.1637195497751236, -0.1587705910205841, -0.15382163226604462, -0.14887267351150513, -0.14392371475696564, -0.13897475600242615, -0.13402581214904785, -0.12907683849334717, -0.12412787973880768, -0.11917892098426819, -0.1142299622297287, -0.10928100347518921, -0.10433204472064972, -0.09938309341669083, -0.09443413466215134, -0.08948518335819244, -0.08453622460365295, -0.07958726584911346, -0.07463830709457397, -0.06968934834003448, -0.064740389585495, -0.0597914382815361, -0.05484247952699661, -0.04989352077245712, -0.04494456201791763, -0.03999560326337814, -0.03504664823412895, -0.030097689479589462, -0.025148730725049973, -0.020199773833155632, -0.015250816941261292, -0.010301858186721802, -0.005352900363504887, -0.0004039425402879715, 0.004545015282928944, 0.009493973106145859, 0.014442931860685349, 0.01939188875257969, 0.02434084564447403, 0.02928980439901352, 0.03423876315355301, 0.0391877219080925, 0.04413667693734169, 0.04908563569188118, 0.05403459444642067, 0.05898354947566986, 0.06393250823020935, 0.06888146698474884, 0.07383042573928833, 0.07877938449382782, 0.08372834324836731, 0.0886773020029068, 0.09362626075744629, 0.09857521206140518, 0.10352417081594467, 0.10847312957048416, 0.11342208832502365, 0.11837104707956314, 0.12332000583410263, 0.12826895713806152, 0.133217915892601, 0.1381668746471405, 0.14311583340168, 0.14806479215621948]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 2.0, 7.0, 13.0, 7.0, 10.0, 10.0, 25.0, 84.0, 207.0, 4163852.0, 29758.0, 136.0, 42.0, 16.0, 16.0, 12.0, 11.0, 6.0, 4.0, 5.0, 1.0, 6.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 2.0, 5.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09820556640625, -0.09469318389892578, -0.09118080139160156, -0.08766841888427734, -0.08415603637695312, -0.0806436538696289, -0.07713127136230469, -0.07361888885498047, -0.07010650634765625, -0.06659412384033203, -0.06308174133300781, -0.059569358825683594, -0.056056976318359375, -0.052544593811035156, -0.04903221130371094, -0.04551982879638672, -0.0420074462890625, -0.03849506378173828, -0.03498268127441406, -0.031470298767089844, -0.027957916259765625, -0.024445533752441406, -0.020933151245117188, -0.01742076873779297, -0.01390838623046875, -0.010396003723144531, -0.0068836212158203125, -0.0033712387084960938, 0.000141143798828125, 0.0036535263061523438, 0.0071659088134765625, 0.010678291320800781, 0.014190673828125, 0.01770305633544922, 0.021215438842773438, 0.024727821350097656, 0.028240203857421875, 0.031752586364746094, 0.03526496887207031, 0.03877735137939453, 0.04228973388671875, 0.04580211639404297, 0.04931449890136719, 0.052826881408691406, 0.056339263916015625, 0.059851646423339844, 0.06336402893066406, 0.06687641143798828, 0.0703887939453125, 0.07390117645263672, 0.07741355895996094, 0.08092594146728516, 0.08443832397460938, 0.0879507064819336, 0.09146308898925781, 0.09497547149658203, 0.09848785400390625, 0.10200023651123047, 0.10551261901855469, 0.1090250015258789, 0.11253738403320312, 0.11604976654052734, 0.11956214904785156, 0.12307453155517578, 0.1265869140625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 3.0, 5.0, 15.0, 7.0, 9.0, 8.0, 14.0, 70.0, 142.0, 281.0, 209.0, 99.0, 26.0, 8.0, 10.0, 10.0, 10.0, 9.0, 4.0, 5.0, 1.0, 4.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.007396697998046875, -0.007133066654205322, -0.0068694353103637695, -0.006605803966522217, -0.006342172622680664, -0.006078541278839111, -0.005814909934997559, -0.005551278591156006, -0.005287647247314453, -0.0050240159034729, -0.004760384559631348, -0.004496753215789795, -0.004233121871948242, -0.0039694905281066895, -0.0037058591842651367, -0.003442227840423584, -0.0031785964965820312, -0.0029149651527404785, -0.0026513338088989258, -0.002387702465057373, -0.0021240711212158203, -0.0018604397773742676, -0.0015968084335327148, -0.0013331770896911621, -0.0010695457458496094, -0.0008059144020080566, -0.0005422830581665039, -0.00027865171432495117, -1.5020370483398438e-05, 0.0002486109733581543, 0.000512242317199707, 0.0007758736610412598, 0.0010395050048828125, 0.0013031363487243652, 0.001566767692565918, 0.0018303990364074707, 0.0020940303802490234, 0.002357661724090576, 0.002621293067932129, 0.0028849244117736816, 0.0031485557556152344, 0.003412187099456787, 0.00367581844329834, 0.003939449787139893, 0.004203081130981445, 0.004466712474822998, 0.004730343818664551, 0.0049939751625061035, 0.005257606506347656, 0.005521237850189209, 0.005784869194030762, 0.0060485005378723145, 0.006312131881713867, 0.00657576322555542, 0.006839394569396973, 0.007103025913238525, 0.007366657257080078, 0.007630288600921631, 0.007893919944763184, 0.008157551288604736, 0.008421182632446289, 0.008684813976287842, 0.008948445320129395, 0.009212076663970947, 0.0094757080078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 9.0, 13.0, 23.0, 75.0, 202.0, 721.0, 6143.0, 4179271.0, 6784.0, 722.0, 190.0, 62.0, 27.0, 11.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018585205078125, -0.017976045608520508, -0.017366886138916016, -0.016757726669311523, -0.01614856719970703, -0.015539407730102539, -0.014930248260498047, -0.014321088790893555, -0.013711929321289062, -0.01310276985168457, -0.012493610382080078, -0.011884450912475586, -0.011275291442871094, -0.010666131973266602, -0.01005697250366211, -0.009447813034057617, -0.008838653564453125, -0.008229494094848633, -0.007620334625244141, -0.0070111751556396484, -0.006402015686035156, -0.005792856216430664, -0.005183696746826172, -0.00457453727722168, -0.0039653778076171875, -0.0033562183380126953, -0.002747058868408203, -0.002137899398803711, -0.0015287399291992188, -0.0009195804595947266, -0.0003104209899902344, 0.0002987384796142578, 0.00090789794921875, 0.0015170574188232422, 0.0021262168884277344, 0.0027353763580322266, 0.0033445358276367188, 0.003953695297241211, 0.004562854766845703, 0.005172014236450195, 0.0057811737060546875, 0.00639033317565918, 0.006999492645263672, 0.007608652114868164, 0.008217811584472656, 0.008826971054077148, 0.00943613052368164, 0.010045289993286133, 0.010654449462890625, 0.011263608932495117, 0.01187276840209961, 0.012481927871704102, 0.013091087341308594, 0.013700246810913086, 0.014309406280517578, 0.01491856575012207, 0.015527725219726562, 0.016136884689331055, 0.016746044158935547, 0.01735520362854004, 0.01796436309814453, 0.018573522567749023, 0.019182682037353516, 0.019791841506958008, 0.0204010009765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 12.0, 19.0, 37.0, 90.0, 193.0, 2958.0, 528.0, 128.0, 56.0, 29.0, 9.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00806427001953125, -0.007861495018005371, -0.007658720016479492, -0.007455945014953613, -0.007253170013427734, -0.0070503950119018555, -0.0068476200103759766, -0.006644845008850098, -0.006442070007324219, -0.00623929500579834, -0.006036520004272461, -0.005833745002746582, -0.005630970001220703, -0.005428194999694824, -0.005225419998168945, -0.005022644996643066, -0.0048198699951171875, -0.004617094993591309, -0.00441431999206543, -0.004211544990539551, -0.004008769989013672, -0.003805994987487793, -0.003603219985961914, -0.003400444984436035, -0.0031976699829101562, -0.0029948949813842773, -0.0027921199798583984, -0.0025893449783325195, -0.0023865699768066406, -0.0021837949752807617, -0.001981019973754883, -0.001778244972229004, -0.001575469970703125, -0.001372694969177246, -0.0011699199676513672, -0.0009671449661254883, -0.0007643699645996094, -0.0005615949630737305, -0.00035881996154785156, -0.00015604496002197266, 4.673004150390625e-05, 0.00024950504302978516, 0.00045228004455566406, 0.000655055046081543, 0.0008578300476074219, 0.0010606050491333008, 0.0012633800506591797, 0.0014661550521850586, 0.0016689300537109375, 0.0018717050552368164, 0.0020744800567626953, 0.0022772550582885742, 0.002480030059814453, 0.002682805061340332, 0.002885580062866211, 0.00308835506439209, 0.0032911300659179688, 0.0034939050674438477, 0.0036966800689697266, 0.0038994550704956055, 0.004102230072021484, 0.004305005073547363, 0.004507780075073242, 0.004710555076599121, 0.004913330078125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [107.0, 909.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004444257356226444, -0.00020800484344363213, 0.00402824766933918, 0.008264499716460705, 0.012500752694904804, 0.01673700660467148, 0.02097325772047043, 0.02520950883626938, 0.029445763677358627, 0.03368201479315758, 0.037918269634246826, 0.042154520750045776, 0.04639077186584473, 0.050627026706933975, 0.054863277822732925, 0.059099532663822174, 0.06333578377962112, 0.06757203489542007, 0.07180828601121902, 0.07604454457759857, 0.08028079569339752, 0.08451704680919647, 0.08875329792499542, 0.09298954904079437, 0.09722580015659332, 0.10146205127239227, 0.10569830238819122, 0.10993455350399017, 0.11417081207036972, 0.11840706318616867, 0.12264331430196762, 0.12687957286834717, 0.13111580908298492, 0.13535206019878387, 0.13958831131458282, 0.14382456243038177, 0.14806081354618073, 0.15229707956314087, 0.15653333067893982, 0.16076958179473877, 0.16500583291053772, 0.16924208402633667, 0.17347833514213562, 0.17771458625793457, 0.18195083737373352, 0.18618708848953247, 0.19042333960533142, 0.19465960562229156, 0.19889584183692932, 0.20313209295272827, 0.20736834406852722, 0.21160459518432617, 0.21584084630012512, 0.22007709741592407, 0.22431334853172302, 0.22854961454868317, 0.23278586566448212, 0.23702211678028107, 0.24125836789608002, 0.24549461901187897, 0.24973087012767792, 0.25396713614463806, 0.258203387260437, 0.26243963837623596, 0.2666758894920349]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 4.0, 4.0, 2.0, 2.0, 4.0, 7.0, 6.0, 14.0, 13.0, 19.0, 17.0, 21.0, 23.0, 27.0, 40.0, 35.0, 57.0, 44.0, 65.0, 55.0, 45.0, 47.0, 54.0, 50.0, 50.0, 36.0, 37.0, 40.0, 29.0, 26.0, 33.0, 21.0, 10.0, 21.0, 11.0, 9.0, 14.0, 4.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008043885231018066, -0.007724401541054249, -0.007404917851090431, -0.007085434161126614, -0.006765950471162796, -0.006446466781198978, -0.006126983091235161, -0.005807499401271343, -0.005488015711307526, -0.005168532021343708, -0.0048490483313798904, -0.004529564641416073, -0.004210080951452255, -0.0038905972614884377, -0.00357111357152462, -0.0032516298815608025, -0.002932146191596985, -0.0026126625016331673, -0.0022931788116693497, -0.001973695121705532, -0.0016542114317417145, -0.0013347277417778969, -0.0010152440518140793, -0.0006957603618502617, -0.0003762766718864441, -5.6792981922626495e-05, 0.0002626907080411911, 0.0005821743980050087, 0.0009016580879688263, 0.0012211417779326439, 0.0015406254678964615, 0.001860109157860279, 0.0021795928478240967, 0.0024990765377879143, 0.002818560227751732, 0.0031380439177155495, 0.003457527607679367, 0.0037770112976431847, 0.004096494987607002, 0.00441597867757082, 0.0047354623675346375, 0.005054946057498455, 0.005374429747462273, 0.00569391343742609, 0.006013397127389908, 0.006332880817353725, 0.006652364507317543, 0.006971848197281361, 0.007291331887245178, 0.007610815577208996, 0.007930299267172813, 0.008249782957136631, 0.008569266647100449, 0.008888750337064266, 0.009208234027028084, 0.009527717716991901, 0.009847201406955719, 0.010166685096919537, 0.010486168786883354, 0.010805652476847172, 0.01112513616681099, 0.011444619856774807, 0.011764103546738625, 0.012083587236702442, 0.01240307092666626]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 8.0, 9.0, 12.0, 18.0, 24.0, 32.0, 38.0, 42.0, 77.0, 114.0, 156.0, 217.0, 372.0, 547.0, 887.0, 1380.0, 2521.0, 4589.0, 9715.0, 27367.0, 813729.0, 151509.0, 18309.0, 7676.0, 3661.0, 2044.0, 1185.0, 752.0, 508.0, 319.0, 197.0, 176.0, 106.0, 80.0, 40.0, 28.0, 29.0, 19.0, 15.0, 14.0, 6.0, 9.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.01155853271484375, -0.011236071586608887, -0.010913610458374023, -0.01059114933013916, -0.010268688201904297, -0.009946227073669434, -0.00962376594543457, -0.009301304817199707, -0.008978843688964844, -0.00865638256072998, -0.008333921432495117, -0.008011460304260254, -0.007688999176025391, -0.007366538047790527, -0.007044076919555664, -0.006721615791320801, -0.0063991546630859375, -0.006076693534851074, -0.005754232406616211, -0.005431771278381348, -0.005109310150146484, -0.004786849021911621, -0.004464387893676758, -0.0041419267654418945, -0.0038194656372070312, -0.003497004508972168, -0.0031745433807373047, -0.0028520822525024414, -0.002529621124267578, -0.002207159996032715, -0.0018846988677978516, -0.0015622377395629883, -0.001239776611328125, -0.0009173154830932617, -0.0005948543548583984, -0.00027239322662353516, 5.0067901611328125e-05, 0.0003725290298461914, 0.0006949901580810547, 0.001017451286315918, 0.0013399124145507812, 0.0016623735427856445, 0.001984834671020508, 0.002307295799255371, 0.0026297569274902344, 0.0029522180557250977, 0.003274679183959961, 0.0035971403121948242, 0.0039196014404296875, 0.004242062568664551, 0.004564523696899414, 0.004886984825134277, 0.005209445953369141, 0.005531907081604004, 0.005854368209838867, 0.0061768293380737305, 0.006499290466308594, 0.006821751594543457, 0.00714421272277832, 0.007466673851013184, 0.007789134979248047, 0.00811159610748291, 0.008434057235717773, 0.008756518363952637, 0.0090789794921875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 5.0, 3.0, 6.0, 14.0, 7.0, 8.0, 9.0, 14.0, 70.0, 149.0, 278.0, 209.0, 96.0, 25.0, 8.0, 10.0, 11.0, 9.0, 9.0, 4.0, 5.0, 1.0, 4.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00738525390625, -0.0071218013763427734, -0.006858348846435547, -0.00659489631652832, -0.006331443786621094, -0.006067991256713867, -0.005804538726806641, -0.005541086196899414, -0.0052776336669921875, -0.005014181137084961, -0.004750728607177734, -0.004487276077270508, -0.004223823547363281, -0.003960371017456055, -0.003696918487548828, -0.0034334659576416016, -0.003170013427734375, -0.0029065608978271484, -0.002643108367919922, -0.0023796558380126953, -0.0021162033081054688, -0.0018527507781982422, -0.0015892982482910156, -0.001325845718383789, -0.0010623931884765625, -0.0007989406585693359, -0.0005354881286621094, -0.0002720355987548828, -8.58306884765625e-06, 0.0002548694610595703, 0.0005183219909667969, 0.0007817745208740234, 0.00104522705078125, 0.0013086795806884766, 0.0015721321105957031, 0.0018355846405029297, 0.0020990371704101562, 0.002362489700317383, 0.0026259422302246094, 0.002889394760131836, 0.0031528472900390625, 0.003416299819946289, 0.0036797523498535156, 0.003943204879760742, 0.004206657409667969, 0.004470109939575195, 0.004733562469482422, 0.0049970149993896484, 0.005260467529296875, 0.0055239200592041016, 0.005787372589111328, 0.006050825119018555, 0.006314277648925781, 0.006577730178833008, 0.006841182708740234, 0.007104635238647461, 0.0073680877685546875, 0.007631540298461914, 0.00789499282836914, 0.008158445358276367, 0.008421897888183594, 0.00868535041809082, 0.008948802947998047, 0.009212255477905273, 0.0094757080078125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 10.0, 7.0, 14.0, 24.0, 17.0, 17.0, 31.0, 35.0, 32.0, 61.0, 100.0, 118.0, 137.0, 187.0, 308.0, 576.0, 1068.0, 4259.0, 799459.0, 236536.0, 3050.0, 939.0, 471.0, 309.0, 191.0, 151.0, 100.0, 95.0, 63.0, 41.0, 28.0, 29.0, 16.0, 15.0, 17.0, 10.0, 10.0, 6.0, 2.0, 1.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02581787109375, -0.02503371238708496, -0.024249553680419922, -0.023465394973754883, -0.022681236267089844, -0.021897077560424805, -0.021112918853759766, -0.020328760147094727, -0.019544601440429688, -0.01876044273376465, -0.01797628402709961, -0.01719212532043457, -0.01640796661376953, -0.015623807907104492, -0.014839649200439453, -0.014055490493774414, -0.013271331787109375, -0.012487173080444336, -0.011703014373779297, -0.010918855667114258, -0.010134696960449219, -0.00935053825378418, -0.00856637954711914, -0.0077822208404541016, -0.0069980621337890625, -0.0062139034271240234, -0.005429744720458984, -0.004645586013793945, -0.0038614273071289062, -0.003077268600463867, -0.002293109893798828, -0.001508951187133789, -0.00072479248046875, 5.936622619628906e-05, 0.0008435249328613281, 0.0016276836395263672, 0.0024118423461914062, 0.0031960010528564453, 0.003980159759521484, 0.0047643184661865234, 0.0055484771728515625, 0.0063326358795166016, 0.007116794586181641, 0.00790095329284668, 0.008685111999511719, 0.009469270706176758, 0.010253429412841797, 0.011037588119506836, 0.011821746826171875, 0.012605905532836914, 0.013390064239501953, 0.014174222946166992, 0.014958381652832031, 0.01574254035949707, 0.01652669906616211, 0.01731085777282715, 0.018095016479492188, 0.018879175186157227, 0.019663333892822266, 0.020447492599487305, 0.021231651306152344, 0.022015810012817383, 0.022799968719482422, 0.02358412742614746, 0.0243682861328125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 10.0, 6.0, 13.0, 20.0, 13.0, 10.0, 19.0, 21.0, 19.0, 27.0, 40.0, 36.0, 37.0, 26.0, 38.0, 36.0, 44.0, 58.0, 39.0, 43.0, 34.0, 35.0, 38.0, 44.0, 40.0, 50.0, 25.0, 32.0, 24.0, 17.0, 19.0, 19.0, 10.0, 9.0, 15.0, 7.0, 8.0, 5.0, 1.0, 1.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.022247314453125, -0.02157115936279297, -0.020895004272460938, -0.020218849182128906, -0.019542694091796875, -0.018866539001464844, -0.018190383911132812, -0.01751422882080078, -0.01683807373046875, -0.01616191864013672, -0.015485763549804688, -0.014809608459472656, -0.014133453369140625, -0.013457298278808594, -0.012781143188476562, -0.012104988098144531, -0.0114288330078125, -0.010752677917480469, -0.010076522827148438, -0.009400367736816406, -0.008724212646484375, -0.008048057556152344, -0.0073719024658203125, -0.006695747375488281, -0.00601959228515625, -0.005343437194824219, -0.0046672821044921875, -0.003991127014160156, -0.003314971923828125, -0.0026388168334960938, -0.0019626617431640625, -0.0012865066528320312, -0.0006103515625, 6.580352783203125e-05, 0.0007419586181640625, 0.0014181137084960938, 0.002094268798828125, 0.0027704238891601562, 0.0034465789794921875, 0.004122734069824219, 0.00479888916015625, 0.005475044250488281, 0.0061511993408203125, 0.006827354431152344, 0.007503509521484375, 0.008179664611816406, 0.008855819702148438, 0.009531974792480469, 0.0102081298828125, 0.010884284973144531, 0.011560440063476562, 0.012236595153808594, 0.012912750244140625, 0.013588905334472656, 0.014265060424804688, 0.014941215515136719, 0.01561737060546875, 0.01629352569580078, 0.016969680786132812, 0.017645835876464844, 0.018321990966796875, 0.018998146057128906, 0.019674301147460938, 0.02035045623779297, 0.021026611328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 8.0, 4.0, 8.0, 11.0, 23.0, 15.0, 22.0, 42.0, 37.0, 109.0, 86.0, 112.0, 298.0, 323.0, 1054.0, 1839.0, 15046.0, 147643.0, 836544.0, 39231.0, 3178.0, 1544.0, 444.0, 371.0, 175.0, 99.0, 97.0, 46.0, 43.0, 20.0, 17.0, 24.0, 6.0, 4.0, 7.0, 5.0, 7.0, 7.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.649162292480469e-06, -4.50480729341507e-06, -4.36045229434967e-06, -4.216097295284271e-06, -4.071742296218872e-06, -3.927387297153473e-06, -3.7830322980880737e-06, -3.6386772990226746e-06, -3.4943222999572754e-06, -3.3499673008918762e-06, -3.205612301826477e-06, -3.061257302761078e-06, -2.9169023036956787e-06, -2.7725473046302795e-06, -2.6281923055648804e-06, -2.483837306499481e-06, -2.339482307434082e-06, -2.195127308368683e-06, -2.0507723093032837e-06, -1.9064173102378845e-06, -1.7620623111724854e-06, -1.6177073121070862e-06, -1.473352313041687e-06, -1.3289973139762878e-06, -1.1846423149108887e-06, -1.0402873158454895e-06, -8.959323167800903e-07, -7.515773177146912e-07, -6.07222318649292e-07, -4.628673195838928e-07, -3.1851232051849365e-07, -1.7415732145309448e-07, -2.9802322387695312e-08, 1.1455267667770386e-07, 2.5890767574310303e-07, 4.032626748085022e-07, 5.476176738739014e-07, 6.919726729393005e-07, 8.363276720046997e-07, 9.806826710700989e-07, 1.125037670135498e-06, 1.2693926692008972e-06, 1.4137476682662964e-06, 1.5581026673316956e-06, 1.7024576663970947e-06, 1.846812665462494e-06, 1.991167664527893e-06, 2.1355226635932922e-06, 2.2798776626586914e-06, 2.4242326617240906e-06, 2.5685876607894897e-06, 2.712942659854889e-06, 2.857297658920288e-06, 3.0016526579856873e-06, 3.1460076570510864e-06, 3.2903626561164856e-06, 3.4347176551818848e-06, 3.579072654247284e-06, 3.723427653312683e-06, 3.867782652378082e-06, 4.0121376514434814e-06, 4.156492650508881e-06, 4.30084764957428e-06, 4.445202648639679e-06, 4.589557647705078e-06]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 2.0, 4.0, 3.0, 6.0, 9.0, 5.0, 17.0, 9.0, 17.0, 18.0, 28.0, 19.0, 40.0, 17.0, 39.0, 23.0, 61.0, 19.0, 64.0, 34.0, 91.0, 80.0, 38.0, 68.0, 15.0, 47.0, 29.0, 33.0, 18.0, 38.0, 17.0, 19.0, 7.0, 12.0, 6.0, 9.0, 8.0, 1.0, 2.0, 2.0, 7.0, 2.0, 5.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.9206275939941406e-06, -2.8293579816818237e-06, -2.738088369369507e-06, -2.64681875705719e-06, -2.555549144744873e-06, -2.464279532432556e-06, -2.3730099201202393e-06, -2.2817403078079224e-06, -2.1904706954956055e-06, -2.0992010831832886e-06, -2.0079314708709717e-06, -1.9166618585586548e-06, -1.8253922462463379e-06, -1.734122633934021e-06, -1.642853021621704e-06, -1.5515834093093872e-06, -1.4603137969970703e-06, -1.3690441846847534e-06, -1.2777745723724365e-06, -1.1865049600601196e-06, -1.0952353477478027e-06, -1.0039657354354858e-06, -9.126961231231689e-07, -8.21426510810852e-07, -7.301568984985352e-07, -6.388872861862183e-07, -5.476176738739014e-07, -4.5634806156158447e-07, -3.650784492492676e-07, -2.738088369369507e-07, -1.825392246246338e-07, -9.12696123123169e-08, 0.0, 9.12696123123169e-08, 1.825392246246338e-07, 2.738088369369507e-07, 3.650784492492676e-07, 4.5634806156158447e-07, 5.476176738739014e-07, 6.388872861862183e-07, 7.301568984985352e-07, 8.21426510810852e-07, 9.126961231231689e-07, 1.0039657354354858e-06, 1.0952353477478027e-06, 1.1865049600601196e-06, 1.2777745723724365e-06, 1.3690441846847534e-06, 1.4603137969970703e-06, 1.5515834093093872e-06, 1.642853021621704e-06, 1.734122633934021e-06, 1.8253922462463379e-06, 1.9166618585586548e-06, 2.0079314708709717e-06, 2.0992010831832886e-06, 2.1904706954956055e-06, 2.2817403078079224e-06, 2.3730099201202393e-06, 2.464279532432556e-06, 2.555549144744873e-06, 2.64681875705719e-06, 2.738088369369507e-06, 2.8293579816818237e-06, 2.9206275939941406e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 4.0, 15.0, 19.0, 27.0, 51.0, 78.0, 167.0, 415.0, 3803.0, 1040571.0, 2588.0, 452.0, 148.0, 84.0, 45.0, 29.0, 20.0, 7.0, 7.0, 2.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5795230865478516e-05, -1.5174970030784607e-05, -1.4554709196090698e-05, -1.393444836139679e-05, -1.3314187526702881e-05, -1.2693926692008972e-05, -1.2073665857315063e-05, -1.1453405022621155e-05, -1.0833144187927246e-05, -1.0212883353233337e-05, -9.592622518539429e-06, -8.97236168384552e-06, -8.352100849151611e-06, -7.731840014457703e-06, -7.111579179763794e-06, -6.491318345069885e-06, -5.8710575103759766e-06, -5.250796675682068e-06, -4.630535840988159e-06, -4.0102750062942505e-06, -3.390014171600342e-06, -2.769753336906433e-06, -2.1494925022125244e-06, -1.5292316675186157e-06, -9.08970832824707e-07, -2.8870999813079834e-07, 3.3155083656311035e-07, 9.51811671257019e-07, 1.5720725059509277e-06, 2.1923333406448364e-06, 2.812594175338745e-06, 3.432855010032654e-06, 4.0531158447265625e-06, 4.673376679420471e-06, 5.29363751411438e-06, 5.9138983488082886e-06, 6.534159183502197e-06, 7.154420018196106e-06, 7.774680852890015e-06, 8.394941687583923e-06, 9.015202522277832e-06, 9.63546335697174e-06, 1.025572419166565e-05, 1.0875985026359558e-05, 1.1496245861053467e-05, 1.2116506695747375e-05, 1.2736767530441284e-05, 1.3357028365135193e-05, 1.3977289199829102e-05, 1.459755003452301e-05, 1.5217810869216919e-05, 1.5838071703910828e-05, 1.6458332538604736e-05, 1.7078593373298645e-05, 1.7698854207992554e-05, 1.8319115042686462e-05, 1.893937587738037e-05, 1.955963671207428e-05, 2.017989754676819e-05, 2.0800158381462097e-05, 2.1420419216156006e-05, 2.2040680050849915e-05, 2.2660940885543823e-05, 2.3281201720237732e-05, 2.390146255493164e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 4.0, 8.0, 10.0, 9.0, 25.0, 30.0, 42.0, 67.0, 81.0, 481.0, 78.0, 55.0, 32.0, 23.0, 21.0, 6.0, 10.0, 5.0, 5.0, 1.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3589859008789062e-05, -1.3055279850959778e-05, -1.2520700693130493e-05, -1.1986121535301208e-05, -1.1451542377471924e-05, -1.091696321964264e-05, -1.0382384061813354e-05, -9.84780490398407e-06, -9.313225746154785e-06, -8.7786465883255e-06, -8.244067430496216e-06, -7.709488272666931e-06, -7.1749091148376465e-06, -6.640329957008362e-06, -6.105750799179077e-06, -5.5711716413497925e-06, -5.036592483520508e-06, -4.502013325691223e-06, -3.9674341678619385e-06, -3.432855010032654e-06, -2.898275852203369e-06, -2.3636966943740845e-06, -1.8291175365447998e-06, -1.2945383787155151e-06, -7.599592208862305e-07, -2.253800630569458e-07, 3.0919909477233887e-07, 8.437782526016235e-07, 1.3783574104309082e-06, 1.912936568260193e-06, 2.4475157260894775e-06, 2.982094883918762e-06, 3.516674041748047e-06, 4.0512531995773315e-06, 4.585832357406616e-06, 5.120411515235901e-06, 5.6549906730651855e-06, 6.18956983089447e-06, 6.724148988723755e-06, 7.2587281465530396e-06, 7.793307304382324e-06, 8.327886462211609e-06, 8.862465620040894e-06, 9.397044777870178e-06, 9.931623935699463e-06, 1.0466203093528748e-05, 1.1000782251358032e-05, 1.1535361409187317e-05, 1.2069940567016602e-05, 1.2604519724845886e-05, 1.3139098882675171e-05, 1.3673678040504456e-05, 1.420825719833374e-05, 1.4742836356163025e-05, 1.527741551399231e-05, 1.5811994671821594e-05, 1.634657382965088e-05, 1.6881152987480164e-05, 1.7415732145309448e-05, 1.7950311303138733e-05, 1.8484890460968018e-05, 1.9019469618797302e-05, 1.9554048776626587e-05, 2.008862793445587e-05, 2.0623207092285156e-05]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 104.0, 878.0, 27.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07476025819778442, -0.06575579941272736, -0.05675134062767029, -0.04774687811732292, -0.038742419332265854, -0.029737960547208786, -0.02073349803686142, -0.011729039251804352, -0.002724580466747284, 0.0062798792496323586, 0.015284338966012001, 0.024288799613714218, 0.033293258398771286, 0.042297717183828354, 0.05130217969417572, 0.06030663847923279, 0.06931109726428986, 0.07831555604934692, 0.08732001483440399, 0.09632447361946106, 0.10532893240451813, 0.1143333911895752, 0.12333785742521286, 0.13234230875968933, 0.1413467824459076, 0.15035124123096466, 0.15935570001602173, 0.1683601588010788, 0.17736461758613586, 0.18636907637119293, 0.19537353515625, 0.20437800884246826, 0.21338245272636414, 0.2223869115114212, 0.23139137029647827, 0.24039582908153534, 0.2494002878665924, 0.25840476155281067, 0.26740920543670654, 0.2764136791229248, 0.2854181230068207, 0.29442259669303894, 0.3034270405769348, 0.3124315142631531, 0.32143595814704895, 0.3304404318332672, 0.3394448757171631, 0.34844934940338135, 0.3574538230895996, 0.36645829677581787, 0.37546274065971375, 0.384467214345932, 0.3934716582298279, 0.40247613191604614, 0.411480575799942, 0.4204850494861603, 0.42948949337005615, 0.4384939670562744, 0.4474984109401703, 0.45650288462638855, 0.4655073285102844, 0.4745118021965027, 0.48351624608039856, 0.4925207197666168, 0.5015251636505127]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 8.0, 7.0, 6.0, 9.0, 12.0, 10.0, 17.0, 15.0, 14.0, 25.0, 23.0, 31.0, 41.0, 34.0, 40.0, 37.0, 54.0, 56.0, 49.0, 44.0, 54.0, 55.0, 38.0, 41.0, 29.0, 35.0, 23.0, 28.0, 26.0, 24.0, 18.0, 24.0, 13.0, 13.0, 8.0, 9.0, 9.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12279540300369263, -0.11929187923669815, -0.11578836292028427, -0.1122848391532898, -0.10878132283687592, -0.10527779906988144, -0.10177427530288696, -0.09827075898647308, -0.09476723521947861, -0.09126371145248413, -0.08776019513607025, -0.08425667136907578, -0.0807531476020813, -0.07724963128566742, -0.07374610751867294, -0.07024258375167847, -0.06673906743526459, -0.06323554366827011, -0.05973202735185623, -0.056228503584861755, -0.05272498354315758, -0.0492214635014534, -0.04571793973445892, -0.042214419692754745, -0.03871089965105057, -0.03520737960934639, -0.03170385956764221, -0.028200335800647736, -0.024696815758943558, -0.02119329571723938, -0.017689773812890053, -0.014186251908540726, -0.010682731866836548, -0.007179210893809795, -0.003675689920783043, -0.00017216894775629044, 0.003331352025270462, 0.00683487206697464, 0.010338393971323967, 0.013841915875673294, 0.017345435917377472, 0.02084895595908165, 0.024352477863430977, 0.027855999767780304, 0.03135951980948448, 0.03486303985118866, 0.038366563618183136, 0.041870083659887314, 0.04537360370159149, 0.04887712374329567, 0.05238064378499985, 0.055884167551994324, 0.0593876875936985, 0.06289120763540268, 0.06639473140239716, 0.06989824771881104, 0.07340177148580551, 0.07690529525279999, 0.08040881156921387, 0.08391233533620834, 0.08741585910320282, 0.0909193754196167, 0.09442289918661118, 0.09792642295360565, 0.10142993927001953]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 2.0, 4.0, 16.0, 5.0, 11.0, 6.0, 21.0, 88.0, 498.0, 12074.0, 4180730.0, 613.0, 76.0, 27.0, 11.0, 12.0, 12.0, 6.0, 5.0, 6.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0277099609375, -0.026724815368652344, -0.025739669799804688, -0.02475452423095703, -0.023769378662109375, -0.02278423309326172, -0.021799087524414062, -0.020813941955566406, -0.01982879638671875, -0.018843650817871094, -0.017858505249023438, -0.01687335968017578, -0.015888214111328125, -0.014903068542480469, -0.013917922973632812, -0.012932777404785156, -0.0119476318359375, -0.010962486267089844, -0.009977340698242188, -0.008992195129394531, -0.008007049560546875, -0.007021903991699219, -0.0060367584228515625, -0.005051612854003906, -0.00406646728515625, -0.0030813217163085938, -0.0020961761474609375, -0.0011110305786132812, -0.000125885009765625, 0.0008592605590820312, 0.0018444061279296875, 0.0028295516967773438, 0.003814697265625, 0.004799842834472656, 0.0057849884033203125, 0.006770133972167969, 0.007755279541015625, 0.008740425109863281, 0.009725570678710938, 0.010710716247558594, 0.01169586181640625, 0.012681007385253906, 0.013666152954101562, 0.014651298522949219, 0.015636444091796875, 0.01662158966064453, 0.017606735229492188, 0.018591880798339844, 0.0195770263671875, 0.020562171936035156, 0.021547317504882812, 0.02253246307373047, 0.023517608642578125, 0.02450275421142578, 0.025487899780273438, 0.026473045349121094, 0.02745819091796875, 0.028443336486816406, 0.029428482055664062, 0.03041362762451172, 0.031398773193359375, 0.03238391876220703, 0.03336906433105469, 0.034354209899902344, 0.03533935546875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 6.0, 2.0, 3.0, 16.0, 6.0, 10.0, 6.0, 15.0, 54.0, 118.0, 265.0, 233.0, 116.0, 37.0, 14.0, 7.0, 12.0, 10.0, 9.0, 5.0, 6.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007404327392578125, -0.007142364978790283, -0.006880402565002441, -0.0066184401512146, -0.006356477737426758, -0.006094515323638916, -0.005832552909851074, -0.005570590496063232, -0.005308628082275391, -0.005046665668487549, -0.004784703254699707, -0.004522740840911865, -0.0042607784271240234, -0.003998816013336182, -0.00373685359954834, -0.003474891185760498, -0.0032129287719726562, -0.0029509663581848145, -0.0026890039443969727, -0.002427041530609131, -0.002165079116821289, -0.0019031167030334473, -0.0016411542892456055, -0.0013791918754577637, -0.0011172294616699219, -0.0008552670478820801, -0.0005933046340942383, -0.0003313422203063965, -6.937980651855469e-05, 0.0001925826072692871, 0.0004545450210571289, 0.0007165074348449707, 0.0009784698486328125, 0.0012404322624206543, 0.001502394676208496, 0.0017643570899963379, 0.0020263195037841797, 0.0022882819175720215, 0.0025502443313598633, 0.002812206745147705, 0.003074169158935547, 0.0033361315727233887, 0.0035980939865112305, 0.0038600564002990723, 0.004122018814086914, 0.004383981227874756, 0.004645943641662598, 0.0049079060554504395, 0.005169868469238281, 0.005431830883026123, 0.005693793296813965, 0.005955755710601807, 0.0062177181243896484, 0.00647968053817749, 0.006741642951965332, 0.007003605365753174, 0.007265567779541016, 0.007527530193328857, 0.007789492607116699, 0.008051455020904541, 0.008313417434692383, 0.008575379848480225, 0.008837342262268066, 0.009099304676055908, 0.00936126708984375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 9.0, 11.0, 4.0, 22.0, 22.0, 44.0, 56.0, 209.0, 646.0, 2926.0, 27620.0, 4148640.0, 11572.0, 1730.0, 454.0, 136.0, 73.0, 18.0, 22.0, 16.0, 11.0, 8.0, 3.0, 6.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0074310302734375, -0.007214725017547607, -0.006998419761657715, -0.006782114505767822, -0.00656580924987793, -0.006349503993988037, -0.0061331987380981445, -0.005916893482208252, -0.005700588226318359, -0.005484282970428467, -0.005267977714538574, -0.005051672458648682, -0.004835367202758789, -0.0046190619468688965, -0.004402756690979004, -0.004186451435089111, -0.003970146179199219, -0.003753840923309326, -0.0035375356674194336, -0.003321230411529541, -0.0031049251556396484, -0.002888619899749756, -0.0026723146438598633, -0.0024560093879699707, -0.002239704132080078, -0.0020233988761901855, -0.001807093620300293, -0.0015907883644104004, -0.0013744831085205078, -0.0011581778526306152, -0.0009418725967407227, -0.0007255673408508301, -0.0005092620849609375, -0.0002929568290710449, -7.665157318115234e-05, 0.00013965368270874023, 0.0003559589385986328, 0.0005722641944885254, 0.000788569450378418, 0.0010048747062683105, 0.0012211799621582031, 0.0014374852180480957, 0.0016537904739379883, 0.0018700957298278809, 0.0020864009857177734, 0.002302706241607666, 0.0025190114974975586, 0.002735316753387451, 0.0029516220092773438, 0.0031679272651672363, 0.003384232521057129, 0.0036005377769470215, 0.003816843032836914, 0.004033148288726807, 0.004249453544616699, 0.004465758800506592, 0.004682064056396484, 0.004898369312286377, 0.0051146745681762695, 0.005330979824066162, 0.005547285079956055, 0.005763590335845947, 0.00597989559173584, 0.006196200847625732, 0.006412506103515625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 4.0, 7.0, 8.0, 3.0, 7.0, 15.0, 25.0, 36.0, 162.0, 3526.0, 152.0, 43.0, 23.0, 17.0, 11.0, 10.0, 3.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002166748046875, -0.0020933449268341064, -0.002019941806793213, -0.0019465386867523193, -0.0018731355667114258, -0.0017997324466705322, -0.0017263293266296387, -0.0016529262065887451, -0.0015795230865478516, -0.001506119966506958, -0.0014327168464660645, -0.001359313726425171, -0.0012859106063842773, -0.0012125074863433838, -0.0011391043663024902, -0.0010657012462615967, -0.0009922981262207031, -0.0009188950061798096, -0.000845491886138916, -0.0007720887660980225, -0.0006986856460571289, -0.0006252825260162354, -0.0005518794059753418, -0.00047847628593444824, -0.0004050731658935547, -0.00033167004585266113, -0.0002582669258117676, -0.00018486380577087402, -0.00011146068572998047, -3.8057565689086914e-05, 3.534555435180664e-05, 0.0001087486743927002, 0.00018215179443359375, 0.0002555549144744873, 0.00032895803451538086, 0.0004023611545562744, 0.00047576427459716797, 0.0005491673946380615, 0.0006225705146789551, 0.0006959736347198486, 0.0007693767547607422, 0.0008427798748016357, 0.0009161829948425293, 0.0009895861148834229, 0.0010629892349243164, 0.00113639235496521, 0.0012097954750061035, 0.001283198595046997, 0.0013566017150878906, 0.0014300048351287842, 0.0015034079551696777, 0.0015768110752105713, 0.0016502141952514648, 0.0017236173152923584, 0.001797020435333252, 0.0018704235553741455, 0.001943826675415039, 0.0020172297954559326, 0.002090632915496826, 0.0021640360355377197, 0.0022374391555786133, 0.002310842275619507, 0.0023842453956604004, 0.002457648515701294, 0.0025310516357421875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 17.0, 918.0, 72.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.020353326573967934, -0.019935347139835358, -0.01951736770570278, -0.019099388271570206, -0.01868141070008278, -0.018263431265950203, -0.017845451831817627, -0.01742747239768505, -0.017009492963552475, -0.0165915135294199, -0.016173534095287323, -0.015755556523799896, -0.015337576158344746, -0.014919597655534744, -0.014501618221402168, -0.014083638787269592, -0.013665660284459591, -0.013247680850327015, -0.012829702347517014, -0.012411722913384438, -0.011993743479251862, -0.011575764045119286, -0.011157785542309284, -0.010739806108176708, -0.010321827605366707, -0.00990384817123413, -0.00948586966842413, -0.009067890234291553, -0.008649910800158978, -0.008231932297348976, -0.0078139528632164, -0.007395973429083824, -0.006977994926273823, -0.006560015957802534, -0.006142036523669958, -0.005724057555198669, -0.0053060781210660934, -0.004888099152594805, -0.004470120184123516, -0.00405214074999094, -0.0036341617815196514, -0.003216182580217719, -0.0027982033789157867, -0.002380224410444498, -0.0019622452091425657, -0.0015442660078406334, -0.0011262870393693447, -0.0007083078380674124, -0.00029032863676548004, 0.00012765050632879138, 0.0005456296494230628, 0.0009636087343096733, 0.0013815879356116056, 0.001799567136913538, 0.0022175461053848267, 0.002635525306686759, 0.0030535045079886913, 0.0034714837092906237, 0.003889462910592556, 0.004307441879063845, 0.004725420847535133, 0.005143400281667709, 0.005561379250138998, 0.005979358218610287, 0.006397337652742863]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 9.0, 16.0, 14.0, 10.0, 19.0, 22.0, 22.0, 29.0, 30.0, 38.0, 40.0, 39.0, 36.0, 36.0, 56.0, 55.0, 59.0, 51.0, 47.0, 49.0, 41.0, 46.0, 38.0, 37.0, 30.0, 37.0, 16.0, 17.0, 10.0, 12.0, 7.0, 4.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.004937589168548584, -0.0047957561910152435, -0.004653923213481903, -0.004512090235948563, -0.004370257258415222, -0.004228424280881882, -0.004086591303348541, -0.003944758325815201, -0.0038029253482818604, -0.00366109237074852, -0.0035192593932151794, -0.003377426415681839, -0.0032355934381484985, -0.003093760460615158, -0.0029519274830818176, -0.002810094505548477, -0.0026682615280151367, -0.0025264285504817963, -0.002384595572948456, -0.0022427625954151154, -0.002100929617881775, -0.0019590966403484344, -0.001817263662815094, -0.0016754306852817535, -0.001533597707748413, -0.0013917647302150726, -0.0012499317526817322, -0.0011080987751483917, -0.0009662657976150513, -0.0008244328200817108, -0.0006825998425483704, -0.0005407668650150299, -0.00039893388748168945, -0.000257100909948349, -0.00011526793241500854, 2.656504511833191e-05, 0.00016839802265167236, 0.0003102310001850128, 0.00045206397771835327, 0.0005938969552516937, 0.0007357299327850342, 0.0008775629103183746, 0.001019395887851715, 0.0011612288653850555, 0.001303061842918396, 0.0014448948204517365, 0.001586727797985077, 0.0017285607755184174, 0.0018703937530517578, 0.0020122267305850983, 0.0021540597081184387, 0.002295892685651779, 0.0024377256631851196, 0.00257955864071846, 0.0027213916182518005, 0.002863224595785141, 0.0030050575733184814, 0.003146890550851822, 0.0032887235283851624, 0.003430556505918503, 0.0035723894834518433, 0.0037142224609851837, 0.003856055438518524, 0.003997888416051865, 0.004139721393585205]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 9.0, 4.0, 14.0, 9.0, 14.0, 17.0, 37.0, 55.0, 59.0, 93.0, 142.0, 208.0, 322.0, 440.0, 622.0, 988.0, 1604.0, 2544.0, 4350.0, 8113.0, 17370.0, 81866.0, 857292.0, 42220.0, 13513.0, 6741.0, 3664.0, 2117.0, 1370.0, 887.0, 597.0, 394.0, 272.0, 174.0, 110.0, 83.0, 65.0, 54.0, 38.0, 22.0, 16.0, 17.0, 7.0, 4.0, 4.0, 6.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00897216796875, -0.008666515350341797, -0.008360862731933594, -0.00805521011352539, -0.0077495574951171875, -0.007443904876708984, -0.007138252258300781, -0.006832599639892578, -0.006526947021484375, -0.006221294403076172, -0.005915641784667969, -0.005609989166259766, -0.0053043365478515625, -0.004998683929443359, -0.004693031311035156, -0.004387378692626953, -0.00408172607421875, -0.003776073455810547, -0.0034704208374023438, -0.0031647682189941406, -0.0028591156005859375, -0.0025534629821777344, -0.0022478103637695312, -0.0019421577453613281, -0.001636505126953125, -0.0013308525085449219, -0.0010251998901367188, -0.0007195472717285156, -0.0004138946533203125, -0.00010824203491210938, 0.00019741058349609375, 0.0005030632019042969, 0.0008087158203125, 0.0011143684387207031, 0.0014200210571289062, 0.0017256736755371094, 0.0020313262939453125, 0.0023369789123535156, 0.0026426315307617188, 0.002948284149169922, 0.003253936767578125, 0.003559589385986328, 0.0038652420043945312, 0.004170894622802734, 0.0044765472412109375, 0.004782199859619141, 0.005087852478027344, 0.005393505096435547, 0.00569915771484375, 0.006004810333251953, 0.006310462951660156, 0.006616115570068359, 0.0069217681884765625, 0.007227420806884766, 0.007533073425292969, 0.007838726043701172, 0.008144378662109375, 0.008450031280517578, 0.008755683898925781, 0.009061336517333984, 0.009366989135742188, 0.00967264175415039, 0.009978294372558594, 0.010283946990966797, 0.010589599609375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 6.0, 2.0, 4.0, 16.0, 5.0, 10.0, 6.0, 15.0, 56.0, 116.0, 271.0, 227.0, 116.0, 39.0, 12.0, 7.0, 12.0, 10.0, 9.0, 5.0, 6.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007396697998046875, -0.007134854793548584, -0.006873011589050293, -0.006611168384552002, -0.006349325180053711, -0.00608748197555542, -0.005825638771057129, -0.005563795566558838, -0.005301952362060547, -0.005040109157562256, -0.004778265953063965, -0.004516422748565674, -0.004254579544067383, -0.003992736339569092, -0.0037308931350708008, -0.0034690499305725098, -0.0032072067260742188, -0.0029453635215759277, -0.0026835203170776367, -0.0024216771125793457, -0.0021598339080810547, -0.0018979907035827637, -0.0016361474990844727, -0.0013743042945861816, -0.0011124610900878906, -0.0008506178855895996, -0.0005887746810913086, -0.0003269314765930176, -6.508827209472656e-05, 0.00019675493240356445, 0.00045859813690185547, 0.0007204413414001465, 0.0009822845458984375, 0.0012441277503967285, 0.0015059709548950195, 0.0017678141593933105, 0.0020296573638916016, 0.0022915005683898926, 0.0025533437728881836, 0.0028151869773864746, 0.0030770301818847656, 0.0033388733863830566, 0.0036007165908813477, 0.0038625597953796387, 0.00412440299987793, 0.004386246204376221, 0.004648089408874512, 0.004909932613372803, 0.005171775817871094, 0.005433619022369385, 0.005695462226867676, 0.005957305431365967, 0.006219148635864258, 0.006480991840362549, 0.00674283504486084, 0.007004678249359131, 0.007266521453857422, 0.007528364658355713, 0.007790207862854004, 0.008052051067352295, 0.008313894271850586, 0.008575737476348877, 0.008837580680847168, 0.009099423885345459, 0.00936126708984375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 8.0, 6.0, 8.0, 11.0, 12.0, 15.0, 9.0, 27.0, 40.0, 44.0, 48.0, 78.0, 101.0, 130.0, 224.0, 338.0, 583.0, 1389.0, 11482.0, 988220.0, 41750.0, 2018.0, 747.0, 397.0, 245.0, 143.0, 110.0, 95.0, 61.0, 43.0, 36.0, 36.0, 22.0, 17.0, 12.0, 13.0, 9.0, 10.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02239990234375, -0.02158975601196289, -0.02077960968017578, -0.019969463348388672, -0.019159317016601562, -0.018349170684814453, -0.017539024353027344, -0.016728878021240234, -0.015918731689453125, -0.015108585357666016, -0.014298439025878906, -0.013488292694091797, -0.012678146362304688, -0.011868000030517578, -0.011057853698730469, -0.01024770736694336, -0.00943756103515625, -0.00862741470336914, -0.007817268371582031, -0.007007122039794922, -0.0061969757080078125, -0.005386829376220703, -0.004576683044433594, -0.0037665367126464844, -0.002956390380859375, -0.0021462440490722656, -0.0013360977172851562, -0.0005259513854980469, 0.0002841949462890625, 0.0010943412780761719, 0.0019044876098632812, 0.0027146339416503906, 0.0035247802734375, 0.004334926605224609, 0.005145072937011719, 0.005955219268798828, 0.0067653656005859375, 0.007575511932373047, 0.008385658264160156, 0.009195804595947266, 0.010005950927734375, 0.010816097259521484, 0.011626243591308594, 0.012436389923095703, 0.013246536254882812, 0.014056682586669922, 0.014866828918457031, 0.01567697525024414, 0.01648712158203125, 0.01729726791381836, 0.01810741424560547, 0.018917560577392578, 0.019727706909179688, 0.020537853240966797, 0.021347999572753906, 0.022158145904541016, 0.022968292236328125, 0.023778438568115234, 0.024588584899902344, 0.025398731231689453, 0.026208877563476562, 0.027019023895263672, 0.02782917022705078, 0.02863931655883789, 0.029449462890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 8.0, 10.0, 8.0, 11.0, 5.0, 14.0, 24.0, 25.0, 21.0, 32.0, 31.0, 34.0, 53.0, 46.0, 47.0, 42.0, 47.0, 49.0, 41.0, 35.0, 34.0, 42.0, 38.0, 42.0, 41.0, 42.0, 31.0, 28.0, 16.0, 23.0, 16.0, 9.0, 11.0, 11.0, 7.0, 10.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0197296142578125, -0.01901698112487793, -0.01830434799194336, -0.01759171485900879, -0.01687908172607422, -0.01616644859313965, -0.015453815460205078, -0.014741182327270508, -0.014028549194335938, -0.013315916061401367, -0.012603282928466797, -0.011890649795532227, -0.011178016662597656, -0.010465383529663086, -0.009752750396728516, -0.009040117263793945, -0.008327484130859375, -0.007614850997924805, -0.006902217864990234, -0.006189584732055664, -0.005476951599121094, -0.0047643184661865234, -0.004051685333251953, -0.003339052200317383, -0.0026264190673828125, -0.0019137859344482422, -0.0012011528015136719, -0.0004885196685791016, 0.00022411346435546875, 0.0009367465972900391, 0.0016493797302246094, 0.0023620128631591797, 0.00307464599609375, 0.0037872791290283203, 0.004499912261962891, 0.005212545394897461, 0.005925178527832031, 0.0066378116607666016, 0.007350444793701172, 0.008063077926635742, 0.008775711059570312, 0.009488344192504883, 0.010200977325439453, 0.010913610458374023, 0.011626243591308594, 0.012338876724243164, 0.013051509857177734, 0.013764142990112305, 0.014476776123046875, 0.015189409255981445, 0.015902042388916016, 0.016614675521850586, 0.017327308654785156, 0.018039941787719727, 0.018752574920654297, 0.019465208053588867, 0.020177841186523438, 0.020890474319458008, 0.021603107452392578, 0.02231574058532715, 0.02302837371826172, 0.02374100685119629, 0.02445363998413086, 0.02516627311706543, 0.02587890625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 5.0, 4.0, 2.0, 4.0, 4.0, 1.0, 3.0, 7.0, 6.0, 14.0, 12.0, 21.0, 36.0, 32.0, 53.0, 56.0, 87.0, 166.0, 356.0, 865.0, 1357.0, 6704.0, 53288.0, 922044.0, 53612.0, 6699.0, 1347.0, 909.0, 323.0, 172.0, 113.0, 51.0, 54.0, 45.0, 22.0, 18.0, 5.0, 13.0, 8.0, 8.0, 8.0, 9.0, 1.0, 8.0, 2.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.781650543212891e-06, -5.6140124797821045e-06, -5.446374416351318e-06, -5.278736352920532e-06, -5.111098289489746e-06, -4.94346022605896e-06, -4.775822162628174e-06, -4.608184099197388e-06, -4.4405460357666016e-06, -4.2729079723358154e-06, -4.105269908905029e-06, -3.937631845474243e-06, -3.769993782043457e-06, -3.602355718612671e-06, -3.4347176551818848e-06, -3.2670795917510986e-06, -3.0994415283203125e-06, -2.9318034648895264e-06, -2.7641654014587402e-06, -2.596527338027954e-06, -2.428889274597168e-06, -2.261251211166382e-06, -2.0936131477355957e-06, -1.9259750843048096e-06, -1.7583370208740234e-06, -1.5906989574432373e-06, -1.4230608940124512e-06, -1.255422830581665e-06, -1.087784767150879e-06, -9.201467037200928e-07, -7.525086402893066e-07, -5.848705768585205e-07, -4.172325134277344e-07, -2.4959444999694824e-07, -8.195638656616211e-08, 8.568167686462402e-08, 2.5331974029541016e-07, 4.209578037261963e-07, 5.885958671569824e-07, 7.562339305877686e-07, 9.238719940185547e-07, 1.0915100574493408e-06, 1.259148120880127e-06, 1.426786184310913e-06, 1.5944242477416992e-06, 1.7620623111724854e-06, 1.9297003746032715e-06, 2.0973384380340576e-06, 2.2649765014648438e-06, 2.43261456489563e-06, 2.600252628326416e-06, 2.767890691757202e-06, 2.9355287551879883e-06, 3.1031668186187744e-06, 3.2708048820495605e-06, 3.4384429454803467e-06, 3.606081008911133e-06, 3.773719072341919e-06, 3.941357135772705e-06, 4.108995199203491e-06, 4.276633262634277e-06, 4.4442713260650635e-06, 4.61190938949585e-06, 4.779547452926636e-06, 4.947185516357422e-06]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 3.0, 5.0, 7.0, 8.0, 9.0, 16.0, 16.0, 10.0, 17.0, 34.0, 25.0, 31.0, 39.0, 79.0, 51.0, 52.0, 77.0, 95.0, 58.0, 83.0, 44.0, 37.0, 22.0, 33.0, 16.0, 32.0, 17.0, 13.0, 10.0, 8.0, 6.0, 8.0, 4.0, 3.0, 4.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0], "bins": [-4.947185516357422e-06, -4.81773167848587e-06, -4.688277840614319e-06, -4.558824002742767e-06, -4.429370164871216e-06, -4.299916326999664e-06, -4.170462489128113e-06, -4.041008651256561e-06, -3.91155481338501e-06, -3.7821009755134583e-06, -3.6526471376419067e-06, -3.5231932997703552e-06, -3.3937394618988037e-06, -3.264285624027252e-06, -3.1348317861557007e-06, -3.005377948284149e-06, -2.8759241104125977e-06, -2.746470272541046e-06, -2.6170164346694946e-06, -2.487562596797943e-06, -2.3581087589263916e-06, -2.22865492105484e-06, -2.0992010831832886e-06, -1.969747245311737e-06, -1.8402934074401855e-06, -1.710839569568634e-06, -1.5813857316970825e-06, -1.451931893825531e-06, -1.3224780559539795e-06, -1.193024218082428e-06, -1.0635703802108765e-06, -9.34116542339325e-07, -8.046627044677734e-07, -6.752088665962219e-07, -5.457550287246704e-07, -4.163011908531189e-07, -2.868473529815674e-07, -1.5739351511001587e-07, -2.7939677238464355e-08, 1.0151416063308716e-07, 2.3096799850463867e-07, 3.604218363761902e-07, 4.898756742477417e-07, 6.193295121192932e-07, 7.487833499908447e-07, 8.782371878623962e-07, 1.0076910257339478e-06, 1.1371448636054993e-06, 1.2665987014770508e-06, 1.3960525393486023e-06, 1.5255063772201538e-06, 1.6549602150917053e-06, 1.7844140529632568e-06, 1.9138678908348083e-06, 2.04332172870636e-06, 2.1727755665779114e-06, 2.302229404449463e-06, 2.4316832423210144e-06, 2.561137080192566e-06, 2.6905909180641174e-06, 2.820044755935669e-06, 2.9494985938072205e-06, 3.078952431678772e-06, 3.2084062695503235e-06, 3.337860107421875e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 10.0, 15.0, 23.0, 28.0, 36.0, 85.0, 202.0, 820.0, 78333.0, 967444.0, 1094.0, 206.0, 100.0, 42.0, 32.0, 20.0, 12.0, 12.0, 6.0, 1.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.1517276763916016e-05, -2.0920298993587494e-05, -2.0323321223258972e-05, -1.972634345293045e-05, -1.912936568260193e-05, -1.8532387912273407e-05, -1.7935410141944885e-05, -1.7338432371616364e-05, -1.6741454601287842e-05, -1.614447683095932e-05, -1.55474990606308e-05, -1.4950521290302277e-05, -1.4353543519973755e-05, -1.3756565749645233e-05, -1.3159587979316711e-05, -1.256261020898819e-05, -1.1965632438659668e-05, -1.1368654668331146e-05, -1.0771676898002625e-05, -1.0174699127674103e-05, -9.577721357345581e-06, -8.98074358701706e-06, -8.383765816688538e-06, -7.786788046360016e-06, -7.189810276031494e-06, -6.592832505702972e-06, -5.995854735374451e-06, -5.398876965045929e-06, -4.801899194717407e-06, -4.2049214243888855e-06, -3.6079436540603638e-06, -3.010965883731842e-06, -2.4139881134033203e-06, -1.8170103430747986e-06, -1.2200325727462769e-06, -6.230548024177551e-07, -2.60770320892334e-08, 5.709007382392883e-07, 1.16787850856781e-06, 1.7648562788963318e-06, 2.3618340492248535e-06, 2.9588118195533752e-06, 3.555789589881897e-06, 4.152767360210419e-06, 4.7497451305389404e-06, 5.346722900867462e-06, 5.943700671195984e-06, 6.540678441524506e-06, 7.137656211853027e-06, 7.734633982181549e-06, 8.33161175251007e-06, 8.928589522838593e-06, 9.525567293167114e-06, 1.0122545063495636e-05, 1.0719522833824158e-05, 1.131650060415268e-05, 1.1913478374481201e-05, 1.2510456144809723e-05, 1.3107433915138245e-05, 1.3704411685466766e-05, 1.4301389455795288e-05, 1.489836722612381e-05, 1.549534499645233e-05, 1.6092322766780853e-05, 1.6689300537109375e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 10.0, 3.0, 10.0, 25.0, 34.0, 55.0, 103.0, 544.0, 74.0, 47.0, 32.0, 17.0, 9.0, 5.0, 4.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.901388168334961e-05, -1.848861575126648e-05, -1.796334981918335e-05, -1.743808388710022e-05, -1.691281795501709e-05, -1.638755202293396e-05, -1.586228609085083e-05, -1.53370201587677e-05, -1.481175422668457e-05, -1.428648829460144e-05, -1.376122236251831e-05, -1.323595643043518e-05, -1.271069049835205e-05, -1.2185424566268921e-05, -1.1660158634185791e-05, -1.1134892702102661e-05, -1.0609626770019531e-05, -1.0084360837936401e-05, -9.559094905853271e-06, -9.033828973770142e-06, -8.508563041687012e-06, -7.983297109603882e-06, -7.458031177520752e-06, -6.932765245437622e-06, -6.407499313354492e-06, -5.882233381271362e-06, -5.356967449188232e-06, -4.8317015171051025e-06, -4.306435585021973e-06, -3.7811696529388428e-06, -3.255903720855713e-06, -2.730637788772583e-06, -2.205371856689453e-06, -1.6801059246063232e-06, -1.1548399925231934e-06, -6.295740604400635e-07, -1.043081283569336e-07, 4.209578037261963e-07, 9.462237358093262e-07, 1.471489667892456e-06, 1.996755599975586e-06, 2.522021532058716e-06, 3.0472874641418457e-06, 3.5725533962249756e-06, 4.0978193283081055e-06, 4.623085260391235e-06, 5.148351192474365e-06, 5.673617124557495e-06, 6.198883056640625e-06, 6.724148988723755e-06, 7.249414920806885e-06, 7.774680852890015e-06, 8.299946784973145e-06, 8.825212717056274e-06, 9.350478649139404e-06, 9.875744581222534e-06, 1.0401010513305664e-05, 1.0926276445388794e-05, 1.1451542377471924e-05, 1.1976808309555054e-05, 1.2502074241638184e-05, 1.3027340173721313e-05, 1.3552606105804443e-05, 1.4077872037887573e-05, 1.4603137969970703e-05]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 11.0, 35.0, 240.0, 634.0, 78.0, 12.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.20908275246620178, -0.20536312460899353, -0.20164349675178528, -0.19792388379573822, -0.19420425593852997, -0.19048462808132172, -0.18676500022411346, -0.1830453723669052, -0.17932575941085815, -0.1756061315536499, -0.17188650369644165, -0.1681668907403946, -0.16444726288318634, -0.1607276350259781, -0.15700800716876984, -0.15328837931156158, -0.14956875145435333, -0.14584912359714508, -0.14212949573993683, -0.13840988278388977, -0.13469025492668152, -0.13097062706947327, -0.12725099921226501, -0.12353137880563736, -0.1198117583990097, -0.11609213054180145, -0.1123725101351738, -0.10865288227796555, -0.10493326187133789, -0.10121363401412964, -0.09749400615692139, -0.09377438575029373, -0.09005476534366608, -0.08633513748645782, -0.08261551707983017, -0.07889588922262192, -0.07517626881599426, -0.07145664095878601, -0.06773701310157776, -0.0640173926949501, -0.06029776483774185, -0.0565781407058239, -0.052858516573905945, -0.04913888871669769, -0.04541926458477974, -0.041699640452861786, -0.03798001632094383, -0.03426039218902588, -0.030540764331817627, -0.026821140199899673, -0.02310151420533657, -0.019381890073418617, -0.015662264078855515, -0.011942639946937561, -0.008223015815019608, -0.004503389820456505, -0.0007837656885385513, 0.002935859141871333, 0.006655483972281218, 0.010375108569860458, 0.014094733633100986, 0.017814358696341515, 0.021533982828259468, 0.02525360882282257, 0.028973232954740524]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 7.0, 3.0, 5.0, 8.0, 12.0, 14.0, 8.0, 17.0, 20.0, 24.0, 20.0, 37.0, 33.0, 36.0, 38.0, 42.0, 44.0, 39.0, 46.0, 48.0, 44.0, 45.0, 53.0, 35.0, 45.0, 34.0, 37.0, 32.0, 30.0, 31.0, 29.0, 17.0, 21.0, 11.0, 13.0, 5.0, 3.0, 5.0, 6.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1010514497756958, -0.09765557199716568, -0.09425970166921616, -0.09086382389068604, -0.08746795356273651, -0.08407207578420639, -0.08067619800567627, -0.07728032767772675, -0.07388444989919662, -0.0704885721206665, -0.06709270179271698, -0.06369682401418686, -0.06030094996094704, -0.056905075907707214, -0.053509198129177094, -0.05011332407593727, -0.04671745002269745, -0.043321575969457626, -0.039925701916217804, -0.03652982413768768, -0.03313395008444786, -0.02973807603120804, -0.026342200115323067, -0.022946324199438095, -0.019550450146198273, -0.01615457609295845, -0.012758700177073479, -0.009362825192511082, -0.005966950207948685, -0.0025710761547088623, 0.0008247997611761093, 0.004220675677061081, 0.007616549730300903, 0.0110124247148633, 0.014408299699425697, 0.01780417561531067, 0.02120004966855049, 0.024595923721790314, 0.027991799637675285, 0.03138767555356026, 0.03478354960680008, 0.0381794236600399, 0.041575297713279724, 0.044971175491809845, 0.04836704954504967, 0.05176292359828949, 0.05515880137681961, 0.05855467543005943, 0.061950549483299255, 0.06534642726182938, 0.0687422975897789, 0.07213817536830902, 0.07553404569625854, 0.07892992347478867, 0.08232580125331879, 0.08572167158126831, 0.08911754935979843, 0.09251342713832855, 0.09590929746627808, 0.0993051752448082, 0.10270105302333832, 0.10609692335128784, 0.10949280112981796, 0.11288867890834808, 0.11628454923629761]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 2.0, 3.0, 14.0, 9.0, 8.0, 9.0, 18.0, 72.0, 166.0, 1615.0, 4191893.0, 244.0, 84.0, 29.0, 15.0, 14.0, 6.0, 12.0, 5.0, 5.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07489013671875, -0.07224273681640625, -0.0695953369140625, -0.06694793701171875, -0.064300537109375, -0.06165313720703125, -0.0590057373046875, -0.05635833740234375, -0.0537109375, -0.05106353759765625, -0.0484161376953125, -0.04576873779296875, -0.043121337890625, -0.04047393798828125, -0.0378265380859375, -0.03517913818359375, -0.03253173828125, -0.02988433837890625, -0.0272369384765625, -0.02458953857421875, -0.021942138671875, -0.01929473876953125, -0.0166473388671875, -0.01399993896484375, -0.0113525390625, -0.00870513916015625, -0.0060577392578125, -0.00341033935546875, -0.000762939453125, 0.00188446044921875, 0.0045318603515625, 0.00717926025390625, 0.00982666015625, 0.01247406005859375, 0.0151214599609375, 0.01776885986328125, 0.020416259765625, 0.02306365966796875, 0.0257110595703125, 0.02835845947265625, 0.031005859375, 0.03365325927734375, 0.0363006591796875, 0.03894805908203125, 0.041595458984375, 0.04424285888671875, 0.0468902587890625, 0.04953765869140625, 0.05218505859375, 0.05483245849609375, 0.0574798583984375, 0.06012725830078125, 0.062774658203125, 0.06542205810546875, 0.0680694580078125, 0.07071685791015625, 0.0733642578125, 0.07601165771484375, 0.0786590576171875, 0.08130645751953125, 0.083953857421875, 0.08660125732421875, 0.0892486572265625, 0.09189605712890625, 0.09454345703125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 6.0, 1.0, 4.0, 12.0, 10.0, 9.0, 7.0, 15.0, 40.0, 119.0, 228.0, 256.0, 131.0, 47.0, 14.0, 8.0, 11.0, 9.0, 11.0, 5.0, 5.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00737762451171875, -0.0071179866790771484, -0.006858348846435547, -0.006598711013793945, -0.006339073181152344, -0.006079435348510742, -0.005819797515869141, -0.005560159683227539, -0.0053005218505859375, -0.005040884017944336, -0.004781246185302734, -0.004521608352661133, -0.004261970520019531, -0.00400233268737793, -0.003742694854736328, -0.0034830570220947266, -0.003223419189453125, -0.0029637813568115234, -0.002704143524169922, -0.0024445056915283203, -0.0021848678588867188, -0.0019252300262451172, -0.0016655921936035156, -0.001405954360961914, -0.0011463165283203125, -0.0008866786956787109, -0.0006270408630371094, -0.0003674030303955078, -0.00010776519775390625, 0.0001518726348876953, 0.0004115104675292969, 0.0006711483001708984, 0.0009307861328125, 0.0011904239654541016, 0.0014500617980957031, 0.0017096996307373047, 0.0019693374633789062, 0.002228975296020508, 0.0024886131286621094, 0.002748250961303711, 0.0030078887939453125, 0.003267526626586914, 0.0035271644592285156, 0.003786802291870117, 0.004046440124511719, 0.00430607795715332, 0.004565715789794922, 0.0048253536224365234, 0.005084991455078125, 0.0053446292877197266, 0.005604267120361328, 0.00586390495300293, 0.006123542785644531, 0.006383180618286133, 0.006642818450927734, 0.006902456283569336, 0.0071620941162109375, 0.007421731948852539, 0.007681369781494141, 0.007941007614135742, 0.008200645446777344, 0.008460283279418945, 0.008719921112060547, 0.008979558944702148, 0.00923919677734375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 5.0, 13.0, 38.0, 117.0, 422.0, 1267.0, 81219.0, 4109075.0, 1471.0, 421.0, 126.0, 58.0, 21.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0125732421875, -0.01220393180847168, -0.01183462142944336, -0.011465311050415039, -0.011096000671386719, -0.010726690292358398, -0.010357379913330078, -0.009988069534301758, -0.009618759155273438, -0.009249448776245117, -0.008880138397216797, -0.008510828018188477, -0.008141517639160156, -0.007772207260131836, -0.007402896881103516, -0.007033586502075195, -0.006664276123046875, -0.006294965744018555, -0.005925655364990234, -0.005556344985961914, -0.005187034606933594, -0.0048177242279052734, -0.004448413848876953, -0.004079103469848633, -0.0037097930908203125, -0.003340482711791992, -0.002971172332763672, -0.0026018619537353516, -0.0022325515747070312, -0.001863241195678711, -0.0014939308166503906, -0.0011246204376220703, -0.00075531005859375, -0.0003859996795654297, -1.6689300537109375e-05, 0.00035262107849121094, 0.0007219314575195312, 0.0010912418365478516, 0.0014605522155761719, 0.0018298625946044922, 0.0021991729736328125, 0.002568483352661133, 0.002937793731689453, 0.0033071041107177734, 0.0036764144897460938, 0.004045724868774414, 0.004415035247802734, 0.004784345626831055, 0.005153656005859375, 0.005522966384887695, 0.005892276763916016, 0.006261587142944336, 0.006630897521972656, 0.0070002079010009766, 0.007369518280029297, 0.007738828659057617, 0.008108139038085938, 0.008477449417114258, 0.008846759796142578, 0.009216070175170898, 0.009585380554199219, 0.009954690933227539, 0.01032400131225586, 0.01069331169128418, 0.0110626220703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 16.0, 36.0, 155.0, 3775.0, 51.0, 17.0, 5.0, 6.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028514862060546875, -0.002742379903793335, -0.0026332736015319824, -0.00252416729927063, -0.0024150609970092773, -0.002305954694747925, -0.0021968483924865723, -0.0020877420902252197, -0.001978635787963867, -0.0018695294857025146, -0.0017604231834411621, -0.0016513168811798096, -0.001542210578918457, -0.0014331042766571045, -0.001323997974395752, -0.0012148916721343994, -0.0011057853698730469, -0.0009966790676116943, -0.0008875727653503418, -0.0007784664630889893, -0.0006693601608276367, -0.0005602538585662842, -0.00045114755630493164, -0.0003420412540435791, -0.00023293495178222656, -0.00012382864952087402, -1.4722347259521484e-05, 9.438395500183105e-05, 0.0002034902572631836, 0.00031259655952453613, 0.00042170286178588867, 0.0005308091640472412, 0.0006399154663085938, 0.0007490217685699463, 0.0008581280708312988, 0.0009672343730926514, 0.001076340675354004, 0.0011854469776153564, 0.001294553279876709, 0.0014036595821380615, 0.001512765884399414, 0.0016218721866607666, 0.0017309784889221191, 0.0018400847911834717, 0.0019491910934448242, 0.0020582973957061768, 0.0021674036979675293, 0.002276510000228882, 0.0023856163024902344, 0.002494722604751587, 0.0026038289070129395, 0.002712935209274292, 0.0028220415115356445, 0.002931147813796997, 0.0030402541160583496, 0.003149360418319702, 0.0032584667205810547, 0.0033675730228424072, 0.0034766793251037598, 0.0035857856273651123, 0.003694891929626465, 0.0038039982318878174, 0.00391310453414917, 0.0040222108364105225, 0.004131317138671875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1001.0, 17.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001215107156895101, 0.0004822030896320939, 0.002179513219743967, 0.003876823466271162, 0.005574133712798357, 0.007271443959325552, 0.008968754671514034, 0.01066606491804123, 0.012363375164568424, 0.01406068541109562, 0.01575799658894539, 0.01745530590415001, 0.01915261521935463, 0.0208499263972044, 0.02254723757505417, 0.02424454689025879, 0.02594185620546341, 0.02763916552066803, 0.0293364766985178, 0.03103378787636757, 0.03273109719157219, 0.03442840650677681, 0.03612571954727173, 0.03782302886247635, 0.03952033817768097, 0.04121764749288559, 0.04291495680809021, 0.04461226984858513, 0.04630957916378975, 0.04800688847899437, 0.04970420151948929, 0.05140151083469391, 0.05309882014989853, 0.05479612946510315, 0.05649343878030777, 0.05819075182080269, 0.05988806113600731, 0.06158537045121193, 0.06328268349170685, 0.06497999280691147, 0.06667730212211609, 0.06837461143732071, 0.07007192075252533, 0.07176923006772995, 0.07346653938293457, 0.07516385614871979, 0.07686116546392441, 0.07855847477912903, 0.08025578409433365, 0.08195309340953827, 0.08365040272474289, 0.08534771203994751, 0.08704502880573273, 0.08874233812093735, 0.09043964743614197, 0.09213695675134659, 0.09383426606655121, 0.09553157538175583, 0.09722888469696045, 0.09892619401216507, 0.10062350332736969, 0.10232082009315491, 0.10401812940835953, 0.10571543872356415, 0.10741274803876877]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 8.0, 10.0, 14.0, 29.0, 43.0, 63.0, 57.0, 91.0, 90.0, 112.0, 83.0, 92.0, 84.0, 73.0, 52.0, 33.0, 22.0, 19.0, 12.0, 2.0, 5.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006871998310089111, -0.006643389351665974, -0.006414780393242836, -0.006186171434819698, -0.005957562476396561, -0.005728953517973423, -0.005500344559550285, -0.005271735601127148, -0.00504312664270401, -0.004814517684280872, -0.004585908725857735, -0.004357299767434597, -0.004128690809011459, -0.0039000818505883217, -0.003671472892165184, -0.0034428639337420464, -0.0032142549753189087, -0.002985646016895771, -0.0027570370584726334, -0.0025284281000494957, -0.002299819141626358, -0.0020712101832032204, -0.0018426012247800827, -0.001613992266356945, -0.0013853833079338074, -0.0011567743495106697, -0.000928165391087532, -0.0006995564326643944, -0.0004709474742412567, -0.00024233851581811905, -1.3729557394981384e-05, 0.00021487940102815628, 0.00044348835945129395, 0.0006720973178744316, 0.0009007062762975693, 0.001129315234720707, 0.0013579241931438446, 0.0015865331515669823, 0.00181514210999012, 0.0020437510684132576, 0.0022723600268363953, 0.002500968985259533, 0.0027295779436826706, 0.0029581869021058083, 0.003186795860528946, 0.0034154048189520836, 0.0036440137773752213, 0.003872622735798359, 0.004101231694221497, 0.004329840652644634, 0.004558449611067772, 0.00478705856949091, 0.005015667527914047, 0.005244276486337185, 0.005472885444760323, 0.00570149440318346, 0.005930103361606598, 0.0061587123200297356, 0.006387321278452873, 0.006615930236876011, 0.0068445391952991486, 0.007073148153722286, 0.007301757112145424, 0.0075303660705685616, 0.007758975028991699]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 7.0, 13.0, 14.0, 17.0, 27.0, 25.0, 54.0, 69.0, 89.0, 164.0, 229.0, 364.0, 529.0, 855.0, 1397.0, 2572.0, 4858.0, 10688.0, 37155.0, 900380.0, 62487.0, 13481.0, 5897.0, 2922.0, 1634.0, 950.0, 595.0, 356.0, 234.0, 159.0, 104.0, 74.0, 55.0, 25.0, 23.0, 19.0, 7.0, 9.0, 5.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0219573974609375, -0.02134084701538086, -0.02072429656982422, -0.020107746124267578, -0.019491195678710938, -0.018874645233154297, -0.018258094787597656, -0.017641544342041016, -0.017024993896484375, -0.016408443450927734, -0.015791893005371094, -0.015175342559814453, -0.014558792114257812, -0.013942241668701172, -0.013325691223144531, -0.01270914077758789, -0.01209259033203125, -0.01147603988647461, -0.010859489440917969, -0.010242938995361328, -0.009626388549804688, -0.009009838104248047, -0.008393287658691406, -0.007776737213134766, -0.007160186767578125, -0.006543636322021484, -0.005927085876464844, -0.005310535430908203, -0.0046939849853515625, -0.004077434539794922, -0.0034608840942382812, -0.0028443336486816406, -0.002227783203125, -0.0016112327575683594, -0.0009946823120117188, -0.0003781318664550781, 0.0002384185791015625, 0.0008549690246582031, 0.0014715194702148438, 0.0020880699157714844, 0.002704620361328125, 0.0033211708068847656, 0.003937721252441406, 0.004554271697998047, 0.0051708221435546875, 0.005787372589111328, 0.006403923034667969, 0.007020473480224609, 0.00763702392578125, 0.00825357437133789, 0.008870124816894531, 0.009486675262451172, 0.010103225708007812, 0.010719776153564453, 0.011336326599121094, 0.011952877044677734, 0.012569427490234375, 0.013185977935791016, 0.013802528381347656, 0.014419078826904297, 0.015035629272460938, 0.015652179718017578, 0.01626873016357422, 0.01688528060913086, 0.0175018310546875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 6.0, 1.0, 4.0, 12.0, 10.0, 9.0, 7.0, 15.0, 41.0, 118.0, 230.0, 255.0, 131.0, 46.0, 14.0, 8.0, 10.0, 10.0, 11.0, 5.0, 5.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007373809814453125, -0.007114231586456299, -0.006854653358459473, -0.0065950751304626465, -0.00633549690246582, -0.006075918674468994, -0.005816340446472168, -0.005556762218475342, -0.005297183990478516, -0.0050376057624816895, -0.004778027534484863, -0.004518449306488037, -0.004258871078491211, -0.003999292850494385, -0.0037397146224975586, -0.0034801363945007324, -0.0032205581665039062, -0.00296097993850708, -0.002701401710510254, -0.0024418234825134277, -0.0021822452545166016, -0.0019226670265197754, -0.0016630887985229492, -0.001403510570526123, -0.0011439323425292969, -0.0008843541145324707, -0.0006247758865356445, -0.00036519765853881836, -0.00010561943054199219, 0.00015395879745483398, 0.00041353702545166016, 0.0006731152534484863, 0.0009326934814453125, 0.0011922717094421387, 0.0014518499374389648, 0.001711428165435791, 0.001971006393432617, 0.0022305846214294434, 0.0024901628494262695, 0.0027497410774230957, 0.003009319305419922, 0.003268897533416748, 0.0035284757614135742, 0.0037880539894104004, 0.0040476322174072266, 0.004307210445404053, 0.004566788673400879, 0.004826366901397705, 0.005085945129394531, 0.005345523357391357, 0.005605101585388184, 0.00586467981338501, 0.006124258041381836, 0.006383836269378662, 0.006643414497375488, 0.0069029927253723145, 0.007162570953369141, 0.007422149181365967, 0.007681727409362793, 0.00794130563735962, 0.008200883865356445, 0.008460462093353271, 0.008720040321350098, 0.008979618549346924, 0.00923919677734375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 6.0, 3.0, 4.0, 7.0, 11.0, 12.0, 17.0, 23.0, 26.0, 33.0, 27.0, 40.0, 55.0, 63.0, 90.0, 138.0, 244.0, 404.0, 768.0, 1681.0, 9253.0, 1018456.0, 13366.0, 1790.0, 783.0, 422.0, 241.0, 154.0, 104.0, 96.0, 50.0, 33.0, 34.0, 27.0, 20.0, 17.0, 12.0, 10.0, 7.0, 11.0, 2.0, 4.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03839111328125, -0.03721141815185547, -0.03603172302246094, -0.034852027893066406, -0.033672332763671875, -0.032492637634277344, -0.03131294250488281, -0.03013324737548828, -0.02895355224609375, -0.02777385711669922, -0.026594161987304688, -0.025414466857910156, -0.024234771728515625, -0.023055076599121094, -0.021875381469726562, -0.02069568634033203, -0.0195159912109375, -0.01833629608154297, -0.017156600952148438, -0.015976905822753906, -0.014797210693359375, -0.013617515563964844, -0.012437820434570312, -0.011258125305175781, -0.01007843017578125, -0.008898735046386719, -0.0077190399169921875, -0.006539344787597656, -0.005359649658203125, -0.004179954528808594, -0.0030002593994140625, -0.0018205642700195312, -0.000640869140625, 0.0005388259887695312, 0.0017185211181640625, 0.0028982162475585938, 0.004077911376953125, 0.005257606506347656, 0.0064373016357421875, 0.007616996765136719, 0.00879669189453125, 0.009976387023925781, 0.011156082153320312, 0.012335777282714844, 0.013515472412109375, 0.014695167541503906, 0.015874862670898438, 0.01705455780029297, 0.0182342529296875, 0.01941394805908203, 0.020593643188476562, 0.021773338317871094, 0.022953033447265625, 0.024132728576660156, 0.025312423706054688, 0.02649211883544922, 0.02767181396484375, 0.02885150909423828, 0.030031204223632812, 0.031210899353027344, 0.032390594482421875, 0.033570289611816406, 0.03474998474121094, 0.03592967987060547, 0.037109375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 6.0, 3.0, 2.0, 9.0, 11.0, 11.0, 16.0, 23.0, 24.0, 27.0, 21.0, 31.0, 25.0, 34.0, 32.0, 30.0, 35.0, 37.0, 32.0, 39.0, 48.0, 45.0, 29.0, 51.0, 27.0, 41.0, 33.0, 25.0, 37.0, 41.0, 25.0, 25.0, 23.0, 19.0, 15.0, 17.0, 11.0, 8.0, 6.0, 12.0, 2.0, 3.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0205078125, -0.019878387451171875, -0.01924896240234375, -0.018619537353515625, -0.0179901123046875, -0.017360687255859375, -0.01673126220703125, -0.016101837158203125, -0.015472412109375, -0.014842987060546875, -0.01421356201171875, -0.013584136962890625, -0.0129547119140625, -0.012325286865234375, -0.01169586181640625, -0.011066436767578125, -0.01043701171875, -0.009807586669921875, -0.00917816162109375, -0.008548736572265625, -0.0079193115234375, -0.007289886474609375, -0.00666046142578125, -0.006031036376953125, -0.005401611328125, -0.004772186279296875, -0.00414276123046875, -0.003513336181640625, -0.0028839111328125, -0.002254486083984375, -0.00162506103515625, -0.000995635986328125, -0.0003662109375, 0.000263214111328125, 0.00089263916015625, 0.001522064208984375, 0.0021514892578125, 0.002780914306640625, 0.00341033935546875, 0.004039764404296875, 0.004669189453125, 0.005298614501953125, 0.00592803955078125, 0.006557464599609375, 0.0071868896484375, 0.007816314697265625, 0.00844573974609375, 0.009075164794921875, 0.00970458984375, 0.010334014892578125, 0.01096343994140625, 0.011592864990234375, 0.0122222900390625, 0.012851715087890625, 0.01348114013671875, 0.014110565185546875, 0.014739990234375, 0.015369415283203125, 0.01599884033203125, 0.016628265380859375, 0.0172576904296875, 0.017887115478515625, 0.01851654052734375, 0.019145965576171875, 0.019775390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 8.0, 6.0, 8.0, 17.0, 15.0, 26.0, 59.0, 70.0, 137.0, 358.0, 1287.0, 34820.0, 1002748.0, 7744.0, 759.0, 209.0, 120.0, 53.0, 40.0, 17.0, 16.0, 9.0, 10.0, 7.0, 7.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1517276763916016e-05, -2.0829960703849792e-05, -2.014264464378357e-05, -1.9455328583717346e-05, -1.8768012523651123e-05, -1.80806964635849e-05, -1.7393380403518677e-05, -1.6706064343452454e-05, -1.601874828338623e-05, -1.5331432223320007e-05, -1.4644116163253784e-05, -1.3956800103187561e-05, -1.3269484043121338e-05, -1.2582167983055115e-05, -1.1894851922988892e-05, -1.1207535862922668e-05, -1.0520219802856445e-05, -9.832903742790222e-06, -9.145587682723999e-06, -8.458271622657776e-06, -7.770955562591553e-06, -7.08363950252533e-06, -6.3963234424591064e-06, -5.709007382392883e-06, -5.02169132232666e-06, -4.334375262260437e-06, -3.647059202194214e-06, -2.9597431421279907e-06, -2.2724270820617676e-06, -1.5851110219955444e-06, -8.977949619293213e-07, -2.1047890186309814e-07, 4.76837158203125e-07, 1.1641532182693481e-06, 1.8514692783355713e-06, 2.5387853384017944e-06, 3.2261013984680176e-06, 3.913417458534241e-06, 4.600733518600464e-06, 5.288049578666687e-06, 5.97536563873291e-06, 6.662681698799133e-06, 7.3499977588653564e-06, 8.03731381893158e-06, 8.724629878997803e-06, 9.411945939064026e-06, 1.0099261999130249e-05, 1.0786578059196472e-05, 1.1473894119262695e-05, 1.2161210179328918e-05, 1.2848526239395142e-05, 1.3535842299461365e-05, 1.4223158359527588e-05, 1.4910474419593811e-05, 1.5597790479660034e-05, 1.6285106539726257e-05, 1.697242259979248e-05, 1.7659738659858704e-05, 1.8347054719924927e-05, 1.903437077999115e-05, 1.9721686840057373e-05, 2.0409002900123596e-05, 2.109631896018982e-05, 2.1783635020256042e-05, 2.2470951080322266e-05]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 6.0, 6.0, 10.0, 11.0, 16.0, 21.0, 22.0, 30.0, 51.0, 69.0, 111.0, 116.0, 150.0, 116.0, 73.0, 57.0, 32.0, 30.0, 23.0, 15.0, 8.0, 6.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1324882507324219e-05, -1.0973773896694183e-05, -1.0622665286064148e-05, -1.0271556675434113e-05, -9.920448064804077e-06, -9.569339454174042e-06, -9.218230843544006e-06, -8.867122232913971e-06, -8.516013622283936e-06, -8.1649050116539e-06, -7.813796401023865e-06, -7.462687790393829e-06, -7.111579179763794e-06, -6.7604705691337585e-06, -6.409361958503723e-06, -6.058253347873688e-06, -5.707144737243652e-06, -5.356036126613617e-06, -5.0049275159835815e-06, -4.653818905353546e-06, -4.302710294723511e-06, -3.951601684093475e-06, -3.60049307346344e-06, -3.2493844628334045e-06, -2.898275852203369e-06, -2.5471672415733337e-06, -2.1960586309432983e-06, -1.844950020313263e-06, -1.4938414096832275e-06, -1.1427327990531921e-06, -7.916241884231567e-07, -4.4051557779312134e-07, -8.940696716308594e-08, 2.6170164346694946e-07, 6.128102540969849e-07, 9.639188647270203e-07, 1.3150274753570557e-06, 1.666136085987091e-06, 2.0172446966171265e-06, 2.368353307247162e-06, 2.7194619178771973e-06, 3.0705705285072327e-06, 3.421679139137268e-06, 3.7727877497673035e-06, 4.123896360397339e-06, 4.475004971027374e-06, 4.82611358165741e-06, 5.177222192287445e-06, 5.5283308029174805e-06, 5.879439413547516e-06, 6.230548024177551e-06, 6.581656634807587e-06, 6.932765245437622e-06, 7.2838738560676575e-06, 7.634982466697693e-06, 7.986091077327728e-06, 8.337199687957764e-06, 8.688308298587799e-06, 9.039416909217834e-06, 9.39052551984787e-06, 9.741634130477905e-06, 1.009274274110794e-05, 1.0443851351737976e-05, 1.0794959962368011e-05, 1.1146068572998047e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 5.0, 9.0, 7.0, 13.0, 24.0, 36.0, 55.0, 118.0, 333.0, 1906.0, 1043067.0, 2321.0, 365.0, 123.0, 72.0, 34.0, 23.0, 15.0, 8.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9591064453125e-05, -4.791188985109329e-05, -4.6232715249061584e-05, -4.455354064702988e-05, -4.287436604499817e-05, -4.119519144296646e-05, -3.9516016840934753e-05, -3.7836842238903046e-05, -3.615766763687134e-05, -3.447849303483963e-05, -3.279931843280792e-05, -3.1120143830776215e-05, -2.9440969228744507e-05, -2.77617946267128e-05, -2.608262002468109e-05, -2.4403445422649384e-05, -2.2724270820617676e-05, -2.1045096218585968e-05, -1.936592161655426e-05, -1.7686747014522552e-05, -1.6007572412490845e-05, -1.4328397810459137e-05, -1.264922320842743e-05, -1.0970048606395721e-05, -9.290874004364014e-06, -7.611699402332306e-06, -5.932524800300598e-06, -4.25335019826889e-06, -2.5741755962371826e-06, -8.950009942054749e-07, 7.841736078262329e-07, 2.4633482098579407e-06, 4.1425228118896484e-06, 5.821697413921356e-06, 7.500872015953064e-06, 9.180046617984772e-06, 1.085922122001648e-05, 1.2538395822048187e-05, 1.4217570424079895e-05, 1.5896745026111603e-05, 1.757591962814331e-05, 1.925509423017502e-05, 2.0934268832206726e-05, 2.2613443434238434e-05, 2.429261803627014e-05, 2.597179263830185e-05, 2.7650967240333557e-05, 2.9330141842365265e-05, 3.100931644439697e-05, 3.268849104642868e-05, 3.436766564846039e-05, 3.6046840250492096e-05, 3.7726014852523804e-05, 3.940518945455551e-05, 4.108436405658722e-05, 4.276353865861893e-05, 4.4442713260650635e-05, 4.612188786268234e-05, 4.780106246471405e-05, 4.948023706674576e-05, 5.1159411668777466e-05, 5.2838586270809174e-05, 5.451776087284088e-05, 5.619693547487259e-05, 5.78761100769043e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 4.0, 8.0, 4.0, 7.0, 11.0, 13.0, 22.0, 29.0, 55.0, 130.0, 440.0, 107.0, 65.0, 35.0, 28.0, 9.0, 12.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6524066925048828e-05, -2.5626271963119507e-05, -2.4728477001190186e-05, -2.3830682039260864e-05, -2.2932887077331543e-05, -2.203509211540222e-05, -2.11372971534729e-05, -2.023950219154358e-05, -1.9341707229614258e-05, -1.8443912267684937e-05, -1.7546117305755615e-05, -1.6648322343826294e-05, -1.5750527381896973e-05, -1.4852732419967651e-05, -1.395493745803833e-05, -1.3057142496109009e-05, -1.2159347534179688e-05, -1.1261552572250366e-05, -1.0363757610321045e-05, -9.465962648391724e-06, -8.568167686462402e-06, -7.670372724533081e-06, -6.77257776260376e-06, -5.8747828006744385e-06, -4.976987838745117e-06, -4.079192876815796e-06, -3.1813979148864746e-06, -2.2836029529571533e-06, -1.385807991027832e-06, -4.880130290985107e-07, 4.0978193283081055e-07, 1.3075768947601318e-06, 2.205371856689453e-06, 3.1031668186187744e-06, 4.000961780548096e-06, 4.898756742477417e-06, 5.796551704406738e-06, 6.6943466663360596e-06, 7.592141628265381e-06, 8.489936590194702e-06, 9.387731552124023e-06, 1.0285526514053345e-05, 1.1183321475982666e-05, 1.2081116437911987e-05, 1.2978911399841309e-05, 1.387670636177063e-05, 1.4774501323699951e-05, 1.5672296285629272e-05, 1.6570091247558594e-05, 1.7467886209487915e-05, 1.8365681171417236e-05, 1.9263476133346558e-05, 2.016127109527588e-05, 2.10590660572052e-05, 2.195686101913452e-05, 2.2854655981063843e-05, 2.3752450942993164e-05, 2.4650245904922485e-05, 2.5548040866851807e-05, 2.6445835828781128e-05, 2.734363079071045e-05, 2.824142575263977e-05, 2.9139220714569092e-05, 3.0037015676498413e-05, 3.0934810638427734e-05]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0, 121.0, 854.0, 30.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07917436212301254, -0.07066558301448822, -0.062156811356544495, -0.05364803597331047, -0.04513926059007645, -0.03663048520684242, -0.0281217098236084, -0.019612934440374374, -0.01110415905714035, -0.0025953836739063263, 0.005913391709327698, 0.014422167092561722, 0.022930942475795746, 0.03143971785902977, 0.039948493242263794, 0.04845726862549782, 0.05696604400873184, 0.06547482311725616, 0.07398359477519989, 0.08249236643314362, 0.09100114554166794, 0.09950992465019226, 0.10801869630813599, 0.11652746796607971, 0.12503623962402344, 0.13354501128196716, 0.1420537829399109, 0.1505625694990158, 0.15907134115695953, 0.16758011281490326, 0.17608889937400818, 0.1845976710319519, 0.19310647249221802, 0.20161524415016174, 0.21012401580810547, 0.2186328023672104, 0.2271415740251541, 0.23565034568309784, 0.24415913224220276, 0.2526679039001465, 0.2611766755580902, 0.26968544721603394, 0.27819421887397766, 0.2867029905319214, 0.2952117919921875, 0.3037205636501312, 0.31222933530807495, 0.3207381069660187, 0.3292468786239624, 0.33775565028190613, 0.34626442193984985, 0.3547731935977936, 0.3632819652557373, 0.3717907667160034, 0.38029953837394714, 0.38880831003189087, 0.3973170816898346, 0.4058258533477783, 0.41433462500572205, 0.42284339666366577, 0.4313521981239319, 0.4398609697818756, 0.44836974143981934, 0.45687851309776306, 0.4653872847557068]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 10.0, 10.0, 14.0, 11.0, 22.0, 24.0, 27.0, 38.0, 28.0, 39.0, 48.0, 59.0, 65.0, 50.0, 53.0, 48.0, 57.0, 54.0, 48.0, 47.0, 41.0, 36.0, 35.0, 21.0, 23.0, 22.0, 18.0, 17.0, 9.0, 2.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.15125852823257446, -0.14704565703868866, -0.14283278584480286, -0.13861992955207825, -0.13440705835819244, -0.13019418716430664, -0.12598131597042084, -0.12176844477653503, -0.11755558103322983, -0.11334270983934402, -0.10912984609603882, -0.10491697490215302, -0.10070410370826721, -0.096491239964962, -0.0922783687710762, -0.088065505027771, -0.08385263383388519, -0.07963976263999939, -0.07542689889669418, -0.07121402770280838, -0.06700116395950317, -0.06278829276561737, -0.05857542157173157, -0.05436255410313606, -0.05014968663454056, -0.04593681916594505, -0.04172395169734955, -0.037511080503463745, -0.03329821303486824, -0.029085345566272736, -0.02487247623503208, -0.020659606903791428, -0.016446739435195923, -0.012233871035277843, -0.008021002635359764, -0.0038081342354416847, 0.00040473416447639465, 0.004617601633071899, 0.008830470964312553, 0.013043340295553207, 0.017256207764148712, 0.021469075232744217, 0.02568194456398487, 0.029894813895225525, 0.03410768136382103, 0.038320548832416534, 0.04253342002630234, 0.04674628749489784, 0.05095915496349335, 0.05517202243208885, 0.05938488990068436, 0.06359776109457016, 0.06781062483787537, 0.07202349603176117, 0.07623636722564697, 0.08044923841953278, 0.08466210216283798, 0.08887497335672379, 0.09308783710002899, 0.0973007082939148, 0.1015135794878006, 0.1057264432311058, 0.10993931442499161, 0.11415217816829681, 0.11836504936218262]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 2.0, 4.0, 3.0, 9.0, 5.0, 10.0, 7.0, 12.0, 25.0, 23.0, 19.0, 41.0, 44.0, 735.0, 3518.0, 4094215.0, 93020.0, 2069.0, 274.0, 39.0, 35.0, 24.0, 28.0, 16.0, 16.0, 12.0, 10.0, 10.0, 9.0, 4.0, 8.0, 2.0, 10.0, 2.0, 4.0, 3.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0151824951171875, -0.014658451080322266, -0.014134407043457031, -0.013610363006591797, -0.013086318969726562, -0.012562274932861328, -0.012038230895996094, -0.01151418685913086, -0.010990142822265625, -0.01046609878540039, -0.009942054748535156, -0.009418010711669922, -0.008893966674804688, -0.008369922637939453, -0.007845878601074219, -0.007321834564208984, -0.00679779052734375, -0.006273746490478516, -0.005749702453613281, -0.005225658416748047, -0.0047016143798828125, -0.004177570343017578, -0.0036535263061523438, -0.0031294822692871094, -0.002605438232421875, -0.0020813941955566406, -0.0015573501586914062, -0.0010333061218261719, -0.0005092620849609375, 1.4781951904296875e-05, 0.0005388259887695312, 0.0010628700256347656, 0.0015869140625, 0.0021109580993652344, 0.0026350021362304688, 0.003159046173095703, 0.0036830902099609375, 0.004207134246826172, 0.004731178283691406, 0.005255222320556641, 0.005779266357421875, 0.006303310394287109, 0.006827354431152344, 0.007351398468017578, 0.007875442504882812, 0.008399486541748047, 0.008923530578613281, 0.009447574615478516, 0.00997161865234375, 0.010495662689208984, 0.011019706726074219, 0.011543750762939453, 0.012067794799804688, 0.012591838836669922, 0.013115882873535156, 0.01363992691040039, 0.014163970947265625, 0.01468801498413086, 0.015212059020996094, 0.015736103057861328, 0.016260147094726562, 0.016784191131591797, 0.01730823516845703, 0.017832279205322266, 0.0183563232421875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 5.0, 3.0, 5.0, 14.0, 10.0, 10.0, 9.0, 25.0, 89.0, 184.0, 266.0, 184.0, 71.0, 18.0, 9.0, 11.0, 10.0, 11.0, 6.0, 5.0, 4.0, 2.0, 3.0, 5.0, 1.0, 4.0, 3.0, 6.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007389068603515625, -0.007132232189178467, -0.006875395774841309, -0.00661855936050415, -0.006361722946166992, -0.006104886531829834, -0.005848050117492676, -0.005591213703155518, -0.005334377288818359, -0.005077540874481201, -0.004820704460144043, -0.004563868045806885, -0.0043070316314697266, -0.004050195217132568, -0.00379335880279541, -0.003536522388458252, -0.0032796859741210938, -0.0030228495597839355, -0.0027660131454467773, -0.002509176731109619, -0.002252340316772461, -0.0019955039024353027, -0.0017386674880981445, -0.0014818310737609863, -0.0012249946594238281, -0.0009681582450866699, -0.0007113218307495117, -0.0004544854164123535, -0.0001976490020751953, 5.918741226196289e-05, 0.0003160238265991211, 0.0005728602409362793, 0.0008296966552734375, 0.0010865330696105957, 0.001343369483947754, 0.0016002058982849121, 0.0018570423126220703, 0.0021138787269592285, 0.0023707151412963867, 0.002627551555633545, 0.002884387969970703, 0.0031412243843078613, 0.0033980607986450195, 0.0036548972129821777, 0.003911733627319336, 0.004168570041656494, 0.004425406455993652, 0.0046822428703308105, 0.004939079284667969, 0.005195915699005127, 0.005452752113342285, 0.005709588527679443, 0.0059664249420166016, 0.00622326135635376, 0.006480097770690918, 0.006736934185028076, 0.006993770599365234, 0.007250607013702393, 0.007507443428039551, 0.007764279842376709, 0.008021116256713867, 0.008277952671051025, 0.008534789085388184, 0.008791625499725342, 0.0090484619140625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 7.0, 27.0, 97.0, 317.0, 678.0, 2795.0, 4186952.0, 2259.0, 639.0, 334.0, 108.0, 35.0, 11.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0201416015625, -0.019408464431762695, -0.01867532730102539, -0.017942190170288086, -0.01720905303955078, -0.016475915908813477, -0.015742778778076172, -0.015009641647338867, -0.014276504516601562, -0.013543367385864258, -0.012810230255126953, -0.012077093124389648, -0.011343955993652344, -0.010610818862915039, -0.009877681732177734, -0.00914454460144043, -0.008411407470703125, -0.00767827033996582, -0.006945133209228516, -0.006211996078491211, -0.005478858947753906, -0.0047457218170166016, -0.004012584686279297, -0.003279447555541992, -0.0025463104248046875, -0.0018131732940673828, -0.0010800361633300781, -0.00034689903259277344, 0.00038623809814453125, 0.001119375228881836, 0.0018525123596191406, 0.0025856494903564453, 0.00331878662109375, 0.004051923751831055, 0.004785060882568359, 0.005518198013305664, 0.006251335144042969, 0.0069844722747802734, 0.007717609405517578, 0.008450746536254883, 0.009183883666992188, 0.009917020797729492, 0.010650157928466797, 0.011383295059204102, 0.012116432189941406, 0.012849569320678711, 0.013582706451416016, 0.01431584358215332, 0.015048980712890625, 0.01578211784362793, 0.016515254974365234, 0.01724839210510254, 0.017981529235839844, 0.01871466636657715, 0.019447803497314453, 0.020180940628051758, 0.020914077758789062, 0.021647214889526367, 0.022380352020263672, 0.023113489151000977, 0.02384662628173828, 0.024579763412475586, 0.02531290054321289, 0.026046037673950195, 0.0267791748046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 16.0, 24.0, 351.0, 3635.0, 33.0, 11.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0094451904296875, -0.009190082550048828, -0.008934974670410156, -0.008679866790771484, -0.008424758911132812, -0.00816965103149414, -0.007914543151855469, -0.007659435272216797, -0.007404327392578125, -0.007149219512939453, -0.006894111633300781, -0.006639003753662109, -0.0063838958740234375, -0.006128787994384766, -0.005873680114746094, -0.005618572235107422, -0.00536346435546875, -0.005108356475830078, -0.004853248596191406, -0.004598140716552734, -0.0043430328369140625, -0.004087924957275391, -0.0038328170776367188, -0.003577709197998047, -0.003322601318359375, -0.003067493438720703, -0.0028123855590820312, -0.0025572776794433594, -0.0023021697998046875, -0.0020470619201660156, -0.0017919540405273438, -0.0015368461608886719, -0.00128173828125, -0.0010266304016113281, -0.0007715225219726562, -0.0005164146423339844, -0.0002613067626953125, -6.198883056640625e-06, 0.00024890899658203125, 0.0005040168762207031, 0.000759124755859375, 0.0010142326354980469, 0.0012693405151367188, 0.0015244483947753906, 0.0017795562744140625, 0.0020346641540527344, 0.0022897720336914062, 0.002544879913330078, 0.00279998779296875, 0.003055095672607422, 0.0033102035522460938, 0.0035653114318847656, 0.0038204193115234375, 0.004075527191162109, 0.004330635070800781, 0.004585742950439453, 0.004840850830078125, 0.005095958709716797, 0.005351066589355469, 0.005606174468994141, 0.0058612823486328125, 0.006116390228271484, 0.006371498107910156, 0.006626605987548828, 0.0068817138671875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 993.0, 14.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02370830811560154, -0.02196001075208187, -0.02021171525120735, -0.018463417887687683, -0.016715120524168015, -0.01496682409197092, -0.013218527659773827, -0.011470230296254158, -0.009721933864057064, -0.00797363743185997, -0.0062253400683403015, -0.0044770436361432076, -0.0027287467382848263, -0.000980449840426445, 0.000767846591770649, 0.0025161439552903175, 0.0042644403874874115, 0.006012737285345793, 0.007761034183204174, 0.009509330615401268, 0.011257627978920937, 0.01300592441111803, 0.014754220843315125, 0.016502518206834793, 0.01825081557035446, 0.01999911293387413, 0.02174740843474865, 0.023495705798268318, 0.025244003161787987, 0.026992298662662506, 0.028740596026182175, 0.030488893389701843, 0.03223719075322151, 0.03398548811674118, 0.03573378548026085, 0.03748208284378052, 0.03923037648200989, 0.040978673845529556, 0.042726971209049225, 0.04447526857256889, 0.04622356593608856, 0.04797186329960823, 0.0497201606631279, 0.05146845430135727, 0.05321675166487694, 0.054965049028396606, 0.056713346391916275, 0.058461643755435944, 0.060209937393665314, 0.06195823475718498, 0.06370653212070465, 0.06545482575893402, 0.06720312684774399, 0.06895142048597336, 0.07069972157478333, 0.0724480152130127, 0.07419631630182266, 0.07594460994005203, 0.077692911028862, 0.07944120466709137, 0.08118950575590134, 0.0829377993941307, 0.08468610048294067, 0.08643439412117004, 0.08818268775939941]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 12.0, 21.0, 24.0, 43.0, 38.0, 60.0, 80.0, 75.0, 86.0, 106.0, 109.0, 91.0, 67.0, 49.0, 39.0, 33.0, 24.0, 14.0, 5.0, 7.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01140064001083374, -0.011000651866197586, -0.010600663721561432, -0.010200675576925278, -0.009800687432289124, -0.00940069928765297, -0.009000711143016815, -0.008600722998380661, -0.008200734853744507, -0.007800746709108353, -0.0074007585644721985, -0.007000770419836044, -0.00660078227519989, -0.006200794130563736, -0.005800805985927582, -0.005400817841291428, -0.0050008296966552734, -0.004600841552019119, -0.004200853407382965, -0.003800865262746811, -0.0034008771181106567, -0.0030008889734745026, -0.0026009008288383484, -0.002200912684202194, -0.00180092453956604, -0.0014009363949298859, -0.0010009482502937317, -0.0006009601056575775, -0.00020097196102142334, 0.00019901618361473083, 0.000599004328250885, 0.0009989924728870392, 0.0013989806175231934, 0.0017989687621593475, 0.0021989569067955017, 0.002598945051431656, 0.00299893319606781, 0.0033989213407039642, 0.0037989094853401184, 0.004198897629976273, 0.004598885774612427, 0.004998873919248581, 0.005398862063884735, 0.005798850208520889, 0.0061988383531570435, 0.006598826497793198, 0.006998814642429352, 0.007398802787065506, 0.00779879093170166, 0.008198779076337814, 0.008598767220973969, 0.008998755365610123, 0.009398743510246277, 0.009798731654882431, 0.010198719799518585, 0.01059870794415474, 0.010998696088790894, 0.011398684233427048, 0.011798672378063202, 0.012198660522699356, 0.01259864866733551, 0.012998636811971664, 0.013398624956607819, 0.013798613101243973, 0.014198601245880127]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 8.0, 8.0, 6.0, 14.0, 18.0, 26.0, 33.0, 46.0, 89.0, 143.0, 269.0, 466.0, 864.0, 1899.0, 4055.0, 11287.0, 63361.0, 927677.0, 25599.0, 6909.0, 2770.0, 1331.0, 721.0, 359.0, 198.0, 130.0, 93.0, 59.0, 34.0, 27.0, 17.0, 7.0, 5.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0181427001953125, -0.017628788948059082, -0.017114877700805664, -0.016600966453552246, -0.016087055206298828, -0.01557314395904541, -0.015059232711791992, -0.014545321464538574, -0.014031410217285156, -0.013517498970031738, -0.01300358772277832, -0.012489676475524902, -0.011975765228271484, -0.011461853981018066, -0.010947942733764648, -0.01043403148651123, -0.009920120239257812, -0.009406208992004395, -0.008892297744750977, -0.008378386497497559, -0.00786447525024414, -0.007350564002990723, -0.006836652755737305, -0.006322741508483887, -0.005808830261230469, -0.005294919013977051, -0.004781007766723633, -0.004267096519470215, -0.003753185272216797, -0.003239274024963379, -0.002725362777709961, -0.002211451530456543, -0.001697540283203125, -0.001183629035949707, -0.0006697177886962891, -0.0001558065414428711, 0.0003581047058105469, 0.0008720159530639648, 0.0013859272003173828, 0.0018998384475708008, 0.0024137496948242188, 0.0029276609420776367, 0.0034415721893310547, 0.003955483436584473, 0.004469394683837891, 0.004983305931091309, 0.0054972171783447266, 0.0060111284255981445, 0.0065250396728515625, 0.0070389509201049805, 0.0075528621673583984, 0.008066773414611816, 0.008580684661865234, 0.009094595909118652, 0.00960850715637207, 0.010122418403625488, 0.010636329650878906, 0.011150240898132324, 0.011664152145385742, 0.01217806339263916, 0.012691974639892578, 0.013205885887145996, 0.013719797134399414, 0.014233708381652832, 0.01474761962890625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 6.0, 2.0, 6.0, 3.0, 5.0, 14.0, 10.0, 10.0, 9.0, 25.0, 88.0, 182.0, 265.0, 188.0, 69.0, 20.0, 9.0, 11.0, 10.0, 11.0, 6.0, 5.0, 4.0, 2.0, 3.0, 5.0, 1.0, 4.0, 4.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007396697998046875, -0.007139742374420166, -0.006882786750793457, -0.006625831127166748, -0.006368875503540039, -0.00611191987991333, -0.005854964256286621, -0.005598008632659912, -0.005341053009033203, -0.005084097385406494, -0.004827141761779785, -0.004570186138153076, -0.004313230514526367, -0.004056274890899658, -0.0037993192672729492, -0.0035423636436462402, -0.0032854080200195312, -0.0030284523963928223, -0.0027714967727661133, -0.0025145411491394043, -0.0022575855255126953, -0.0020006299018859863, -0.0017436742782592773, -0.0014867186546325684, -0.0012297630310058594, -0.0009728074073791504, -0.0007158517837524414, -0.0004588961601257324, -0.00020194053649902344, 5.501508712768555e-05, 0.00031197071075439453, 0.0005689263343811035, 0.0008258819580078125, 0.0010828375816345215, 0.0013397932052612305, 0.0015967488288879395, 0.0018537044525146484, 0.0021106600761413574, 0.0023676156997680664, 0.0026245713233947754, 0.0028815269470214844, 0.0031384825706481934, 0.0033954381942749023, 0.0036523938179016113, 0.00390934944152832, 0.004166305065155029, 0.004423260688781738, 0.004680216312408447, 0.004937171936035156, 0.005194127559661865, 0.005451083183288574, 0.005708038806915283, 0.005964994430541992, 0.006221950054168701, 0.00647890567779541, 0.006735861301422119, 0.006992816925048828, 0.007249772548675537, 0.007506728172302246, 0.007763683795928955, 0.008020639419555664, 0.008277595043182373, 0.008534550666809082, 0.008791506290435791, 0.0090484619140625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 8.0, 8.0, 2.0, 10.0, 11.0, 11.0, 13.0, 20.0, 25.0, 31.0, 26.0, 44.0, 45.0, 71.0, 91.0, 131.0, 190.0, 343.0, 767.0, 2016.0, 31238.0, 1004130.0, 6436.0, 1385.0, 563.0, 241.0, 190.0, 115.0, 89.0, 60.0, 52.0, 40.0, 25.0, 24.0, 19.0, 21.0, 9.0, 13.0, 11.0, 6.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0275421142578125, -0.026662826538085938, -0.025783538818359375, -0.024904251098632812, -0.02402496337890625, -0.023145675659179688, -0.022266387939453125, -0.021387100219726562, -0.0205078125, -0.019628524780273438, -0.018749237060546875, -0.017869949340820312, -0.01699066162109375, -0.016111373901367188, -0.015232086181640625, -0.014352798461914062, -0.0134735107421875, -0.012594223022460938, -0.011714935302734375, -0.010835647583007812, -0.00995635986328125, -0.009077072143554688, -0.008197784423828125, -0.0073184967041015625, -0.006439208984375, -0.0055599212646484375, -0.004680633544921875, -0.0038013458251953125, -0.00292205810546875, -0.0020427703857421875, -0.001163482666015625, -0.0002841949462890625, 0.0005950927734375, 0.0014743804931640625, 0.002353668212890625, 0.0032329559326171875, 0.00411224365234375, 0.0049915313720703125, 0.005870819091796875, 0.0067501068115234375, 0.00762939453125, 0.008508682250976562, 0.009387969970703125, 0.010267257690429688, 0.01114654541015625, 0.012025833129882812, 0.012905120849609375, 0.013784408569335938, 0.0146636962890625, 0.015542984008789062, 0.016422271728515625, 0.017301559448242188, 0.01818084716796875, 0.019060134887695312, 0.019939422607421875, 0.020818710327148438, 0.021697998046875, 0.022577285766601562, 0.023456573486328125, 0.024335861206054688, 0.02521514892578125, 0.026094436645507812, 0.026973724365234375, 0.027853012084960938, 0.0287322998046875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 8.0, 7.0, 2.0, 10.0, 11.0, 11.0, 12.0, 15.0, 22.0, 23.0, 20.0, 21.0, 23.0, 35.0, 28.0, 35.0, 38.0, 36.0, 39.0, 29.0, 55.0, 43.0, 39.0, 51.0, 31.0, 27.0, 44.0, 37.0, 35.0, 27.0, 30.0, 26.0, 21.0, 17.0, 16.0, 17.0, 7.0, 12.0, 11.0, 6.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.01953125, -0.01890707015991211, -0.01828289031982422, -0.017658710479736328, -0.017034530639648438, -0.016410350799560547, -0.015786170959472656, -0.015161991119384766, -0.014537811279296875, -0.013913631439208984, -0.013289451599121094, -0.012665271759033203, -0.012041091918945312, -0.011416912078857422, -0.010792732238769531, -0.01016855239868164, -0.00954437255859375, -0.00892019271850586, -0.008296012878417969, -0.007671833038330078, -0.0070476531982421875, -0.006423473358154297, -0.005799293518066406, -0.005175113677978516, -0.004550933837890625, -0.003926753997802734, -0.0033025741577148438, -0.002678394317626953, -0.0020542144775390625, -0.0014300346374511719, -0.0008058547973632812, -0.00018167495727539062, 0.0004425048828125, 0.0010666847229003906, 0.0016908645629882812, 0.002315044403076172, 0.0029392242431640625, 0.003563404083251953, 0.004187583923339844, 0.004811763763427734, 0.005435943603515625, 0.006060123443603516, 0.006684303283691406, 0.007308483123779297, 0.007932662963867188, 0.008556842803955078, 0.009181022644042969, 0.00980520248413086, 0.01042938232421875, 0.01105356216430664, 0.011677742004394531, 0.012301921844482422, 0.012926101684570312, 0.013550281524658203, 0.014174461364746094, 0.014798641204833984, 0.015422821044921875, 0.016047000885009766, 0.016671180725097656, 0.017295360565185547, 0.017919540405273438, 0.018543720245361328, 0.01916790008544922, 0.01979207992553711, 0.020416259765625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 6.0, 1.0, 7.0, 9.0, 18.0, 20.0, 18.0, 45.0, 45.0, 66.0, 185.0, 246.0, 851.0, 2367.0, 27037.0, 951864.0, 58576.0, 5323.0, 972.0, 451.0, 149.0, 104.0, 69.0, 37.0, 24.0, 10.0, 14.0, 15.0, 5.0, 5.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-1.0192394256591797e-05, -9.928829967975616e-06, -9.665265679359436e-06, -9.401701390743256e-06, -9.138137102127075e-06, -8.874572813510895e-06, -8.611008524894714e-06, -8.347444236278534e-06, -8.083879947662354e-06, -7.820315659046173e-06, -7.556751370429993e-06, -7.293187081813812e-06, -7.029622793197632e-06, -6.766058504581451e-06, -6.502494215965271e-06, -6.2389299273490906e-06, -5.97536563873291e-06, -5.71180135011673e-06, -5.448237061500549e-06, -5.184672772884369e-06, -4.9211084842681885e-06, -4.657544195652008e-06, -4.393979907035828e-06, -4.130415618419647e-06, -3.866851329803467e-06, -3.6032870411872864e-06, -3.339722752571106e-06, -3.0761584639549255e-06, -2.812594175338745e-06, -2.5490298867225647e-06, -2.2854655981063843e-06, -2.021901309490204e-06, -1.7583370208740234e-06, -1.494772732257843e-06, -1.2312084436416626e-06, -9.676441550254822e-07, -7.040798664093018e-07, -4.4051557779312134e-07, -1.7695128917694092e-07, 8.66129994392395e-08, 3.501772880554199e-07, 6.137415766716003e-07, 8.773058652877808e-07, 1.1408701539039612e-06, 1.4044344425201416e-06, 1.667998731136322e-06, 1.9315630197525024e-06, 2.195127308368683e-06, 2.4586915969848633e-06, 2.7222558856010437e-06, 2.985820174217224e-06, 3.2493844628334045e-06, 3.512948751449585e-06, 3.7765130400657654e-06, 4.040077328681946e-06, 4.303641617298126e-06, 4.567205905914307e-06, 4.830770194530487e-06, 5.0943344831466675e-06, 5.357898771762848e-06, 5.621463060379028e-06, 5.885027348995209e-06, 6.148591637611389e-06, 6.41215592622757e-06, 6.67572021484375e-06]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 6.0, 5.0, 14.0, 10.0, 13.0, 14.0, 21.0, 24.0, 55.0, 59.0, 83.0, 86.0, 204.0, 99.0, 77.0, 65.0, 62.0, 21.0, 15.0, 12.0, 12.0, 2.0, 5.0, 9.0, 7.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.450580596923828e-06, -7.257796823978424e-06, -7.06501305103302e-06, -6.872229278087616e-06, -6.679445505142212e-06, -6.486661732196808e-06, -6.293877959251404e-06, -6.101094186306e-06, -5.908310413360596e-06, -5.715526640415192e-06, -5.522742867469788e-06, -5.3299590945243835e-06, -5.1371753215789795e-06, -4.9443915486335754e-06, -4.751607775688171e-06, -4.558824002742767e-06, -4.366040229797363e-06, -4.173256456851959e-06, -3.980472683906555e-06, -3.787688910961151e-06, -3.594905138015747e-06, -3.402121365070343e-06, -3.209337592124939e-06, -3.016553819179535e-06, -2.823770046234131e-06, -2.630986273288727e-06, -2.4382025003433228e-06, -2.2454187273979187e-06, -2.0526349544525146e-06, -1.8598511815071106e-06, -1.6670674085617065e-06, -1.4742836356163025e-06, -1.2814998626708984e-06, -1.0887160897254944e-06, -8.959323167800903e-07, -7.031485438346863e-07, -5.103647708892822e-07, -3.175809979438782e-07, -1.2479722499847412e-07, 6.798654794692993e-08, 2.60770320892334e-07, 4.5355409383773804e-07, 6.463378667831421e-07, 8.391216397285461e-07, 1.0319054126739502e-06, 1.2246891856193542e-06, 1.4174729585647583e-06, 1.6102567315101624e-06, 1.8030405044555664e-06, 1.9958242774009705e-06, 2.1886080503463745e-06, 2.3813918232917786e-06, 2.5741755962371826e-06, 2.7669593691825867e-06, 2.9597431421279907e-06, 3.1525269150733948e-06, 3.345310688018799e-06, 3.538094460964203e-06, 3.730878233909607e-06, 3.923662006855011e-06, 4.116445779800415e-06, 4.309229552745819e-06, 4.502013325691223e-06, 4.694797098636627e-06, 4.887580871582031e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 6.0, 8.0, 14.0, 14.0, 22.0, 39.0, 66.0, 113.0, 194.0, 647.0, 23591.0, 1022085.0, 1133.0, 314.0, 126.0, 63.0, 32.0, 21.0, 20.0, 8.0, 7.0, 5.0, 2.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8298625946044922e-05, -1.7710961401462555e-05, -1.7123296856880188e-05, -1.653563231229782e-05, -1.5947967767715454e-05, -1.5360303223133087e-05, -1.477263867855072e-05, -1.4184974133968353e-05, -1.3597309589385986e-05, -1.300964504480362e-05, -1.2421980500221252e-05, -1.1834315955638885e-05, -1.1246651411056519e-05, -1.0658986866474152e-05, -1.0071322321891785e-05, -9.483657777309418e-06, -8.89599323272705e-06, -8.308328688144684e-06, -7.720664143562317e-06, -7.13299959897995e-06, -6.545335054397583e-06, -5.957670509815216e-06, -5.370005965232849e-06, -4.782341420650482e-06, -4.194676876068115e-06, -3.6070123314857483e-06, -3.0193477869033813e-06, -2.4316832423210144e-06, -1.8440186977386475e-06, -1.2563541531562805e-06, -6.686896085739136e-07, -8.102506399154663e-08, 5.066394805908203e-07, 1.0943040251731873e-06, 1.6819685697555542e-06, 2.269633114337921e-06, 2.857297658920288e-06, 3.444962203502655e-06, 4.032626748085022e-06, 4.620291292667389e-06, 5.207955837249756e-06, 5.795620381832123e-06, 6.38328492641449e-06, 6.970949470996857e-06, 7.558614015579224e-06, 8.14627856016159e-06, 8.733943104743958e-06, 9.321607649326324e-06, 9.909272193908691e-06, 1.0496936738491058e-05, 1.1084601283073425e-05, 1.1672265827655792e-05, 1.225993037223816e-05, 1.2847594916820526e-05, 1.3435259461402893e-05, 1.402292400598526e-05, 1.4610588550567627e-05, 1.5198253095149994e-05, 1.578591763973236e-05, 1.6373582184314728e-05, 1.6961246728897095e-05, 1.754891127347946e-05, 1.813657581806183e-05, 1.8724240362644196e-05, 1.9311904907226562e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 8.0, 10.0, 14.0, 21.0, 31.0, 28.0, 46.0, 72.0, 95.0, 386.0, 70.0, 71.0, 47.0, 34.0, 10.0, 13.0, 10.0, 3.0, 4.0, 2.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3053417205810547e-05, -1.2635253369808197e-05, -1.2217089533805847e-05, -1.1798925697803497e-05, -1.1380761861801147e-05, -1.0962598025798798e-05, -1.0544434189796448e-05, -1.0126270353794098e-05, -9.708106517791748e-06, -9.289942681789398e-06, -8.871778845787048e-06, -8.453615009784698e-06, -8.035451173782349e-06, -7.617287337779999e-06, -7.199123501777649e-06, -6.780959665775299e-06, -6.362795829772949e-06, -5.944631993770599e-06, -5.5264681577682495e-06, -5.1083043217659e-06, -4.69014048576355e-06, -4.2719766497612e-06, -3.85381281375885e-06, -3.4356489777565002e-06, -3.0174851417541504e-06, -2.5993213057518005e-06, -2.1811574697494507e-06, -1.7629936337471008e-06, -1.344829797744751e-06, -9.266659617424011e-07, -5.085021257400513e-07, -9.033828973770142e-08, 3.2782554626464844e-07, 7.459893822669983e-07, 1.1641532182693481e-06, 1.582317054271698e-06, 2.000480890274048e-06, 2.4186447262763977e-06, 2.8368085622787476e-06, 3.2549723982810974e-06, 3.6731362342834473e-06, 4.091300070285797e-06, 4.509463906288147e-06, 4.927627742290497e-06, 5.345791578292847e-06, 5.7639554142951965e-06, 6.182119250297546e-06, 6.600283086299896e-06, 7.018446922302246e-06, 7.436610758304596e-06, 7.854774594306946e-06, 8.272938430309296e-06, 8.691102266311646e-06, 9.109266102313995e-06, 9.527429938316345e-06, 9.945593774318695e-06, 1.0363757610321045e-05, 1.0781921446323395e-05, 1.1200085282325745e-05, 1.1618249118328094e-05, 1.2036412954330444e-05, 1.2454576790332794e-05, 1.2872740626335144e-05, 1.3290904462337494e-05, 1.3709068298339844e-05]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 40.0, 599.0, 346.0, 21.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10943986475467682, -0.10366286337375641, -0.0978858694434166, -0.09210887551307678, -0.08633187413215637, -0.08055487275123596, -0.07477787882089615, -0.06900088489055634, -0.06322388350963593, -0.057446885854005814, -0.0516698881983757, -0.04589289054274559, -0.04011589288711548, -0.03433889523148537, -0.028561897575855255, -0.022784899920225143, -0.017007902264595032, -0.01123090460896492, -0.005453906953334808, 0.00032309070229530334, 0.006100088357925415, 0.011877086013555527, 0.01765408366918564, 0.02343108132481575, 0.029208078980445862, 0.034985076636075974, 0.040762074291706085, 0.0465390719473362, 0.05231606960296631, 0.05809306725859642, 0.06387006491422653, 0.06964705884456635, 0.07542404532432556, 0.08120104670524597, 0.08697804063558578, 0.0927550345659256, 0.09853203594684601, 0.10430903732776642, 0.11008603125810623, 0.11586302518844604, 0.12164002656936646, 0.12741702795028687, 0.13319402933120728, 0.1389710158109665, 0.1447480171918869, 0.1505250185728073, 0.15630200505256653, 0.16207900643348694, 0.16785600781440735, 0.17363300919532776, 0.17941001057624817, 0.18518699705600739, 0.1909639984369278, 0.1967409998178482, 0.20251798629760742, 0.20829498767852783, 0.21407198905944824, 0.21984899044036865, 0.22562599182128906, 0.23140297830104828, 0.2371799796819687, 0.2429569810628891, 0.24873396754264832, 0.2545109689235687, 0.26028797030448914]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 5.0, 9.0, 8.0, 16.0, 7.0, 12.0, 14.0, 18.0, 16.0, 10.0, 21.0, 22.0, 26.0, 35.0, 37.0, 35.0, 36.0, 49.0, 47.0, 46.0, 50.0, 41.0, 38.0, 38.0, 56.0, 37.0, 35.0, 23.0, 29.0, 29.0, 38.0, 17.0, 28.0, 10.0, 13.0, 7.0, 10.0, 9.0, 7.0, 9.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11164200305938721, -0.10829945653676987, -0.10495691001415253, -0.10161437094211578, -0.09827182441949844, -0.0949292778968811, -0.09158673882484436, -0.08824419230222702, -0.08490164577960968, -0.08155909925699234, -0.078216552734375, -0.07487401366233826, -0.07153146713972092, -0.06818892061710358, -0.06484638154506683, -0.06150383502244949, -0.05816128849983215, -0.05481874197721481, -0.05147619917988777, -0.04813365638256073, -0.04479110985994339, -0.04144856333732605, -0.03810602053999901, -0.03476347774267197, -0.031420931220054626, -0.028078386560082436, -0.024735841900110245, -0.021393297240138054, -0.018050752580165863, -0.014708207920193672, -0.011365663260221481, -0.00802311860024929, -0.0046805739402771, -0.0013380292803049088, 0.002004515379667282, 0.005347060039639473, 0.008689604699611664, 0.012032149359583855, 0.015374694019556046, 0.018717238679528236, 0.022059783339500427, 0.025402327999472618, 0.02874487265944481, 0.03208741545677185, 0.03542996197938919, 0.03877250850200653, 0.04211505129933357, 0.045457594096660614, 0.048800140619277954, 0.052142687141895294, 0.055485229939222336, 0.05882777273654938, 0.06217031925916672, 0.06551286578178406, 0.0688554048538208, 0.07219795137643814, 0.07554049789905548, 0.07888304442167282, 0.08222559094429016, 0.0855681300163269, 0.08891067653894424, 0.09225322306156158, 0.09559576213359833, 0.09893830865621567, 0.10228085517883301]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 6.0, 2.0, 4.0, 2.0, 5.0, 4.0, 2.0, 4.0, 7.0, 12.0, 12.0, 11.0, 6.0, 22.0, 72.0, 195.0, 4193549.0, 181.0, 79.0, 21.0, 10.0, 9.0, 7.0, 16.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0014276504516601562, -0.001387074589729309, -0.001346498727798462, -0.0013059228658676147, -0.0012653470039367676, -0.0012247711420059204, -0.0011841952800750732, -0.001143619418144226, -0.001103043556213379, -0.0010624676942825317, -0.0010218918323516846, -0.0009813159704208374, -0.0009407401084899902, -0.0009001642465591431, -0.0008595883846282959, -0.0008190125226974487, -0.0007784366607666016, -0.0007378607988357544, -0.0006972849369049072, -0.0006567090749740601, -0.0006161332130432129, -0.0005755573511123657, -0.0005349814891815186, -0.0004944056272506714, -0.0004538297653198242, -0.00041325390338897705, -0.0003726780414581299, -0.0003321021795272827, -0.00029152631759643555, -0.0002509504556655884, -0.0002103745937347412, -0.00016979873180389404, -0.00012922286987304688, -8.864700794219971e-05, -4.807114601135254e-05, -7.495284080505371e-06, 3.30805778503418e-05, 7.365643978118896e-05, 0.00011423230171203613, 0.0001548081636428833, 0.00019538402557373047, 0.00023595988750457764, 0.0002765357494354248, 0.00031711161136627197, 0.00035768747329711914, 0.0003982633352279663, 0.0004388391971588135, 0.00047941505908966064, 0.0005199909210205078, 0.000560566782951355, 0.0006011426448822021, 0.0006417185068130493, 0.0006822943687438965, 0.0007228702306747437, 0.0007634460926055908, 0.000804021954536438, 0.0008445978164672852, 0.0008851736783981323, 0.0009257495403289795, 0.0009663254022598267, 0.0010069012641906738, 0.001047477126121521, 0.0010880529880523682, 0.0011286288499832153, 0.0011692047119140625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 1.0, 5.0, 15.0, 11.0, 6.0, 11.0, 17.0, 66.0, 153.0, 264.0, 210.0, 100.0, 24.0, 11.0, 9.0, 13.0, 8.0, 8.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007415771484375, -0.007160305976867676, -0.0069048404693603516, -0.006649374961853027, -0.006393909454345703, -0.006138443946838379, -0.005882978439331055, -0.0056275129318237305, -0.005372047424316406, -0.005116581916809082, -0.004861116409301758, -0.004605650901794434, -0.004350185394287109, -0.004094719886779785, -0.003839254379272461, -0.0035837888717651367, -0.0033283233642578125, -0.0030728578567504883, -0.002817392349243164, -0.00256192684173584, -0.0023064613342285156, -0.0020509958267211914, -0.0017955303192138672, -0.001540064811706543, -0.0012845993041992188, -0.0010291337966918945, -0.0007736682891845703, -0.0005182027816772461, -0.0002627372741699219, -7.271766662597656e-06, 0.00024819374084472656, 0.0005036592483520508, 0.000759124755859375, 0.0010145902633666992, 0.0012700557708740234, 0.0015255212783813477, 0.0017809867858886719, 0.002036452293395996, 0.0022919178009033203, 0.0025473833084106445, 0.0028028488159179688, 0.003058314323425293, 0.003313779830932617, 0.0035692453384399414, 0.0038247108459472656, 0.00408017635345459, 0.004335641860961914, 0.004591107368469238, 0.0048465728759765625, 0.005102038383483887, 0.005357503890991211, 0.005612969398498535, 0.005868434906005859, 0.006123900413513184, 0.006379365921020508, 0.006634831428527832, 0.006890296936035156, 0.0071457624435424805, 0.007401227951049805, 0.007656693458557129, 0.007912158966064453, 0.008167624473571777, 0.008423089981079102, 0.008678555488586426, 0.00893402099609375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 17.0, 29.0, 43.0, 69.0, 81.0, 104.0, 88.0, 4193366.0, 105.0, 116.0, 80.0, 85.0, 43.0, 31.0, 17.0, 11.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.375810623168945e-05, -9.08728688955307e-05, -8.798763155937195e-05, -8.51023942232132e-05, -8.221715688705444e-05, -7.933191955089569e-05, -7.644668221473694e-05, -7.356144487857819e-05, -7.067620754241943e-05, -6.779097020626068e-05, -6.490573287010193e-05, -6.202049553394318e-05, -5.9135258197784424e-05, -5.625002086162567e-05, -5.336478352546692e-05, -5.0479546189308167e-05, -4.7594308853149414e-05, -4.470907151699066e-05, -4.182383418083191e-05, -3.893859684467316e-05, -3.6053359508514404e-05, -3.316812217235565e-05, -3.02828848361969e-05, -2.7397647500038147e-05, -2.4512410163879395e-05, -2.1627172827720642e-05, -1.874193549156189e-05, -1.5856698155403137e-05, -1.2971460819244385e-05, -1.0086223483085632e-05, -7.20098614692688e-06, -4.3157488107681274e-06, -1.430511474609375e-06, 1.4547258615493774e-06, 4.33996319770813e-06, 7.225200533866882e-06, 1.0110437870025635e-05, 1.2995675206184387e-05, 1.588091254234314e-05, 1.8766149878501892e-05, 2.1651387214660645e-05, 2.4536624550819397e-05, 2.742186188697815e-05, 3.0307099223136902e-05, 3.3192336559295654e-05, 3.607757389545441e-05, 3.896281123161316e-05, 4.184804856777191e-05, 4.4733285903930664e-05, 4.7618523240089417e-05, 5.050376057624817e-05, 5.338899791240692e-05, 5.6274235248565674e-05, 5.9159472584724426e-05, 6.204470992088318e-05, 6.492994725704193e-05, 6.781518459320068e-05, 7.070042192935944e-05, 7.358565926551819e-05, 7.647089660167694e-05, 7.93561339378357e-05, 8.224137127399445e-05, 8.51266086101532e-05, 8.801184594631195e-05, 9.08970832824707e-05]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4095.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 4.0046870708465576e-07, 8.009374141693115e-07, 1.2014061212539673e-06, 1.601874828338623e-06, 2.002343535423279e-06, 2.4028122425079346e-06, 2.8032809495925903e-06, 3.203749656677246e-06, 3.604218363761902e-06, 4.004687070846558e-06, 4.405155777931213e-06, 4.805624485015869e-06, 5.206093192100525e-06, 5.606561899185181e-06, 6.0070306062698364e-06, 6.407499313354492e-06, 6.807968020439148e-06, 7.208436727523804e-06, 7.6089054346084595e-06, 8.009374141693115e-06, 8.409842848777771e-06, 8.810311555862427e-06, 9.210780262947083e-06, 9.611248970031738e-06, 1.0011717677116394e-05, 1.041218638420105e-05, 1.0812655091285706e-05, 1.1213123798370361e-05, 1.1613592505455017e-05, 1.2014061212539673e-05, 1.2414529919624329e-05, 1.2814998626708984e-05, 1.321546733379364e-05, 1.3615936040878296e-05, 1.4016404747962952e-05, 1.4416873455047607e-05, 1.4817342162132263e-05, 1.5217810869216919e-05, 1.5618279576301575e-05, 1.601874828338623e-05, 1.6419216990470886e-05, 1.6819685697555542e-05, 1.7220154404640198e-05, 1.7620623111724854e-05, 1.802109181880951e-05, 1.8421560525894165e-05, 1.882202923297882e-05, 1.9222497940063477e-05, 1.9622966647148132e-05, 2.0023435354232788e-05, 2.0423904061317444e-05, 2.08243727684021e-05, 2.1224841475486755e-05, 2.162531018257141e-05, 2.2025778889656067e-05, 2.2426247596740723e-05, 2.282671630382538e-05, 2.3227185010910034e-05, 2.362765371799469e-05, 2.4028122425079346e-05, 2.4428591132164e-05, 2.4829059839248657e-05, 2.5229528546333313e-05, 2.562999725341797e-05]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 39.0, 971.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014892354374751449, -0.00014188833301886916, -0.00013485312229022384, -0.0001278179115615785, -0.00012078269355697557, -0.00011374748282833025, -0.00010671226482372731, -9.967705409508198e-05, -9.264184336643666e-05, -8.560663263779134e-05, -7.857142190914601e-05, -7.153620390454307e-05, -6.450099317589775e-05, -5.746578244725242e-05, -5.043056808062829e-05, -4.339535371400416e-05, -3.6360142985358834e-05, -2.9324930437724106e-05, -2.2289717890089378e-05, -1.525450534245465e-05, -8.219292794819921e-06, -1.1840820661745965e-06, 5.851132300449535e-06, 1.2886346667073667e-05, 1.9921557395718992e-05, 2.695676994335372e-05, 3.399198249098845e-05, 4.102719685761258e-05, 4.8062407586257905e-05, 5.509761831490323e-05, 6.213283631950617e-05, 6.916804704815149e-05, 7.620325777679682e-05, 8.323846850544214e-05, 9.027367923408747e-05, 9.73088972386904e-05, 0.00010434410796733573, 0.00011137931869598106, 0.000118414536700584, 0.00012544974742922932, 0.00013248495815787464, 0.00013952016888651997, 0.0001465553796151653, 0.00015359059034381062, 0.00016062581562437117, 0.0001676610263530165, 0.00017469623708166182, 0.00018173144781030715, 0.00018876665853895247, 0.0001958018692675978, 0.00020283707999624312, 0.00020987229072488844, 0.00021690750145353377, 0.0002239427121821791, 0.00023097793746273965, 0.00023801314819138497, 0.0002450483734719455, 0.00025208358420059085, 0.0002591187949292362, 0.0002661540056578815, 0.0002731892163865268, 0.00028022442711517215, 0.00028725963784381747, 0.0002942948485724628, 0.0003013300593011081]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 8.0, 7.0, 10.0, 48.0, 28.0, 92.0, 227.0, 99.0, 127.0, 182.0, 60.0, 43.0, 51.0, 4.0, 11.0, 0.0, 2.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2351741790771484e-05, -2.1179206669330597e-05, -2.000667154788971e-05, -1.8834136426448822e-05, -1.7661601305007935e-05, -1.6489066183567047e-05, -1.531653106212616e-05, -1.4143995940685272e-05, -1.2971460819244385e-05, -1.1798925697803497e-05, -1.062639057636261e-05, -9.453855454921722e-06, -8.281320333480835e-06, -7.1087852120399475e-06, -5.93625009059906e-06, -4.763714969158173e-06, -3.591179847717285e-06, -2.4186447262763977e-06, -1.2461096048355103e-06, -7.35744833946228e-08, 1.0989606380462646e-06, 2.271495759487152e-06, 3.4440308809280396e-06, 4.616566002368927e-06, 5.7891011238098145e-06, 6.961636245250702e-06, 8.13417136669159e-06, 9.306706488132477e-06, 1.0479241609573364e-05, 1.1651776731014252e-05, 1.282431185245514e-05, 1.3996846973896027e-05, 1.5169382095336914e-05, 1.63419172167778e-05, 1.751445233821869e-05, 1.8686987459659576e-05, 1.9859522581100464e-05, 2.103205770254135e-05, 2.220459282398224e-05, 2.3377127945423126e-05, 2.4549663066864014e-05, 2.57221981883049e-05, 2.689473330974579e-05, 2.8067268431186676e-05, 2.9239803552627563e-05, 3.041233867406845e-05, 3.158487379550934e-05, 3.2757408916950226e-05, 3.392994403839111e-05, 3.5102479159832e-05, 3.627501428127289e-05, 3.7447549402713776e-05, 3.862008452415466e-05, 3.979261964559555e-05, 4.096515476703644e-05, 4.2137689888477325e-05, 4.331022500991821e-05, 4.44827601313591e-05, 4.565529525279999e-05, 4.6827830374240875e-05, 4.800036549568176e-05, 4.917290061712265e-05, 5.034543573856354e-05, 5.1517970860004425e-05, 5.269050598144531e-05]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 10.0, 5.0, 10.0, 8.0, 16.0, 17.0, 22.0, 25.0, 38.0, 49.0, 66.0, 80.0, 136.0, 205.0, 344.0, 504.0, 840.0, 1540.0, 3387.0, 9820.0, 64883.0, 933796.0, 21672.0, 5688.0, 2219.0, 1169.0, 684.0, 440.0, 278.0, 178.0, 114.0, 84.0, 59.0, 41.0, 31.0, 20.0, 19.0, 14.0, 11.0, 10.0, 5.0, 8.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.020721435546875, -0.020058870315551758, -0.019396305084228516, -0.018733739852905273, -0.01807117462158203, -0.01740860939025879, -0.016746044158935547, -0.016083478927612305, -0.015420913696289062, -0.01475834846496582, -0.014095783233642578, -0.013433218002319336, -0.012770652770996094, -0.012108087539672852, -0.01144552230834961, -0.010782957077026367, -0.010120391845703125, -0.009457826614379883, -0.00879526138305664, -0.008132696151733398, -0.007470130920410156, -0.006807565689086914, -0.006145000457763672, -0.00548243522644043, -0.0048198699951171875, -0.004157304763793945, -0.003494739532470703, -0.002832174301147461, -0.0021696090698242188, -0.0015070438385009766, -0.0008444786071777344, -0.0001819133758544922, 0.00048065185546875, 0.0011432170867919922, 0.0018057823181152344, 0.0024683475494384766, 0.0031309127807617188, 0.003793478012084961, 0.004456043243408203, 0.005118608474731445, 0.0057811737060546875, 0.00644373893737793, 0.007106304168701172, 0.007768869400024414, 0.008431434631347656, 0.009093999862670898, 0.00975656509399414, 0.010419130325317383, 0.011081695556640625, 0.011744260787963867, 0.01240682601928711, 0.013069391250610352, 0.013731956481933594, 0.014394521713256836, 0.015057086944580078, 0.01571965217590332, 0.016382217407226562, 0.017044782638549805, 0.017707347869873047, 0.01836991310119629, 0.01903247833251953, 0.019695043563842773, 0.020357608795166016, 0.021020174026489258, 0.0216827392578125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 1.0, 5.0, 15.0, 11.0, 6.0, 11.0, 17.0, 66.0, 153.0, 263.0, 211.0, 100.0, 24.0, 11.0, 9.0, 13.0, 8.0, 8.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007415771484375, -0.007160305976867676, -0.0069048404693603516, -0.006649374961853027, -0.006393909454345703, -0.006138443946838379, -0.005882978439331055, -0.0056275129318237305, -0.005372047424316406, -0.005116581916809082, -0.004861116409301758, -0.004605650901794434, -0.004350185394287109, -0.004094719886779785, -0.003839254379272461, -0.0035837888717651367, -0.0033283233642578125, -0.0030728578567504883, -0.002817392349243164, -0.00256192684173584, -0.0023064613342285156, -0.0020509958267211914, -0.0017955303192138672, -0.001540064811706543, -0.0012845993041992188, -0.0010291337966918945, -0.0007736682891845703, -0.0005182027816772461, -0.0002627372741699219, -7.271766662597656e-06, 0.00024819374084472656, 0.0005036592483520508, 0.000759124755859375, 0.0010145902633666992, 0.0012700557708740234, 0.0015255212783813477, 0.0017809867858886719, 0.002036452293395996, 0.0022919178009033203, 0.0025473833084106445, 0.0028028488159179688, 0.003058314323425293, 0.003313779830932617, 0.0035692453384399414, 0.0038247108459472656, 0.00408017635345459, 0.004335641860961914, 0.004591107368469238, 0.0048465728759765625, 0.005102038383483887, 0.005357503890991211, 0.005612969398498535, 0.005868434906005859, 0.006123900413513184, 0.006379365921020508, 0.006634831428527832, 0.006890296936035156, 0.0071457624435424805, 0.007401227951049805, 0.007656693458557129, 0.007912158966064453, 0.008167624473571777, 0.008423089981079102, 0.008678555488586426, 0.00893402099609375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 5.0, 3.0, 13.0, 11.0, 10.0, 11.0, 11.0, 24.0, 23.0, 31.0, 34.0, 52.0, 71.0, 83.0, 109.0, 151.0, 212.0, 352.0, 686.0, 1449.0, 8627.0, 1021664.0, 11448.0, 1540.0, 689.0, 377.0, 219.0, 139.0, 127.0, 81.0, 64.0, 46.0, 43.0, 32.0, 18.0, 25.0, 12.0, 12.0, 13.0, 4.0, 8.0, 5.0, 4.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.0306854248046875, -0.029796838760375977, -0.028908252716064453, -0.02801966667175293, -0.027131080627441406, -0.026242494583129883, -0.02535390853881836, -0.024465322494506836, -0.023576736450195312, -0.02268815040588379, -0.021799564361572266, -0.020910978317260742, -0.02002239227294922, -0.019133806228637695, -0.018245220184326172, -0.01735663414001465, -0.016468048095703125, -0.015579462051391602, -0.014690876007080078, -0.013802289962768555, -0.012913703918457031, -0.012025117874145508, -0.011136531829833984, -0.010247945785522461, -0.009359359741210938, -0.008470773696899414, -0.007582187652587891, -0.006693601608276367, -0.005805015563964844, -0.00491642951965332, -0.004027843475341797, -0.0031392574310302734, -0.00225067138671875, -0.0013620853424072266, -0.0004734992980957031, 0.0004150867462158203, 0.0013036727905273438, 0.002192258834838867, 0.0030808448791503906, 0.003969430923461914, 0.0048580169677734375, 0.005746603012084961, 0.006635189056396484, 0.007523775100708008, 0.008412361145019531, 0.009300947189331055, 0.010189533233642578, 0.011078119277954102, 0.011966705322265625, 0.012855291366577148, 0.013743877410888672, 0.014632463455200195, 0.015521049499511719, 0.016409635543823242, 0.017298221588134766, 0.01818680763244629, 0.019075393676757812, 0.019963979721069336, 0.02085256576538086, 0.021741151809692383, 0.022629737854003906, 0.02351832389831543, 0.024406909942626953, 0.025295495986938477, 0.02618408203125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 12.0, 12.0, 10.0, 10.0, 7.0, 20.0, 16.0, 17.0, 22.0, 29.0, 27.0, 29.0, 29.0, 35.0, 38.0, 45.0, 47.0, 42.0, 37.0, 31.0, 38.0, 44.0, 38.0, 30.0, 40.0, 28.0, 35.0, 34.0, 26.0, 18.0, 25.0, 20.0, 12.0, 18.0, 13.0, 12.0, 12.0, 3.0, 8.0, 5.0, 4.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.02099609375, -0.020388364791870117, -0.019780635833740234, -0.01917290687561035, -0.01856517791748047, -0.017957448959350586, -0.017349720001220703, -0.01674199104309082, -0.016134262084960938, -0.015526533126831055, -0.014918804168701172, -0.014311075210571289, -0.013703346252441406, -0.013095617294311523, -0.01248788833618164, -0.011880159378051758, -0.011272430419921875, -0.010664701461791992, -0.01005697250366211, -0.009449243545532227, -0.008841514587402344, -0.008233785629272461, -0.007626056671142578, -0.007018327713012695, -0.0064105987548828125, -0.00580286979675293, -0.005195140838623047, -0.004587411880493164, -0.003979682922363281, -0.0033719539642333984, -0.0027642250061035156, -0.002156496047973633, -0.00154876708984375, -0.0009410381317138672, -0.0003333091735839844, 0.00027441978454589844, 0.0008821487426757812, 0.001489877700805664, 0.002097606658935547, 0.0027053356170654297, 0.0033130645751953125, 0.003920793533325195, 0.004528522491455078, 0.005136251449584961, 0.005743980407714844, 0.0063517093658447266, 0.006959438323974609, 0.007567167282104492, 0.008174896240234375, 0.008782625198364258, 0.00939035415649414, 0.009998083114624023, 0.010605812072753906, 0.011213541030883789, 0.011821269989013672, 0.012428998947143555, 0.013036727905273438, 0.01364445686340332, 0.014252185821533203, 0.014859914779663086, 0.015467643737792969, 0.01607537269592285, 0.016683101654052734, 0.017290830612182617, 0.0178985595703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 1.0, 7.0, 7.0, 8.0, 8.0, 6.0, 20.0, 20.0, 24.0, 57.0, 99.0, 135.0, 329.0, 930.0, 9798.0, 976438.0, 56504.0, 3079.0, 566.0, 215.0, 98.0, 67.0, 44.0, 25.0, 17.0, 18.0, 5.0, 6.0, 5.0, 1.0, 8.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.1861324310302734e-05, -1.1487863957881927e-05, -1.111440360546112e-05, -1.0740943253040314e-05, -1.0367482900619507e-05, -9.9940225481987e-06, -9.620562195777893e-06, -9.247101843357086e-06, -8.87364149093628e-06, -8.500181138515472e-06, -8.126720786094666e-06, -7.753260433673859e-06, -7.379800081253052e-06, -7.006339728832245e-06, -6.632879376411438e-06, -6.259419023990631e-06, -5.885958671569824e-06, -5.512498319149017e-06, -5.1390379667282104e-06, -4.7655776143074036e-06, -4.392117261886597e-06, -4.01865690946579e-06, -3.645196557044983e-06, -3.271736204624176e-06, -2.898275852203369e-06, -2.5248154997825623e-06, -2.1513551473617554e-06, -1.7778947949409485e-06, -1.4044344425201416e-06, -1.0309740900993347e-06, -6.575137376785278e-07, -2.8405338525772095e-07, 8.940696716308594e-08, 4.628673195838928e-07, 8.363276720046997e-07, 1.2097880244255066e-06, 1.5832483768463135e-06, 1.9567087292671204e-06, 2.3301690816879272e-06, 2.703629434108734e-06, 3.077089786529541e-06, 3.450550138950348e-06, 3.824010491371155e-06, 4.197470843791962e-06, 4.5709311962127686e-06, 4.9443915486335754e-06, 5.317851901054382e-06, 5.691312253475189e-06, 6.064772605895996e-06, 6.438232958316803e-06, 6.81169331073761e-06, 7.185153663158417e-06, 7.558614015579224e-06, 7.93207436800003e-06, 8.305534720420837e-06, 8.678995072841644e-06, 9.052455425262451e-06, 9.425915777683258e-06, 9.799376130104065e-06, 1.0172836482524872e-05, 1.0546296834945679e-05, 1.0919757187366486e-05, 1.1293217539787292e-05, 1.16666778922081e-05, 1.2040138244628906e-05]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 6.0, 8.0, 3.0, 4.0, 3.0, 7.0, 10.0, 19.0, 16.0, 40.0, 42.0, 52.0, 86.0, 80.0, 143.0, 104.0, 102.0, 75.0, 53.0, 37.0, 26.0, 23.0, 20.0, 13.0, 7.0, 5.0, 3.0, 3.0, 3.0, 6.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.331371307373047e-06, -7.101334631443024e-06, -6.8712979555130005e-06, -6.641261279582977e-06, -6.411224603652954e-06, -6.181187927722931e-06, -5.951151251792908e-06, -5.7211145758628845e-06, -5.491077899932861e-06, -5.261041224002838e-06, -5.031004548072815e-06, -4.800967872142792e-06, -4.5709311962127686e-06, -4.340894520282745e-06, -4.110857844352722e-06, -3.880821168422699e-06, -3.6507844924926758e-06, -3.4207478165626526e-06, -3.1907111406326294e-06, -2.960674464702606e-06, -2.730637788772583e-06, -2.50060111284256e-06, -2.2705644369125366e-06, -2.0405277609825134e-06, -1.8104910850524902e-06, -1.580454409122467e-06, -1.3504177331924438e-06, -1.1203810572624207e-06, -8.903443813323975e-07, -6.603077054023743e-07, -4.302710294723511e-07, -2.0023435354232788e-07, 2.9802322387695312e-08, 2.598389983177185e-07, 4.898756742477417e-07, 7.199123501777649e-07, 9.499490261077881e-07, 1.1799857020378113e-06, 1.4100223779678345e-06, 1.6400590538978577e-06, 1.8700957298278809e-06, 2.100132405757904e-06, 2.3301690816879272e-06, 2.5602057576179504e-06, 2.7902424335479736e-06, 3.020279109477997e-06, 3.25031578540802e-06, 3.4803524613380432e-06, 3.7103891372680664e-06, 3.94042581319809e-06, 4.170462489128113e-06, 4.400499165058136e-06, 4.630535840988159e-06, 4.860572516918182e-06, 5.0906091928482056e-06, 5.320645868778229e-06, 5.550682544708252e-06, 5.780719220638275e-06, 6.010755896568298e-06, 6.2407925724983215e-06, 6.470829248428345e-06, 6.700865924358368e-06, 6.930902600288391e-06, 7.160939276218414e-06, 7.3909759521484375e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 7.0, 11.0, 8.0, 11.0, 7.0, 23.0, 40.0, 55.0, 86.0, 191.0, 538.0, 5902.0, 1039334.0, 1630.0, 321.0, 156.0, 92.0, 41.0, 34.0, 17.0, 15.0, 7.0, 4.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4020671844482422e-05, -2.317223697900772e-05, -2.232380211353302e-05, -2.147536724805832e-05, -2.0626932382583618e-05, -1.9778497517108917e-05, -1.8930062651634216e-05, -1.8081627786159515e-05, -1.7233192920684814e-05, -1.6384758055210114e-05, -1.5536323189735413e-05, -1.4687888324260712e-05, -1.383945345878601e-05, -1.299101859331131e-05, -1.2142583727836609e-05, -1.1294148862361908e-05, -1.0445713996887207e-05, -9.597279131412506e-06, -8.748844265937805e-06, -7.900409400463104e-06, -7.051974534988403e-06, -6.203539669513702e-06, -5.3551048040390015e-06, -4.5066699385643005e-06, -3.6582350730895996e-06, -2.8098002076148987e-06, -1.9613653421401978e-06, -1.1129304766654968e-06, -2.644956111907959e-07, 5.83939254283905e-07, 1.432374119758606e-06, 2.280808985233307e-06, 3.129243850708008e-06, 3.977678716182709e-06, 4.82611358165741e-06, 5.674548447132111e-06, 6.5229833126068115e-06, 7.3714181780815125e-06, 8.219853043556213e-06, 9.068287909030914e-06, 9.916722774505615e-06, 1.0765157639980316e-05, 1.1613592505455017e-05, 1.2462027370929718e-05, 1.3310462236404419e-05, 1.415889710187912e-05, 1.500733196735382e-05, 1.5855766832828522e-05, 1.6704201698303223e-05, 1.7552636563777924e-05, 1.8401071429252625e-05, 1.9249506294727325e-05, 2.0097941160202026e-05, 2.0946376025676727e-05, 2.1794810891151428e-05, 2.264324575662613e-05, 2.349168062210083e-05, 2.434011548757553e-05, 2.5188550353050232e-05, 2.6036985218524933e-05, 2.6885420083999634e-05, 2.7733854949474335e-05, 2.8582289814949036e-05, 2.9430724680423737e-05, 3.0279159545898438e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 10.0, 4.0, 6.0, 5.0, 13.0, 17.0, 22.0, 22.0, 39.0, 70.0, 83.0, 414.0, 94.0, 58.0, 44.0, 28.0, 15.0, 17.0, 12.0, 8.0, 6.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6391277313232422e-05, -1.5811994671821594e-05, -1.5232712030410767e-05, -1.4653429388999939e-05, -1.4074146747589111e-05, -1.3494864106178284e-05, -1.2915581464767456e-05, -1.2336298823356628e-05, -1.17570161819458e-05, -1.1177733540534973e-05, -1.0598450899124146e-05, -1.0019168257713318e-05, -9.43988561630249e-06, -8.860602974891663e-06, -8.281320333480835e-06, -7.702037692070007e-06, -7.12275505065918e-06, -6.543472409248352e-06, -5.964189767837524e-06, -5.384907126426697e-06, -4.805624485015869e-06, -4.2263418436050415e-06, -3.647059202194214e-06, -3.0677765607833862e-06, -2.4884939193725586e-06, -1.909211277961731e-06, -1.3299286365509033e-06, -7.506459951400757e-07, -1.7136335372924805e-07, 4.079192876815796e-07, 9.872019290924072e-07, 1.5664845705032349e-06, 2.1457672119140625e-06, 2.72504985332489e-06, 3.3043324947357178e-06, 3.883615136146545e-06, 4.462897777557373e-06, 5.042180418968201e-06, 5.621463060379028e-06, 6.200745701789856e-06, 6.780028343200684e-06, 7.359310984611511e-06, 7.938593626022339e-06, 8.517876267433167e-06, 9.097158908843994e-06, 9.676441550254822e-06, 1.025572419166565e-05, 1.0835006833076477e-05, 1.1414289474487305e-05, 1.1993572115898132e-05, 1.257285475730896e-05, 1.3152137398719788e-05, 1.3731420040130615e-05, 1.4310702681541443e-05, 1.488998532295227e-05, 1.5469267964363098e-05, 1.6048550605773926e-05, 1.6627833247184753e-05, 1.720711588859558e-05, 1.778639853000641e-05, 1.8365681171417236e-05, 1.8944963812828064e-05, 1.952424645423889e-05, 2.010352909564972e-05, 2.0682811737060547e-05]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 82.0, 928.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39565974473953247, -0.3821330964565277, -0.36860647797584534, -0.3550798296928406, -0.3415532112121582, -0.32802656292915344, -0.3144999146461487, -0.3009732961654663, -0.28744664788246155, -0.2739199995994568, -0.2603933811187744, -0.24686673283576965, -0.2333400994539261, -0.21981346607208252, -0.20628683269023895, -0.19276019930839539, -0.17923356592655182, -0.16570693254470825, -0.15218029916286469, -0.13865366578102112, -0.12512701749801636, -0.11160038411617279, -0.09807375073432922, -0.08454710990190506, -0.07102047652006149, -0.05749383941292763, -0.04396720230579376, -0.030440568923950195, -0.01691393181681633, -0.0033872947096824646, 0.010139338672161102, 0.023665979504585266, 0.03719261288642883, 0.0507192499935627, 0.06424588710069656, 0.07777252048254013, 0.0912991613149643, 0.10482579469680786, 0.11835242807865143, 0.131879061460495, 0.14540570974349976, 0.15893234312534332, 0.1724589765071869, 0.18598562479019165, 0.19951225817203522, 0.21303889155387878, 0.22656552493572235, 0.24009215831756592, 0.2536187767982483, 0.26714542508125305, 0.2806720435619354, 0.2941986918449402, 0.30772531032562256, 0.3212519586086273, 0.3347786068916321, 0.34830522537231445, 0.3618318736553192, 0.375358521938324, 0.38888514041900635, 0.4024117887020111, 0.4159384071826935, 0.42946505546569824, 0.4429916739463806, 0.4565183222293854, 0.47004497051239014]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 7.0, 8.0, 7.0, 8.0, 8.0, 16.0, 13.0, 22.0, 16.0, 21.0, 19.0, 34.0, 36.0, 31.0, 40.0, 51.0, 36.0, 45.0, 41.0, 68.0, 49.0, 43.0, 40.0, 40.0, 37.0, 30.0, 23.0, 32.0, 24.0, 29.0, 21.0, 13.0, 12.0, 16.0, 13.0, 4.0, 11.0, 11.0, 3.0, 11.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.09758031368255615, -0.09430770576000214, -0.09103509783744812, -0.0877624899148941, -0.08448988199234009, -0.08121727406978607, -0.07794466614723206, -0.07467205822467804, -0.07139945030212402, -0.06812684237957001, -0.06485423445701599, -0.061581626534461975, -0.05830901861190796, -0.05503641068935394, -0.05176380276679993, -0.04849119484424591, -0.045218586921691895, -0.04194597899913788, -0.03867337107658386, -0.035400763154029846, -0.03212815523147583, -0.028855547308921814, -0.025582939386367798, -0.022310331463813782, -0.019037723541259766, -0.01576511561870575, -0.012492507696151733, -0.009219899773597717, -0.005947291851043701, -0.002674683928489685, 0.0005979239940643311, 0.003870531916618347, 0.007143139839172363, 0.01041574776172638, 0.013688355684280396, 0.01696096360683441, 0.020233571529388428, 0.023506179451942444, 0.02677878737449646, 0.030051395297050476, 0.03332400321960449, 0.03659661114215851, 0.039869219064712524, 0.04314182698726654, 0.04641443490982056, 0.04968704283237457, 0.05295965075492859, 0.056232258677482605, 0.05950486660003662, 0.06277747452259064, 0.06605008244514465, 0.06932269036769867, 0.07259529829025269, 0.0758679062128067, 0.07914051413536072, 0.08241312205791473, 0.08568572998046875, 0.08895833790302277, 0.09223094582557678, 0.0955035537481308, 0.09877616167068481, 0.10204876959323883, 0.10532137751579285, 0.10859398543834686, 0.11186659336090088]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 3.0, 1.0, 12.0, 9.0, 5.0, 4.0, 8.0, 8.0, 6.0, 8.0, 14.0, 11.0, 24.0, 21.0, 22.0, 23.0, 65.0, 225.0, 4192602.0, 610.0, 276.0, 112.0, 35.0, 16.0, 19.0, 22.0, 25.0, 10.0, 5.0, 7.0, 6.0, 10.0, 2.0, 4.0, 2.0, 4.0, 6.0, 2.0, 6.0, 0.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0], "bins": [-0.0014333724975585938, -0.0013922303915023804, -0.001351088285446167, -0.0013099461793899536, -0.0012688040733337402, -0.0012276619672775269, -0.0011865198612213135, -0.0011453777551651, -0.0011042356491088867, -0.0010630935430526733, -0.00102195143699646, -0.0009808093309402466, -0.0009396672248840332, -0.0008985251188278198, -0.0008573830127716064, -0.0008162409067153931, -0.0007750988006591797, -0.0007339566946029663, -0.0006928145885467529, -0.0006516724824905396, -0.0006105303764343262, -0.0005693882703781128, -0.0005282461643218994, -0.00048710405826568604, -0.00044596195220947266, -0.0004048198461532593, -0.0003636777400970459, -0.0003225356340408325, -0.00028139352798461914, -0.00024025142192840576, -0.00019910931587219238, -0.000157967209815979, -0.00011682510375976562, -7.568299770355225e-05, -3.454089164733887e-05, 6.601214408874512e-06, 4.774332046508789e-05, 8.888542652130127e-05, 0.00013002753257751465, 0.00017116963863372803, 0.0002123117446899414, 0.0002534538507461548, 0.00029459595680236816, 0.00033573806285858154, 0.0003768801689147949, 0.0004180222749710083, 0.0004591643810272217, 0.0005003064870834351, 0.0005414485931396484, 0.0005825906991958618, 0.0006237328052520752, 0.0006648749113082886, 0.000706017017364502, 0.0007471591234207153, 0.0007883012294769287, 0.0008294433355331421, 0.0008705854415893555, 0.0009117275476455688, 0.0009528696537017822, 0.0009940117597579956, 0.001035153865814209, 0.0010762959718704224, 0.0011174380779266357, 0.0011585801839828491, 0.0011997222900390625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 13.0, 11.0, 9.0, 9.0, 16.0, 57.0, 136.0, 257.0, 229.0, 109.0, 29.0, 12.0, 9.0, 12.0, 11.0, 7.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 7.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007161378860473633, -0.006906986236572266, -0.0066525936126708984, -0.006398200988769531, -0.006143808364868164, -0.005889415740966797, -0.00563502311706543, -0.0053806304931640625, -0.005126237869262695, -0.004871845245361328, -0.004617452621459961, -0.004363059997558594, -0.0041086673736572266, -0.0038542747497558594, -0.003599882125854492, -0.003345489501953125, -0.003091096878051758, -0.0028367042541503906, -0.0025823116302490234, -0.0023279190063476562, -0.002073526382446289, -0.0018191337585449219, -0.0015647411346435547, -0.0013103485107421875, -0.0010559558868408203, -0.0008015632629394531, -0.0005471706390380859, -0.00029277801513671875, -3.838539123535156e-05, 0.00021600723266601562, 0.0004703998565673828, 0.00072479248046875, 0.0009791851043701172, 0.0012335777282714844, 0.0014879703521728516, 0.0017423629760742188, 0.001996755599975586, 0.002251148223876953, 0.0025055408477783203, 0.0027599334716796875, 0.0030143260955810547, 0.003268718719482422, 0.003523111343383789, 0.0037775039672851562, 0.0040318965911865234, 0.004286289215087891, 0.004540681838989258, 0.004795074462890625, 0.005049467086791992, 0.005303859710693359, 0.0055582523345947266, 0.005812644958496094, 0.006067037582397461, 0.006321430206298828, 0.006575822830200195, 0.0068302154541015625, 0.00708460807800293, 0.007339000701904297, 0.007593393325805664, 0.007847785949707031, 0.008102178573608398, 0.008356571197509766, 0.008610963821411133, 0.0088653564453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 12.0, 35.0, 56.0, 82.0, 77.0, 170.0, 4191054.0, 2308.0, 143.0, 126.0, 103.0, 69.0, 23.0, 13.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004024505615234375, -0.0003880411386489868, -0.00037363171577453613, -0.00035922229290008545, -0.00034481287002563477, -0.0003304034471511841, -0.0003159940242767334, -0.0003015846014022827, -0.00028717517852783203, -0.00027276575565338135, -0.00025835633277893066, -0.00024394690990447998, -0.0002295374870300293, -0.0002151280641555786, -0.00020071864128112793, -0.00018630921840667725, -0.00017189979553222656, -0.00015749037265777588, -0.0001430809497833252, -0.0001286715269088745, -0.00011426210403442383, -9.985268115997314e-05, -8.544325828552246e-05, -7.103383541107178e-05, -5.6624412536621094e-05, -4.221498966217041e-05, -2.7805566787719727e-05, -1.3396143913269043e-05, 1.0132789611816406e-06, 1.5422701835632324e-05, 2.9832124710083008e-05, 4.424154758453369e-05, 5.8650970458984375e-05, 7.306039333343506e-05, 8.746981620788574e-05, 0.00010187923908233643, 0.00011628866195678711, 0.0001306980848312378, 0.00014510750770568848, 0.00015951693058013916, 0.00017392635345458984, 0.00018833577632904053, 0.0002027451992034912, 0.0002171546220779419, 0.00023156404495239258, 0.00024597346782684326, 0.00026038289070129395, 0.00027479231357574463, 0.0002892017364501953, 0.000303611159324646, 0.0003180205821990967, 0.00033243000507354736, 0.00034683942794799805, 0.00036124885082244873, 0.0003756582736968994, 0.0003900676965713501, 0.0004044771194458008, 0.00041888654232025146, 0.00043329596519470215, 0.00044770538806915283, 0.0004621148109436035, 0.0004765242338180542, 0.0004909336566925049, 0.0005053430795669556, 0.0005197525024414062]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4088.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014591217041015625, -0.00014322157949209213, -0.00014053098857402802, -0.0001378403976559639, -0.00013514980673789978, -0.00013245921581983566, -0.00012976862490177155, -0.00012707803398370743, -0.0001243874430656433, -0.00012169685214757919, -0.00011900626122951508, -0.00011631567031145096, -0.00011362507939338684, -0.00011093448847532272, -0.0001082438975572586, -0.00010555330663919449, -0.00010286271572113037, -0.00010017212480306625, -9.748153388500214e-05, -9.479094296693802e-05, -9.21003520488739e-05, -8.940976113080978e-05, -8.671917021274567e-05, -8.402857929468155e-05, -8.133798837661743e-05, -7.864739745855331e-05, -7.59568065404892e-05, -7.326621562242508e-05, -7.057562470436096e-05, -6.788503378629684e-05, -6.519444286823273e-05, -6.250385195016861e-05, -5.981326103210449e-05, -5.7122670114040375e-05, -5.443207919597626e-05, -5.174148827791214e-05, -4.905089735984802e-05, -4.6360306441783905e-05, -4.366971552371979e-05, -4.097912460565567e-05, -3.828853368759155e-05, -3.5597942769527435e-05, -3.290735185146332e-05, -3.02167609333992e-05, -2.7526170015335083e-05, -2.4835579097270966e-05, -2.2144988179206848e-05, -1.945439726114273e-05, -1.6763806343078613e-05, -1.4073215425014496e-05, -1.1382624506950378e-05, -8.692033588886261e-06, -6.0014426708221436e-06, -3.310851752758026e-06, -6.202608346939087e-07, 2.0703300833702087e-06, 4.760921001434326e-06, 7.451511919498444e-06, 1.0142102837562561e-05, 1.2832693755626678e-05, 1.5523284673690796e-05, 1.8213875591754913e-05, 2.090446650981903e-05, 2.3595057427883148e-05, 2.6285648345947266e-05]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 10.0, 864.0, 135.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002853727783076465, -0.0002710241242311895, -0.00025667547015473247, -0.00024232680152636021, -0.00022797813289798796, -0.00021362947882153094, -0.00019928082474507391, -0.0001849321706686169, -0.00017058350204024464, -0.00015623484796378762, -0.00014188617933541536, -0.00012753752525895834, -0.0001131888639065437, -9.884020255412906e-05, -8.449154847767204e-05, -7.01428871252574e-05, -5.5794225772842765e-05, -4.144556442042813e-05, -2.7096906705992296e-05, -1.2748248991556466e-05, 1.6004123608581722e-06, 1.594907371327281e-05, 3.0297727789729834e-05, 4.464638914214447e-05, 5.899505049455911e-05, 7.334371184697375e-05, 8.769237319938838e-05, 0.00010204102727584541, 0.00011638968862826005, 0.00013073834998067468, 0.0001450870040571317, 0.00015943567268550396, 0.00017378432676196098, 0.000188132980838418, 0.00020248164946679026, 0.00021683030354324728, 0.00023117897217161953, 0.00024552762624807656, 0.0002598762803245336, 0.0002742249344009906, 0.0002885736175812781, 0.0003029222716577351, 0.00031727092573419213, 0.00033161957981064916, 0.00034596826299093664, 0.00036031691706739366, 0.0003746655711438507, 0.0003890142252203077, 0.00040336287929676473, 0.00041771153337322176, 0.0004320601874496788, 0.00044640887062996626, 0.0004607575247064233, 0.0004751061787828803, 0.0004894548328593373, 0.0005038034869357944, 0.0005181521410122514, 0.0005325007950887084, 0.0005468494491651654, 0.0005611981032416224, 0.0005755467573180795, 0.0005898954113945365, 0.0006042440654709935, 0.0006185927777551115, 0.0006329414318315685]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 12.0, 25.0, 46.0, 97.0, 140.0, 181.0, 137.0, 177.0, 99.0, 48.0, 14.0, 10.0, 5.0, 4.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00029224157333374023, -0.00028496887534856796, -0.0002776961773633957, -0.0002704234793782234, -0.00026315078139305115, -0.0002558780834078789, -0.0002486053854227066, -0.00024133268743753433, -0.00023405998945236206, -0.0002267872914671898, -0.00021951459348201752, -0.00021224189549684525, -0.00020496919751167297, -0.0001976964995265007, -0.00019042380154132843, -0.00018315110355615616, -0.0001758784055709839, -0.00016860570758581161, -0.00016133300960063934, -0.00015406031161546707, -0.0001467876136302948, -0.00013951491564512253, -0.00013224221765995026, -0.00012496951967477798, -0.00011769682168960571, -0.00011042412370443344, -0.00010315142571926117, -9.58787277340889e-05, -8.860602974891663e-05, -8.133333176374435e-05, -7.406063377857208e-05, -6.678793579339981e-05, -5.951523780822754e-05, -5.224253982305527e-05, -4.4969841837882996e-05, -3.7697143852710724e-05, -3.0424445867538452e-05, -2.315174788236618e-05, -1.587904989719391e-05, -8.606351912021637e-06, -1.3336539268493652e-06, 5.9390440583229065e-06, 1.3211742043495178e-05, 2.048444002866745e-05, 2.775713801383972e-05, 3.5029835999011993e-05, 4.2302533984184265e-05, 4.957523196935654e-05, 5.684792995452881e-05, 6.412062793970108e-05, 7.139332592487335e-05, 7.866602391004562e-05, 8.59387218952179e-05, 9.321141988039017e-05, 0.00010048411786556244, 0.00010775681585073471, 0.00011502951383590698, 0.00012230221182107925, 0.00012957490980625153, 0.0001368476077914238, 0.00014412030577659607, 0.00015139300376176834, 0.0001586657017469406, 0.00016593839973211288, 0.00017321109771728516]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 8.0, 2.0, 8.0, 10.0, 16.0, 17.0, 26.0, 29.0, 35.0, 67.0, 88.0, 111.0, 170.0, 242.0, 373.0, 534.0, 909.0, 1455.0, 2649.0, 5553.0, 15080.0, 153695.0, 833031.0, 20151.0, 6659.0, 3032.0, 1639.0, 976.0, 608.0, 430.0, 258.0, 200.0, 135.0, 84.0, 79.0, 50.0, 30.0, 27.0, 34.0, 12.0, 11.0, 8.0, 8.0, 7.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.020172119140625, -0.01947927474975586, -0.01878643035888672, -0.018093585968017578, -0.017400741577148438, -0.016707897186279297, -0.016015052795410156, -0.015322208404541016, -0.014629364013671875, -0.013936519622802734, -0.013243675231933594, -0.012550830841064453, -0.011857986450195312, -0.011165142059326172, -0.010472297668457031, -0.00977945327758789, -0.00908660888671875, -0.00839376449584961, -0.007700920104980469, -0.007008075714111328, -0.0063152313232421875, -0.005622386932373047, -0.004929542541503906, -0.004236698150634766, -0.003543853759765625, -0.0028510093688964844, -0.0021581649780273438, -0.0014653205871582031, -0.0007724761962890625, -7.963180541992188e-05, 0.0006132125854492188, 0.0013060569763183594, 0.0019989013671875, 0.0026917457580566406, 0.0033845901489257812, 0.004077434539794922, 0.0047702789306640625, 0.005463123321533203, 0.006155967712402344, 0.006848812103271484, 0.007541656494140625, 0.008234500885009766, 0.008927345275878906, 0.009620189666748047, 0.010313034057617188, 0.011005878448486328, 0.011698722839355469, 0.01239156723022461, 0.01308441162109375, 0.01377725601196289, 0.014470100402832031, 0.015162944793701172, 0.015855789184570312, 0.016548633575439453, 0.017241477966308594, 0.017934322357177734, 0.018627166748046875, 0.019320011138916016, 0.020012855529785156, 0.020705699920654297, 0.021398544311523438, 0.022091388702392578, 0.02278423309326172, 0.02347707748413086, 0.024169921875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 13.0, 11.0, 9.0, 9.0, 16.0, 57.0, 136.0, 257.0, 229.0, 109.0, 29.0, 12.0, 9.0, 12.0, 11.0, 7.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 7.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007161378860473633, -0.006906986236572266, -0.0066525936126708984, -0.006398200988769531, -0.006143808364868164, -0.005889415740966797, -0.00563502311706543, -0.0053806304931640625, -0.005126237869262695, -0.004871845245361328, -0.004617452621459961, -0.004363059997558594, -0.0041086673736572266, -0.0038542747497558594, -0.003599882125854492, -0.003345489501953125, -0.003091096878051758, -0.0028367042541503906, -0.0025823116302490234, -0.0023279190063476562, -0.002073526382446289, -0.0018191337585449219, -0.0015647411346435547, -0.0013103485107421875, -0.0010559558868408203, -0.0008015632629394531, -0.0005471706390380859, -0.00029277801513671875, -3.838539123535156e-05, 0.00021600723266601562, 0.0004703998565673828, 0.00072479248046875, 0.0009791851043701172, 0.0012335777282714844, 0.0014879703521728516, 0.0017423629760742188, 0.001996755599975586, 0.002251148223876953, 0.0025055408477783203, 0.0027599334716796875, 0.0030143260955810547, 0.003268718719482422, 0.003523111343383789, 0.0037775039672851562, 0.0040318965911865234, 0.004286289215087891, 0.004540681838989258, 0.004795074462890625, 0.005049467086791992, 0.005303859710693359, 0.0055582523345947266, 0.005812644958496094, 0.006067037582397461, 0.006321430206298828, 0.006575822830200195, 0.0068302154541015625, 0.00708460807800293, 0.007339000701904297, 0.007593393325805664, 0.007847785949707031, 0.008102178573608398, 0.008356571197509766, 0.008610963821411133, 0.0088653564453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 5.0, 9.0, 12.0, 14.0, 17.0, 22.0, 17.0, 19.0, 19.0, 24.0, 27.0, 32.0, 48.0, 77.0, 114.0, 233.0, 436.0, 1037.0, 2405.0, 170034.0, 868522.0, 3086.0, 1038.0, 534.0, 261.0, 149.0, 76.0, 48.0, 35.0, 38.0, 33.0, 15.0, 13.0, 14.0, 10.0, 18.0, 5.0, 8.0, 11.0, 9.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0293121337890625, -0.02836894989013672, -0.027425765991210938, -0.026482582092285156, -0.025539398193359375, -0.024596214294433594, -0.023653030395507812, -0.02270984649658203, -0.02176666259765625, -0.02082347869873047, -0.019880294799804688, -0.018937110900878906, -0.017993927001953125, -0.017050743103027344, -0.016107559204101562, -0.015164375305175781, -0.01422119140625, -0.013278007507324219, -0.012334823608398438, -0.011391639709472656, -0.010448455810546875, -0.009505271911621094, -0.008562088012695312, -0.007618904113769531, -0.00667572021484375, -0.005732536315917969, -0.0047893524169921875, -0.0038461685180664062, -0.002902984619140625, -0.0019598007202148438, -0.0010166168212890625, -7.343292236328125e-05, 0.0008697509765625, 0.0018129348754882812, 0.0027561187744140625, 0.0036993026733398438, 0.004642486572265625, 0.005585670471191406, 0.0065288543701171875, 0.007472038269042969, 0.00841522216796875, 0.009358406066894531, 0.010301589965820312, 0.011244773864746094, 0.012187957763671875, 0.013131141662597656, 0.014074325561523438, 0.015017509460449219, 0.015960693359375, 0.01690387725830078, 0.017847061157226562, 0.018790245056152344, 0.019733428955078125, 0.020676612854003906, 0.021619796752929688, 0.02256298065185547, 0.02350616455078125, 0.02444934844970703, 0.025392532348632812, 0.026335716247558594, 0.027278900146484375, 0.028222084045410156, 0.029165267944335938, 0.03010845184326172, 0.0310516357421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 5.0, 9.0, 12.0, 14.0, 17.0, 22.0, 16.0, 20.0, 17.0, 22.0, 24.0, 25.0, 28.0, 30.0, 29.0, 41.0, 35.0, 42.0, 36.0, 32.0, 47.0, 45.0, 34.0, 36.0, 42.0, 36.0, 32.0, 31.0, 29.0, 31.0, 30.0, 15.0, 13.0, 14.0, 10.0, 19.0, 4.0, 8.0, 11.0, 9.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0174102783203125, -0.016849994659423828, -0.016289710998535156, -0.015729427337646484, -0.015169143676757812, -0.01460886001586914, -0.014048576354980469, -0.013488292694091797, -0.012928009033203125, -0.012367725372314453, -0.011807441711425781, -0.01124715805053711, -0.010686874389648438, -0.010126590728759766, -0.009566307067871094, -0.009006023406982422, -0.00844573974609375, -0.007885456085205078, -0.007325172424316406, -0.006764888763427734, -0.0062046051025390625, -0.005644321441650391, -0.005084037780761719, -0.004523754119873047, -0.003963470458984375, -0.003403186798095703, -0.0028429031372070312, -0.0022826194763183594, -0.0017223358154296875, -0.0011620521545410156, -0.0006017684936523438, -4.1484832763671875e-05, 0.000518798828125, 0.0010790824890136719, 0.0016393661499023438, 0.0021996498107910156, 0.0027599334716796875, 0.0033202171325683594, 0.0038805007934570312, 0.004440784454345703, 0.005001068115234375, 0.005561351776123047, 0.006121635437011719, 0.006681919097900391, 0.0072422027587890625, 0.007802486419677734, 0.008362770080566406, 0.008923053741455078, 0.00948333740234375, 0.010043621063232422, 0.010603904724121094, 0.011164188385009766, 0.011724472045898438, 0.01228475570678711, 0.012845039367675781, 0.013405323028564453, 0.013965606689453125, 0.014525890350341797, 0.015086174011230469, 0.01564645767211914, 0.016206741333007812, 0.016767024993896484, 0.017327308654785156, 0.017887592315673828, 0.0184478759765625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 1.0, 7.0, 5.0, 4.0, 4.0, 7.0, 10.0, 24.0, 35.0, 44.0, 86.0, 196.0, 344.0, 1235.0, 44626.0, 997557.0, 3239.0, 567.0, 241.0, 117.0, 63.0, 38.0, 25.0, 18.0, 11.0, 6.0, 8.0, 3.0, 7.0, 4.0, 4.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4007091522216797e-05, -1.3597309589385986e-05, -1.3187527656555176e-05, -1.2777745723724365e-05, -1.2367963790893555e-05, -1.1958181858062744e-05, -1.1548399925231934e-05, -1.1138617992401123e-05, -1.0728836059570312e-05, -1.0319054126739502e-05, -9.909272193908691e-06, -9.499490261077881e-06, -9.08970832824707e-06, -8.67992639541626e-06, -8.27014446258545e-06, -7.860362529754639e-06, -7.450580596923828e-06, -7.040798664093018e-06, -6.631016731262207e-06, -6.2212347984313965e-06, -5.811452865600586e-06, -5.401670932769775e-06, -4.991888999938965e-06, -4.582107067108154e-06, -4.172325134277344e-06, -3.762543201446533e-06, -3.3527612686157227e-06, -2.942979335784912e-06, -2.5331974029541016e-06, -2.123415470123291e-06, -1.7136335372924805e-06, -1.30385160446167e-06, -8.940696716308594e-07, -4.842877388000488e-07, -7.450580596923828e-08, 3.3527612686157227e-07, 7.450580596923828e-07, 1.1548399925231934e-06, 1.564621925354004e-06, 1.9744038581848145e-06, 2.384185791015625e-06, 2.7939677238464355e-06, 3.203749656677246e-06, 3.6135315895080566e-06, 4.023313522338867e-06, 4.433095455169678e-06, 4.842877388000488e-06, 5.252659320831299e-06, 5.662441253662109e-06, 6.07222318649292e-06, 6.4820051193237305e-06, 6.891787052154541e-06, 7.3015689849853516e-06, 7.711350917816162e-06, 8.121132850646973e-06, 8.530914783477783e-06, 8.940696716308594e-06, 9.350478649139404e-06, 9.760260581970215e-06, 1.0170042514801025e-05, 1.0579824447631836e-05, 1.0989606380462646e-05, 1.1399388313293457e-05, 1.1809170246124268e-05, 1.2218952178955078e-05]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 7.0, 4.0, 3.0, 4.0, 4.0, 7.0, 4.0, 6.0, 5.0, 18.0, 23.0, 29.0, 31.0, 56.0, 64.0, 69.0, 102.0, 146.0, 84.0, 74.0, 75.0, 40.0, 34.0, 30.0, 20.0, 14.0, 10.0, 7.0, 4.0, 5.0, 8.0, 4.0, 4.0, 5.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.165836334228516e-06, -7.927417755126953e-06, -7.68899917602539e-06, -7.450580596923828e-06, -7.212162017822266e-06, -6.973743438720703e-06, -6.735324859619141e-06, -6.496906280517578e-06, -6.258487701416016e-06, -6.020069122314453e-06, -5.781650543212891e-06, -5.543231964111328e-06, -5.304813385009766e-06, -5.066394805908203e-06, -4.827976226806641e-06, -4.589557647705078e-06, -4.351139068603516e-06, -4.112720489501953e-06, -3.874301910400391e-06, -3.635883331298828e-06, -3.3974647521972656e-06, -3.159046173095703e-06, -2.9206275939941406e-06, -2.682209014892578e-06, -2.4437904357910156e-06, -2.205371856689453e-06, -1.9669532775878906e-06, -1.7285346984863281e-06, -1.4901161193847656e-06, -1.2516975402832031e-06, -1.0132789611816406e-06, -7.748603820800781e-07, -5.364418029785156e-07, -2.980232238769531e-07, -5.960464477539063e-08, 1.7881393432617188e-07, 4.172325134277344e-07, 6.556510925292969e-07, 8.940696716308594e-07, 1.1324882507324219e-06, 1.3709068298339844e-06, 1.6093254089355469e-06, 1.8477439880371094e-06, 2.086162567138672e-06, 2.3245811462402344e-06, 2.562999725341797e-06, 2.8014183044433594e-06, 3.039836883544922e-06, 3.2782554626464844e-06, 3.516674041748047e-06, 3.7550926208496094e-06, 3.993511199951172e-06, 4.231929779052734e-06, 4.470348358154297e-06, 4.708766937255859e-06, 4.947185516357422e-06, 5.185604095458984e-06, 5.424022674560547e-06, 5.662441253662109e-06, 5.900859832763672e-06, 6.139278411865234e-06, 6.377696990966797e-06, 6.616115570068359e-06, 6.854534149169922e-06, 7.092952728271484e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 6.0, 4.0, 3.0, 7.0, 5.0, 16.0, 20.0, 41.0, 92.0, 232.0, 632.0, 1028564.0, 18057.0, 510.0, 178.0, 78.0, 36.0, 17.0, 16.0, 7.0, 9.0, 5.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.6133995056152344e-05, -4.497729241847992e-05, -4.3820589780807495e-05, -4.266388714313507e-05, -4.1507184505462646e-05, -4.035048186779022e-05, -3.91937792301178e-05, -3.8037076592445374e-05, -3.688037395477295e-05, -3.5723671317100525e-05, -3.45669686794281e-05, -3.3410266041755676e-05, -3.225356340408325e-05, -3.109686076641083e-05, -2.9940158128738403e-05, -2.878345549106598e-05, -2.7626752853393555e-05, -2.647005021572113e-05, -2.5313347578048706e-05, -2.4156644940376282e-05, -2.2999942302703857e-05, -2.1843239665031433e-05, -2.068653702735901e-05, -1.9529834389686584e-05, -1.837313175201416e-05, -1.7216429114341736e-05, -1.605972647666931e-05, -1.4903023838996887e-05, -1.3746321201324463e-05, -1.2589618563652039e-05, -1.1432915925979614e-05, -1.027621328830719e-05, -9.119510650634766e-06, -7.962808012962341e-06, -6.806105375289917e-06, -5.649402737617493e-06, -4.492700099945068e-06, -3.335997462272644e-06, -2.1792948246002197e-06, -1.0225921869277954e-06, 1.341104507446289e-07, 1.2908130884170532e-06, 2.4475157260894775e-06, 3.604218363761902e-06, 4.760921001434326e-06, 5.9176236391067505e-06, 7.074326276779175e-06, 8.231028914451599e-06, 9.387731552124023e-06, 1.0544434189796448e-05, 1.1701136827468872e-05, 1.2857839465141296e-05, 1.401454210281372e-05, 1.5171244740486145e-05, 1.632794737815857e-05, 1.7484650015830994e-05, 1.8641352653503418e-05, 1.9798055291175842e-05, 2.0954757928848267e-05, 2.211146056652069e-05, 2.3268163204193115e-05, 2.442486584186554e-05, 2.5581568479537964e-05, 2.6738271117210388e-05, 2.7894973754882812e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 6.0, 2.0, 8.0, 10.0, 12.0, 21.0, 36.0, 83.0, 463.0, 146.0, 71.0, 46.0, 17.0, 11.0, 7.0, 13.0, 7.0, 9.0, 3.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7358531951904297e-05, -2.6673078536987305e-05, -2.5987625122070312e-05, -2.530217170715332e-05, -2.4616718292236328e-05, -2.3931264877319336e-05, -2.3245811462402344e-05, -2.256035804748535e-05, -2.187490463256836e-05, -2.1189451217651367e-05, -2.0503997802734375e-05, -1.9818544387817383e-05, -1.913309097290039e-05, -1.84476375579834e-05, -1.7762184143066406e-05, -1.7076730728149414e-05, -1.6391277313232422e-05, -1.570582389831543e-05, -1.5020370483398438e-05, -1.4334917068481445e-05, -1.3649463653564453e-05, -1.2964010238647461e-05, -1.2278556823730469e-05, -1.1593103408813477e-05, -1.0907649993896484e-05, -1.0222196578979492e-05, -9.5367431640625e-06, -8.851289749145508e-06, -8.165836334228516e-06, -7.4803829193115234e-06, -6.794929504394531e-06, -6.109476089477539e-06, -5.424022674560547e-06, -4.738569259643555e-06, -4.0531158447265625e-06, -3.3676624298095703e-06, -2.682209014892578e-06, -1.996755599975586e-06, -1.3113021850585938e-06, -6.258487701416016e-07, 5.960464477539063e-08, 7.450580596923828e-07, 1.430511474609375e-06, 2.115964889526367e-06, 2.8014183044433594e-06, 3.4868717193603516e-06, 4.172325134277344e-06, 4.857778549194336e-06, 5.543231964111328e-06, 6.22868537902832e-06, 6.9141387939453125e-06, 7.599592208862305e-06, 8.285045623779297e-06, 8.970499038696289e-06, 9.655952453613281e-06, 1.0341405868530273e-05, 1.1026859283447266e-05, 1.1712312698364258e-05, 1.239776611328125e-05, 1.3083219528198242e-05, 1.3768672943115234e-05, 1.4454126358032227e-05, 1.5139579772949219e-05, 1.582503318786621e-05, 1.6510486602783203e-05]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 15.0, 833.0, 164.0, 3.0, 2.0, 2.0], "bins": [-0.5653712749481201, -0.5559164881706238, -0.5464617013931274, -0.5370069146156311, -0.5275521278381348, -0.5180974006652832, -0.5086426138877869, -0.49918779730796814, -0.4897330403327942, -0.48027825355529785, -0.4708234667778015, -0.46136870980262756, -0.4519139230251312, -0.4424591362476349, -0.43300434947013855, -0.4235495626926422, -0.4140947759151459, -0.40463998913764954, -0.3951852023601532, -0.38573044538497925, -0.3762756586074829, -0.3668208718299866, -0.35736608505249023, -0.3479112982749939, -0.33845651149749756, -0.3290017247200012, -0.3195469379425049, -0.31009218096733093, -0.3006373941898346, -0.29118260741233826, -0.2817278206348419, -0.2722730338573456, -0.26281827688217163, -0.2533634901046753, -0.24390871822834015, -0.2344539314508438, -0.22499915957450867, -0.21554437279701233, -0.206089586019516, -0.19663479924201965, -0.18718001246452332, -0.17772522568702698, -0.16827045381069183, -0.1588156670331955, -0.14936089515686035, -0.139906108379364, -0.13045132160186768, -0.12099654227495193, -0.11154177039861679, -0.10208699107170105, -0.09263220429420471, -0.08317742496728897, -0.07372264564037323, -0.06426786631345749, -0.05481308326125145, -0.04535830020904541, -0.03590352088212967, -0.02644873969256878, -0.01699395850300789, -0.007539177313446999, 0.0019156038761138916, 0.011370383203029633, 0.020825166255235672, 0.03027994930744171, 0.03973472863435745]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 6.0, 8.0, 9.0, 4.0, 11.0, 12.0, 15.0, 17.0, 21.0, 19.0, 21.0, 29.0, 29.0, 50.0, 43.0, 43.0, 44.0, 47.0, 48.0, 52.0, 58.0, 37.0, 58.0, 39.0, 31.0, 39.0, 28.0, 31.0, 32.0, 20.0, 16.0, 14.0, 9.0, 7.0, 8.0, 13.0, 4.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0904165506362915, -0.08730985969305038, -0.08420316874980927, -0.08109647780656815, -0.07798978686332703, -0.0748831033706665, -0.07177641242742538, -0.06866972148418427, -0.06556303054094315, -0.062456339597702026, -0.05934964865446091, -0.056242961436510086, -0.05313627049326897, -0.05002957955002785, -0.046922892332077026, -0.04381620138883591, -0.04070951044559479, -0.03760281950235367, -0.03449612855911255, -0.03138944134116173, -0.02828275039792061, -0.02517605945467949, -0.02206937037408352, -0.01896268129348755, -0.01585599035024643, -0.012749300338327885, -0.00964261032640934, -0.006535920314490795, -0.0034292303025722504, -0.0003225402906537056, 0.002784149721264839, 0.005890838801860809, 0.008997529745101929, 0.012104219757020473, 0.015210909768939018, 0.01831759884953499, 0.021424289792776108, 0.024530980736017227, 0.027637669816613197, 0.030744358897209167, 0.03385104984045029, 0.036957740783691406, 0.040064431726932526, 0.04317111894488335, 0.046277809888124466, 0.049384500831365585, 0.052491188049316406, 0.055597878992557526, 0.058704569935798645, 0.061811260879039764, 0.06491795182228088, 0.068024642765522, 0.07113133370876312, 0.07423801720142365, 0.07734470814466476, 0.08045139908790588, 0.083558090031147, 0.08666478097438812, 0.08977147191762924, 0.09287816286087036, 0.09598484635353088, 0.099091537296772, 0.10219822824001312, 0.10530491918325424, 0.10841161012649536]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 8.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 8.0, 7.0, 7.0, 14.0, 9.0, 13.0, 26.0, 85.0, 2331.0, 4191427.0, 152.0, 74.0, 19.0, 10.0, 9.0, 12.0, 13.0, 3.0, 4.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0007352828979492188, -0.0007142797112464905, -0.0006932765245437622, -0.0006722733378410339, -0.0006512701511383057, -0.0006302669644355774, -0.0006092637777328491, -0.0005882605910301208, -0.0005672574043273926, -0.0005462542176246643, -0.000525251030921936, -0.0005042478442192078, -0.0004832446575164795, -0.0004622414708137512, -0.00044123828411102295, -0.0004202350974082947, -0.0003992319107055664, -0.00037822872400283813, -0.00035722553730010986, -0.0003362223505973816, -0.0003152191638946533, -0.00029421597719192505, -0.0002732127904891968, -0.0002522096037864685, -0.00023120641708374023, -0.00021020323038101196, -0.0001892000436782837, -0.00016819685697555542, -0.00014719367027282715, -0.00012619048357009888, -0.0001051872968673706, -8.418411016464233e-05, -6.318092346191406e-05, -4.217773675918579e-05, -2.117455005645752e-05, -1.7136335372924805e-07, 2.0831823348999023e-05, 4.1835010051727295e-05, 6.283819675445557e-05, 8.384138345718384e-05, 0.00010484457015991211, 0.00012584775686264038, 0.00014685094356536865, 0.00016785413026809692, 0.0001888573169708252, 0.00020986050367355347, 0.00023086369037628174, 0.00025186687707901, 0.0002728700637817383, 0.00029387325048446655, 0.0003148764371871948, 0.0003358796238899231, 0.00035688281059265137, 0.00037788599729537964, 0.0003988891839981079, 0.0004198923707008362, 0.00044089555740356445, 0.0004618987441062927, 0.000482901930809021, 0.0005039051175117493, 0.0005249083042144775, 0.0005459114909172058, 0.0005669146776199341, 0.0005879178643226624, 0.0006089210510253906]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 12.0, 13.0, 9.0, 9.0, 16.0, 55.0, 129.0, 264.0, 225.0, 113.0, 31.0, 12.0, 9.0, 13.0, 10.0, 7.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007161617279052734, -0.006907463073730469, -0.006653308868408203, -0.0063991546630859375, -0.006145000457763672, -0.005890846252441406, -0.005636692047119141, -0.005382537841796875, -0.005128383636474609, -0.004874229431152344, -0.004620075225830078, -0.0043659210205078125, -0.004111766815185547, -0.0038576126098632812, -0.0036034584045410156, -0.00334930419921875, -0.0030951499938964844, -0.0028409957885742188, -0.002586841583251953, -0.0023326873779296875, -0.002078533172607422, -0.0018243789672851562, -0.0015702247619628906, -0.001316070556640625, -0.0010619163513183594, -0.0008077621459960938, -0.0005536079406738281, -0.0002994537353515625, -4.5299530029296875e-05, 0.00020885467529296875, 0.0004630088806152344, 0.0007171630859375, 0.0009713172912597656, 0.0012254714965820312, 0.0014796257019042969, 0.0017337799072265625, 0.001987934112548828, 0.0022420883178710938, 0.0024962425231933594, 0.002750396728515625, 0.0030045509338378906, 0.0032587051391601562, 0.003512859344482422, 0.0037670135498046875, 0.004021167755126953, 0.004275321960449219, 0.004529476165771484, 0.00478363037109375, 0.005037784576416016, 0.005291938781738281, 0.005546092987060547, 0.0058002471923828125, 0.006054401397705078, 0.006308555603027344, 0.006562709808349609, 0.006816864013671875, 0.007071018218994141, 0.007325172424316406, 0.007579326629638672, 0.007833480834960938, 0.008087635040283203, 0.008341789245605469, 0.008595943450927734, 0.00885009765625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 8.0, 35.0, 45.0, 97.0, 128.0, 126.0, 4193410.0, 134.0, 105.0, 84.0, 53.0, 31.0, 18.0, 7.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008306503295898438, -0.0008111335337162018, -0.0007916167378425598, -0.0007720999419689178, -0.0007525831460952759, -0.0007330663502216339, -0.0007135495543479919, -0.00069403275847435, -0.000674515962600708, -0.000654999166727066, -0.0006354823708534241, -0.0006159655749797821, -0.0005964487791061401, -0.0005769319832324982, -0.0005574151873588562, -0.0005378983914852142, -0.0005183815956115723, -0.0004988647997379303, -0.00047934800386428833, -0.00045983120799064636, -0.0004403144121170044, -0.0004207976162433624, -0.00040128082036972046, -0.0003817640244960785, -0.0003622472286224365, -0.00034273043274879456, -0.0003232136368751526, -0.0003036968410015106, -0.00028418004512786865, -0.0002646632492542267, -0.0002451464533805847, -0.00022562965750694275, -0.00020611286163330078, -0.0001865960657596588, -0.00016707926988601685, -0.00014756247401237488, -0.0001280456781387329, -0.00010852888226509094, -8.901208639144897e-05, -6.949529051780701e-05, -4.997849464416504e-05, -3.046169877052307e-05, -1.0944902896881104e-05, 8.571892976760864e-06, 2.8088688850402832e-05, 4.76054847240448e-05, 6.712228059768677e-05, 8.663907647132874e-05, 0.0001061558723449707, 0.00012567266821861267, 0.00014518946409225464, 0.0001647062599658966, 0.00018422305583953857, 0.00020373985171318054, 0.0002232566475868225, 0.00024277344346046448, 0.00026229023933410645, 0.0002818070352077484, 0.0003013238310813904, 0.00032084062695503235, 0.0003403574228286743, 0.0003598742187023163, 0.00037939101457595825, 0.0003989078104496002, 0.0004184246063232422]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4093.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.854534149169922e-06, -3.998167812824249e-06, -1.1418014764785767e-06, 1.714564859867096e-06, 4.5709311962127686e-06, 7.427297532558441e-06, 1.0283663868904114e-05, 1.3140030205249786e-05, 1.599639654159546e-05, 1.885276287794113e-05, 2.1709129214286804e-05, 2.4565495550632477e-05, 2.742186188697815e-05, 3.0278228223323822e-05, 3.3134594559669495e-05, 3.599096089601517e-05, 3.884732723236084e-05, 4.170369356870651e-05, 4.4560059905052185e-05, 4.741642624139786e-05, 5.027279257774353e-05, 5.31291589140892e-05, 5.5985525250434875e-05, 5.884189158678055e-05, 6.169825792312622e-05, 6.45546242594719e-05, 6.741099059581757e-05, 7.026735693216324e-05, 7.312372326850891e-05, 7.598008960485458e-05, 7.883645594120026e-05, 8.169282227754593e-05, 8.45491886138916e-05, 8.740555495023727e-05, 9.026192128658295e-05, 9.311828762292862e-05, 9.597465395927429e-05, 9.883102029561996e-05, 0.00010168738663196564, 0.00010454375296831131, 0.00010740011930465698, 0.00011025648564100266, 0.00011311285197734833, 0.000115969218313694, 0.00011882558465003967, 0.00012168195098638535, 0.00012453831732273102, 0.0001273946836590767, 0.00013025104999542236, 0.00013310741633176804, 0.0001359637826681137, 0.00013882014900445938, 0.00014167651534080505, 0.00014453288167715073, 0.0001473892480134964, 0.00015024561434984207, 0.00015310198068618774, 0.00015595834702253342, 0.0001588147133588791, 0.00016167107969522476, 0.00016452744603157043, 0.0001673838123679161, 0.00017024017870426178, 0.00017309654504060745, 0.00017595291137695312]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 980.0, 26.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007240754785016179, -0.0007026340463198721, -0.0006811925559304655, -0.0006597511237487197, -0.000638309633359313, -0.0006168682011775672, -0.0005954267689958215, -0.0005739852786064148, -0.000552543846424669, -0.0005311024142429233, -0.0005096609238535166, -0.0004882194916717708, -0.0004667780303861946, -0.00044533656910061836, -0.0004238951369188726, -0.00040245367563329637, -0.00038101221434772015, -0.0003595707530621439, -0.0003381292917765677, -0.00031668785959482193, -0.0002952463983092457, -0.0002738049370236695, -0.0002523635048419237, -0.0002309220435563475, -0.00020948058227077127, -0.00018803912098519504, -0.00016659767425153404, -0.00014515622751787305, -0.00012371476623229682, -0.00010227331222267821, -8.08318582130596e-05, -5.939041147939861e-05, -3.7948950193822384e-05, -1.6507496184203774e-05, 4.933957825414836e-06, 2.6375411835033447e-05, 4.781686584465206e-05, 6.925831985427067e-05, 9.069977386388928e-05, 0.00011214122059755027, 0.0001335826818831265, 0.00015502414316870272, 0.00017646558990236372, 0.0001979070366360247, 0.00021934849792160094, 0.00024078995920717716, 0.00026223139138892293, 0.00028367285267449915, 0.0003051143139600754, 0.0003265557752456516, 0.0003479972365312278, 0.0003694386687129736, 0.0003908801299985498, 0.00041232159128412604, 0.0004337630234658718, 0.00045520448475144804, 0.00047664594603702426, 0.00049808737821877, 0.0005195288686081767, 0.0005409703007899225, 0.0005624117329716682, 0.0005838532233610749, 0.0006052946555428207, 0.0006267360877245665, 0.0006481775781139731]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 10.0, 2.0, 14.0, 27.0, 84.0, 106.0, 222.0, 159.0, 192.0, 91.0, 64.0, 13.0, 7.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014632940292358398, -0.00013832375407218933, -0.00013031810522079468, -0.00012231245636940002, -0.00011430680751800537, -0.00010630115866661072, -9.829550981521606e-05, -9.028986096382141e-05, -8.228421211242676e-05, -7.42785632610321e-05, -6.627291440963745e-05, -5.82672655582428e-05, -5.0261616706848145e-05, -4.225596785545349e-05, -3.425031900405884e-05, -2.6244670152664185e-05, -1.823902130126953e-05, -1.0233372449874878e-05, -2.2277235984802246e-06, 5.777925252914429e-06, 1.3783574104309082e-05, 2.1789222955703735e-05, 2.979487180709839e-05, 3.780052065849304e-05, 4.5806169509887695e-05, 5.381181836128235e-05, 6.1817467212677e-05, 6.982311606407166e-05, 7.782876491546631e-05, 8.583441376686096e-05, 9.384006261825562e-05, 0.00010184571146965027, 0.00010985136032104492, 0.00011785700917243958, 0.00012586265802383423, 0.00013386830687522888, 0.00014187395572662354, 0.0001498796045780182, 0.00015788525342941284, 0.0001658909022808075, 0.00017389655113220215, 0.0001819021999835968, 0.00018990784883499146, 0.0001979134976863861, 0.00020591914653778076, 0.00021392479538917542, 0.00022193044424057007, 0.00022993609309196472, 0.00023794174194335938, 0.00024594739079475403, 0.0002539530396461487, 0.00026195868849754333, 0.000269964337348938, 0.00027796998620033264, 0.0002859756350517273, 0.00029398128390312195, 0.0003019869327545166, 0.00030999258160591125, 0.0003179982304573059, 0.00032600387930870056, 0.0003340095281600952, 0.00034201517701148987, 0.0003500208258628845, 0.0003580264747142792, 0.00036603212356567383]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 3.0, 7.0, 10.0, 4.0, 8.0, 9.0, 14.0, 10.0, 19.0, 35.0, 63.0, 108.0, 239.0, 488.0, 1033.0, 2908.0, 12267.0, 890052.0, 128634.0, 8578.0, 2330.0, 852.0, 402.0, 190.0, 99.0, 58.0, 26.0, 22.0, 14.0, 13.0, 10.0, 7.0, 5.0, 6.0, 6.0, 4.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.03643798828125, -0.03539395332336426, -0.034349918365478516, -0.03330588340759277, -0.03226184844970703, -0.03121781349182129, -0.030173778533935547, -0.029129743576049805, -0.028085708618164062, -0.02704167366027832, -0.025997638702392578, -0.024953603744506836, -0.023909568786621094, -0.02286553382873535, -0.02182149887084961, -0.020777463912963867, -0.019733428955078125, -0.018689393997192383, -0.01764535903930664, -0.0166013240814209, -0.015557289123535156, -0.014513254165649414, -0.013469219207763672, -0.01242518424987793, -0.011381149291992188, -0.010337114334106445, -0.009293079376220703, -0.008249044418334961, -0.007205009460449219, -0.0061609745025634766, -0.005116939544677734, -0.004072904586791992, -0.00302886962890625, -0.001984834671020508, -0.0009407997131347656, 0.00010323524475097656, 0.0011472702026367188, 0.002191305160522461, 0.003235340118408203, 0.004279375076293945, 0.0053234100341796875, 0.00636744499206543, 0.007411479949951172, 0.008455514907836914, 0.009499549865722656, 0.010543584823608398, 0.01158761978149414, 0.012631654739379883, 0.013675689697265625, 0.014719724655151367, 0.01576375961303711, 0.01680779457092285, 0.017851829528808594, 0.018895864486694336, 0.019939899444580078, 0.02098393440246582, 0.022027969360351562, 0.023072004318237305, 0.024116039276123047, 0.02516007423400879, 0.02620410919189453, 0.027248144149780273, 0.028292179107666016, 0.029336214065551758, 0.0303802490234375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 12.0, 13.0, 9.0, 9.0, 16.0, 55.0, 129.0, 264.0, 225.0, 113.0, 31.0, 12.0, 9.0, 13.0, 10.0, 7.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007161617279052734, -0.006907463073730469, -0.006653308868408203, -0.0063991546630859375, -0.006145000457763672, -0.005890846252441406, -0.005636692047119141, -0.005382537841796875, -0.005128383636474609, -0.004874229431152344, -0.004620075225830078, -0.0043659210205078125, -0.004111766815185547, -0.0038576126098632812, -0.0036034584045410156, -0.00334930419921875, -0.0030951499938964844, -0.0028409957885742188, -0.002586841583251953, -0.0023326873779296875, -0.002078533172607422, -0.0018243789672851562, -0.0015702247619628906, -0.001316070556640625, -0.0010619163513183594, -0.0008077621459960938, -0.0005536079406738281, -0.0002994537353515625, -4.5299530029296875e-05, 0.00020885467529296875, 0.0004630088806152344, 0.0007171630859375, 0.0009713172912597656, 0.0012254714965820312, 0.0014796257019042969, 0.0017337799072265625, 0.001987934112548828, 0.0022420883178710938, 0.0024962425231933594, 0.002750396728515625, 0.0030045509338378906, 0.0032587051391601562, 0.003512859344482422, 0.0037670135498046875, 0.004021167755126953, 0.004275321960449219, 0.004529476165771484, 0.00478363037109375, 0.005037784576416016, 0.005291938781738281, 0.005546092987060547, 0.0058002471923828125, 0.006054401397705078, 0.006308555603027344, 0.006562709808349609, 0.006816864013671875, 0.007071018218994141, 0.007325172424316406, 0.007579326629638672, 0.007833480834960938, 0.008087635040283203, 0.008341789245605469, 0.008595943450927734, 0.00885009765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 2.0, 6.0, 3.0, 6.0, 10.0, 7.0, 8.0, 12.0, 14.0, 26.0, 17.0, 28.0, 23.0, 34.0, 34.0, 56.0, 92.0, 180.0, 391.0, 876.0, 3224.0, 964860.0, 75165.0, 1939.0, 724.0, 286.0, 142.0, 70.0, 52.0, 33.0, 37.0, 24.0, 18.0, 23.0, 15.0, 24.0, 14.0, 14.0, 16.0, 9.0, 5.0, 6.0, 4.0, 6.0, 3.0, 4.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0262908935546875, -0.025438547134399414, -0.024586200714111328, -0.023733854293823242, -0.022881507873535156, -0.02202916145324707, -0.021176815032958984, -0.0203244686126709, -0.019472122192382812, -0.018619775772094727, -0.01776742935180664, -0.016915082931518555, -0.01606273651123047, -0.015210390090942383, -0.014358043670654297, -0.013505697250366211, -0.012653350830078125, -0.011801004409790039, -0.010948657989501953, -0.010096311569213867, -0.009243965148925781, -0.008391618728637695, -0.007539272308349609, -0.0066869258880615234, -0.0058345794677734375, -0.0049822330474853516, -0.004129886627197266, -0.0032775402069091797, -0.0024251937866210938, -0.0015728473663330078, -0.0007205009460449219, 0.00013184547424316406, 0.00098419189453125, 0.001836538314819336, 0.002688884735107422, 0.003541231155395508, 0.004393577575683594, 0.00524592399597168, 0.006098270416259766, 0.0069506168365478516, 0.0078029632568359375, 0.008655309677124023, 0.00950765609741211, 0.010360002517700195, 0.011212348937988281, 0.012064695358276367, 0.012917041778564453, 0.013769388198852539, 0.014621734619140625, 0.015474081039428711, 0.016326427459716797, 0.017178773880004883, 0.01803112030029297, 0.018883466720581055, 0.01973581314086914, 0.020588159561157227, 0.021440505981445312, 0.0222928524017334, 0.023145198822021484, 0.02399754524230957, 0.024849891662597656, 0.025702238082885742, 0.026554584503173828, 0.027406930923461914, 0.02825927734375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 2.0, 6.0, 3.0, 6.0, 10.0, 7.0, 9.0, 12.0, 15.0, 25.0, 16.0, 28.0, 23.0, 31.0, 29.0, 31.0, 36.0, 40.0, 36.0, 36.0, 46.0, 42.0, 42.0, 31.0, 42.0, 29.0, 38.0, 30.0, 38.0, 30.0, 36.0, 25.0, 17.0, 24.0, 14.0, 25.0, 14.0, 16.0, 13.0, 9.0, 5.0, 6.0, 4.0, 6.0, 3.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.016326904296875, -0.015796899795532227, -0.015266895294189453, -0.01473689079284668, -0.014206886291503906, -0.013676881790161133, -0.01314687728881836, -0.012616872787475586, -0.012086868286132812, -0.011556863784790039, -0.011026859283447266, -0.010496854782104492, -0.009966850280761719, -0.009436845779418945, -0.008906841278076172, -0.008376836776733398, -0.007846832275390625, -0.0073168277740478516, -0.006786823272705078, -0.006256818771362305, -0.005726814270019531, -0.005196809768676758, -0.004666805267333984, -0.004136800765991211, -0.0036067962646484375, -0.003076791763305664, -0.0025467872619628906, -0.002016782760620117, -0.0014867782592773438, -0.0009567737579345703, -0.0004267692565917969, 0.00010323524475097656, 0.00063323974609375, 0.0011632442474365234, 0.0016932487487792969, 0.0022232532501220703, 0.0027532577514648438, 0.003283262252807617, 0.0038132667541503906, 0.004343271255493164, 0.0048732757568359375, 0.005403280258178711, 0.005933284759521484, 0.006463289260864258, 0.006993293762207031, 0.007523298263549805, 0.008053302764892578, 0.008583307266235352, 0.009113311767578125, 0.009643316268920898, 0.010173320770263672, 0.010703325271606445, 0.011233329772949219, 0.011763334274291992, 0.012293338775634766, 0.012823343276977539, 0.013353347778320312, 0.013883352279663086, 0.01441335678100586, 0.014943361282348633, 0.015473365783691406, 0.01600337028503418, 0.016533374786376953, 0.017063379287719727, 0.0175933837890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 8.0, 17.0, 9.0, 15.0, 18.0, 23.0, 20.0, 25.0, 32.0, 72.0, 93.0, 250.0, 414.0, 1661.0, 6416.0, 899259.0, 131110.0, 7112.0, 1013.0, 472.0, 150.0, 115.0, 45.0, 37.0, 19.0, 34.0, 16.0, 20.0, 17.0, 14.0, 6.0, 9.0, 3.0, 7.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.602836608886719e-06, -5.3942203521728516e-06, -5.185604095458984e-06, -4.976987838745117e-06, -4.76837158203125e-06, -4.559755325317383e-06, -4.351139068603516e-06, -4.1425228118896484e-06, -3.933906555175781e-06, -3.725290298461914e-06, -3.516674041748047e-06, -3.3080577850341797e-06, -3.0994415283203125e-06, -2.8908252716064453e-06, -2.682209014892578e-06, -2.473592758178711e-06, -2.2649765014648438e-06, -2.0563602447509766e-06, -1.8477439880371094e-06, -1.6391277313232422e-06, -1.430511474609375e-06, -1.2218952178955078e-06, -1.0132789611816406e-06, -8.046627044677734e-07, -5.960464477539062e-07, -3.8743019104003906e-07, -1.7881393432617188e-07, 2.9802322387695312e-08, 2.384185791015625e-07, 4.470348358154297e-07, 6.556510925292969e-07, 8.642673492431641e-07, 1.0728836059570312e-06, 1.2814998626708984e-06, 1.4901161193847656e-06, 1.6987323760986328e-06, 1.9073486328125e-06, 2.115964889526367e-06, 2.3245811462402344e-06, 2.5331974029541016e-06, 2.7418136596679688e-06, 2.950429916381836e-06, 3.159046173095703e-06, 3.3676624298095703e-06, 3.5762786865234375e-06, 3.7848949432373047e-06, 3.993511199951172e-06, 4.202127456665039e-06, 4.410743713378906e-06, 4.6193599700927734e-06, 4.827976226806641e-06, 5.036592483520508e-06, 5.245208740234375e-06, 5.453824996948242e-06, 5.662441253662109e-06, 5.8710575103759766e-06, 6.079673767089844e-06, 6.288290023803711e-06, 6.496906280517578e-06, 6.705522537231445e-06, 6.9141387939453125e-06, 7.12275505065918e-06, 7.331371307373047e-06, 7.539987564086914e-06, 7.748603820800781e-06]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 8.0, 5.0, 12.0, 10.0, 10.0, 10.0, 22.0, 9.0, 10.0, 17.0, 20.0, 43.0, 30.0, 50.0, 61.0, 53.0, 50.0, 113.0, 69.0, 59.0, 54.0, 43.0, 41.0, 27.0, 24.0, 15.0, 24.0, 11.0, 16.0, 15.0, 14.0, 9.0, 15.0, 8.0, 5.0, 1.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.3974647521972656e-06, -3.275461494922638e-06, -3.1534582376480103e-06, -3.0314549803733826e-06, -2.909451723098755e-06, -2.787448465824127e-06, -2.6654452085494995e-06, -2.543441951274872e-06, -2.421438694000244e-06, -2.2994354367256165e-06, -2.1774321794509888e-06, -2.055428922176361e-06, -1.9334256649017334e-06, -1.8114224076271057e-06, -1.689419150352478e-06, -1.5674158930778503e-06, -1.4454126358032227e-06, -1.323409378528595e-06, -1.2014061212539673e-06, -1.0794028639793396e-06, -9.57399606704712e-07, -8.353963494300842e-07, -7.133930921554565e-07, -5.913898348808289e-07, -4.6938657760620117e-07, -3.473833203315735e-07, -2.253800630569458e-07, -1.0337680578231812e-07, 1.862645149230957e-08, 1.4062970876693726e-07, 2.6263296604156494e-07, 3.8463622331619263e-07, 5.066394805908203e-07, 6.28642737865448e-07, 7.506459951400757e-07, 8.726492524147034e-07, 9.94652509689331e-07, 1.1166557669639587e-06, 1.2386590242385864e-06, 1.3606622815132141e-06, 1.4826655387878418e-06, 1.6046687960624695e-06, 1.7266720533370972e-06, 1.8486753106117249e-06, 1.9706785678863525e-06, 2.0926818251609802e-06, 2.214685082435608e-06, 2.3366883397102356e-06, 2.4586915969848633e-06, 2.580694854259491e-06, 2.7026981115341187e-06, 2.8247013688087463e-06, 2.946704626083374e-06, 3.0687078833580017e-06, 3.1907111406326294e-06, 3.312714397907257e-06, 3.4347176551818848e-06, 3.5567209124565125e-06, 3.67872416973114e-06, 3.800727427005768e-06, 3.9227306842803955e-06, 4.044733941555023e-06, 4.166737198829651e-06, 4.2887404561042786e-06, 4.410743713378906e-06]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 7.0, 10.0, 13.0, 21.0, 28.0, 76.0, 225.0, 1763.0, 1044655.0, 1365.0, 213.0, 77.0, 36.0, 16.0, 7.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.504753112792969e-05, -3.418140113353729e-05, -3.33152711391449e-05, -3.24491411447525e-05, -3.158301115036011e-05, -3.071688115596771e-05, -2.9850751161575317e-05, -2.8984621167182922e-05, -2.8118491172790527e-05, -2.7252361178398132e-05, -2.6386231184005737e-05, -2.5520101189613342e-05, -2.4653971195220947e-05, -2.3787841200828552e-05, -2.2921711206436157e-05, -2.2055581212043762e-05, -2.1189451217651367e-05, -2.0323321223258972e-05, -1.9457191228866577e-05, -1.8591061234474182e-05, -1.7724931240081787e-05, -1.6858801245689392e-05, -1.5992671251296997e-05, -1.5126541256904602e-05, -1.4260411262512207e-05, -1.3394281268119812e-05, -1.2528151273727417e-05, -1.1662021279335022e-05, -1.0795891284942627e-05, -9.929761290550232e-06, -9.063631296157837e-06, -8.197501301765442e-06, -7.331371307373047e-06, -6.465241312980652e-06, -5.599111318588257e-06, -4.732981324195862e-06, -3.866851329803467e-06, -3.0007213354110718e-06, -2.1345913410186768e-06, -1.2684613466262817e-06, -4.023313522338867e-07, 4.637986421585083e-07, 1.3299286365509033e-06, 2.1960586309432983e-06, 3.0621886253356934e-06, 3.928318619728088e-06, 4.794448614120483e-06, 5.660578608512878e-06, 6.5267086029052734e-06, 7.3928385972976685e-06, 8.258968591690063e-06, 9.125098586082458e-06, 9.991228580474854e-06, 1.0857358574867249e-05, 1.1723488569259644e-05, 1.2589618563652039e-05, 1.3455748558044434e-05, 1.4321878552436829e-05, 1.5188008546829224e-05, 1.605413854122162e-05, 1.6920268535614014e-05, 1.778639853000641e-05, 1.8652528524398804e-05, 1.95186585187912e-05, 2.0384788513183594e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 6.0, 5.0, 6.0, 6.0, 7.0, 7.0, 11.0, 20.0, 20.0, 23.0, 58.0, 84.0, 523.0, 93.0, 52.0, 27.0, 19.0, 14.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1696090698242188e-05, -2.1158717572689056e-05, -2.0621344447135925e-05, -2.0083971321582794e-05, -1.9546598196029663e-05, -1.9009225070476532e-05, -1.84718519449234e-05, -1.793447881937027e-05, -1.739710569381714e-05, -1.6859732568264008e-05, -1.6322359442710876e-05, -1.5784986317157745e-05, -1.5247613191604614e-05, -1.4710240066051483e-05, -1.4172866940498352e-05, -1.3635493814945221e-05, -1.309812068939209e-05, -1.2560747563838959e-05, -1.2023374438285828e-05, -1.1486001312732697e-05, -1.0948628187179565e-05, -1.0411255061626434e-05, -9.873881936073303e-06, -9.336508810520172e-06, -8.799135684967041e-06, -8.26176255941391e-06, -7.724389433860779e-06, -7.187016308307648e-06, -6.649643182754517e-06, -6.1122700572013855e-06, -5.574896931648254e-06, -5.037523806095123e-06, -4.500150680541992e-06, -3.962777554988861e-06, -3.42540442943573e-06, -2.888031303882599e-06, -2.3506581783294678e-06, -1.8132850527763367e-06, -1.2759119272232056e-06, -7.385388016700745e-07, -2.0116567611694336e-07, 3.3620744943618774e-07, 8.735805749893188e-07, 1.41095370054245e-06, 1.948326826095581e-06, 2.485699951648712e-06, 3.0230730772018433e-06, 3.5604462027549744e-06, 4.0978193283081055e-06, 4.6351924538612366e-06, 5.172565579414368e-06, 5.709938704967499e-06, 6.24731183052063e-06, 6.784684956073761e-06, 7.322058081626892e-06, 7.859431207180023e-06, 8.396804332733154e-06, 8.934177458286285e-06, 9.471550583839417e-06, 1.0008923709392548e-05, 1.0546296834945679e-05, 1.108366996049881e-05, 1.1621043086051941e-05, 1.2158416211605072e-05, 1.2695789337158203e-05]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 14.0, 83.0, 830.0, 83.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06314918398857117, -0.057644203305244446, -0.052139222621917725, -0.046634241938591, -0.04112926125526428, -0.03562428057193756, -0.03011929616332054, -0.02461431547999382, -0.0191093347966671, -0.013604354113340378, -0.008099372498691082, -0.002594390884041786, 0.002910589799284935, 0.008415570482611656, 0.013920553028583527, 0.019425533711910248, 0.02493051439523697, 0.03043549507856369, 0.03594047576189041, 0.04144545644521713, 0.046950437128543854, 0.052455417811870575, 0.057960402220487595, 0.06346538662910461, 0.06897036731243134, 0.07447534799575806, 0.07998032867908478, 0.0854853093624115, 0.09099029004573822, 0.09649527072906494, 0.10200025141239166, 0.10750523209571838, 0.1130102127790451, 0.11851519346237183, 0.12402017414569855, 0.12952515482902527, 0.135030135512352, 0.1405351161956787, 0.14604009687900543, 0.15154507756233215, 0.15705005824565887, 0.1625550389289856, 0.16806001961231232, 0.17356500029563904, 0.17906998097896576, 0.18457496166229248, 0.1900799423456192, 0.19558492302894592, 0.20108991861343384, 0.20659489929676056, 0.21209987998008728, 0.217604860663414, 0.22310984134674072, 0.22861482203006744, 0.23411980271339417, 0.2396247833967209, 0.2451297640800476, 0.2506347596645355, 0.25613972544670105, 0.26164472103118896, 0.2671496868133545, 0.2726546823978424, 0.27815964818000793, 0.28366464376449585, 0.2891696095466614]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 3.0, 8.0, 13.0, 12.0, 8.0, 26.0, 27.0, 15.0, 29.0, 29.0, 38.0, 47.0, 56.0, 59.0, 69.0, 65.0, 61.0, 62.0, 51.0, 49.0, 52.0, 33.0, 32.0, 26.0, 23.0, 24.0, 10.0, 15.0, 17.0, 7.0, 11.0, 4.0, 10.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10185462236404419, -0.09835190325975418, -0.09484918415546417, -0.09134646505117416, -0.08784374594688416, -0.08434103429317474, -0.08083831518888474, -0.07733559608459473, -0.07383287698030472, -0.07033015787601471, -0.0668274387717247, -0.06332471966743469, -0.05982200428843498, -0.056319285184144974, -0.052816569805145264, -0.049313850700855255, -0.04581113159656525, -0.04230841249227524, -0.03880569338798523, -0.03530297800898552, -0.03180025890469551, -0.028297539800405502, -0.024794822558760643, -0.021292105317115784, -0.017789386212825775, -0.014286668039858341, -0.010783949866890907, -0.007281231693923473, -0.0037785135209560394, -0.0002757944166660309, 0.0032269228249788284, 0.006729640066623688, 0.010232359170913696, 0.01373507734388113, 0.017237795516848564, 0.020740512758493423, 0.024243231862783432, 0.02774595096707344, 0.0312486682087183, 0.03475138545036316, 0.03825410455465317, 0.041756823658943176, 0.045259542763233185, 0.048762258142232895, 0.0522649772465229, 0.05576769635081291, 0.05927041172981262, 0.06277313083410263, 0.06627584993839264, 0.06977856904268265, 0.07328128814697266, 0.07678400725126266, 0.08028672635555267, 0.08378943800926208, 0.0872921571135521, 0.0907948762178421, 0.09429759532213211, 0.09780031442642212, 0.10130303353071213, 0.10480575263500214, 0.10830846428871155, 0.11181119084358215, 0.11531390249729156, 0.11881662160158157, 0.12231934070587158]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 7.0, 5.0, 1.0, 4.0, 2.0, 9.0, 9.0, 12.0, 10.0, 7.0, 15.0, 24.0, 18.0, 11.0, 15.0, 17.0, 19.0, 20.0, 37.0, 38.0, 51.0, 71.0, 100.0, 118.0, 228.0, 767.0, 4187432.0, 3638.0, 793.0, 286.0, 116.0, 67.0, 52.0, 71.0, 39.0, 20.0, 20.0, 18.0, 22.0, 12.0, 7.0, 5.0, 9.0, 6.0, 11.0, 8.0, 8.0, 11.0, 4.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 5.0], "bins": [-0.0014867782592773438, -0.001444116234779358, -0.001401454210281372, -0.0013587921857833862, -0.0013161301612854004, -0.0012734681367874146, -0.0012308061122894287, -0.0011881440877914429, -0.001145482063293457, -0.0011028200387954712, -0.0010601580142974854, -0.0010174959897994995, -0.0009748339653015137, -0.0009321719408035278, -0.000889509916305542, -0.0008468478918075562, -0.0008041858673095703, -0.0007615238428115845, -0.0007188618183135986, -0.0006761997938156128, -0.000633537769317627, -0.0005908757448196411, -0.0005482137203216553, -0.0005055516958236694, -0.0004628896713256836, -0.00042022764682769775, -0.0003775656223297119, -0.0003349035978317261, -0.00029224157333374023, -0.0002495795488357544, -0.00020691752433776855, -0.00016425549983978271, -0.00012159347534179688, -7.893145084381104e-05, -3.6269426345825195e-05, 6.3925981521606445e-06, 4.9054622650146484e-05, 9.171664714813232e-05, 0.00013437867164611816, 0.000177040696144104, 0.00021970272064208984, 0.0002623647451400757, 0.0003050267696380615, 0.00034768879413604736, 0.0003903508186340332, 0.00043301284313201904, 0.0004756748676300049, 0.0005183368921279907, 0.0005609989166259766, 0.0006036609411239624, 0.0006463229656219482, 0.0006889849901199341, 0.0007316470146179199, 0.0007743090391159058, 0.0008169710636138916, 0.0008596330881118774, 0.0009022951126098633, 0.0009449571371078491, 0.000987619161605835, 0.0010302811861038208, 0.0010729432106018066, 0.0011156052350997925, 0.0011582672595977783, 0.0012009292840957642, 0.00124359130859375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 4.0, 9.0, 16.0, 8.0, 9.0, 16.0, 45.0, 123.0, 269.0, 220.0, 118.0, 42.0, 12.0, 10.0, 11.0, 11.0, 8.0, 7.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 7.0, 5.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007162570953369141, -0.006909370422363281, -0.006656169891357422, -0.0064029693603515625, -0.006149768829345703, -0.005896568298339844, -0.005643367767333984, -0.005390167236328125, -0.005136966705322266, -0.004883766174316406, -0.004630565643310547, -0.0043773651123046875, -0.004124164581298828, -0.0038709640502929688, -0.0036177635192871094, -0.00336456298828125, -0.0031113624572753906, -0.0028581619262695312, -0.002604961395263672, -0.0023517608642578125, -0.002098560333251953, -0.0018453598022460938, -0.0015921592712402344, -0.001338958740234375, -0.0010857582092285156, -0.0008325576782226562, -0.0005793571472167969, -0.0003261566162109375, -7.295608520507812e-05, 0.00018024444580078125, 0.0004334449768066406, 0.0006866455078125, 0.0009398460388183594, 0.0011930465698242188, 0.0014462471008300781, 0.0016994476318359375, 0.0019526481628417969, 0.0022058486938476562, 0.0024590492248535156, 0.002712249755859375, 0.0029654502868652344, 0.0032186508178710938, 0.003471851348876953, 0.0037250518798828125, 0.003978252410888672, 0.004231452941894531, 0.004484653472900391, 0.00473785400390625, 0.004991054534912109, 0.005244255065917969, 0.005497455596923828, 0.0057506561279296875, 0.006003856658935547, 0.006257057189941406, 0.006510257720947266, 0.006763458251953125, 0.007016658782958984, 0.007269859313964844, 0.007523059844970703, 0.0077762603759765625, 0.008029460906982422, 0.008282661437988281, 0.00853586196899414, 0.0087890625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 8.0, 19.0, 37.0, 66.0, 91.0, 136.0, 367.0, 1787.0, 4189489.0, 1623.0, 336.0, 129.0, 82.0, 50.0, 35.0, 22.0, 9.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0015964508056640625, -0.0015613436698913574, -0.0015262365341186523, -0.0014911293983459473, -0.0014560222625732422, -0.0014209151268005371, -0.001385807991027832, -0.001350700855255127, -0.0013155937194824219, -0.0012804865837097168, -0.0012453794479370117, -0.0012102723121643066, -0.0011751651763916016, -0.0011400580406188965, -0.0011049509048461914, -0.0010698437690734863, -0.0010347366333007812, -0.0009996294975280762, -0.0009645223617553711, -0.000929415225982666, -0.0008943080902099609, -0.0008592009544372559, -0.0008240938186645508, -0.0007889866828918457, -0.0007538795471191406, -0.0007187724113464355, -0.0006836652755737305, -0.0006485581398010254, -0.0006134510040283203, -0.0005783438682556152, -0.0005432367324829102, -0.0005081295967102051, -0.0004730224609375, -0.0004379153251647949, -0.00040280818939208984, -0.00036770105361938477, -0.0003325939178466797, -0.0002974867820739746, -0.00026237964630126953, -0.00022727251052856445, -0.00019216537475585938, -0.0001570582389831543, -0.00012195110321044922, -8.684396743774414e-05, -5.173683166503906e-05, -1.6629695892333984e-05, 1.8477439880371094e-05, 5.358457565307617e-05, 8.869171142578125e-05, 0.00012379884719848633, 0.0001589059829711914, 0.00019401311874389648, 0.00022912025451660156, 0.00026422739028930664, 0.0002993345260620117, 0.0003344416618347168, 0.0003695487976074219, 0.00040465593338012695, 0.00043976306915283203, 0.0004748702049255371, 0.0005099773406982422, 0.0005450844764709473, 0.0005801916122436523, 0.0006152987480163574, 0.0006504058837890625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4048.0, 24.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020301342010498047, -0.00019025243818759918, -0.0001774914562702179, -0.0001647304743528366, -0.00015196949243545532, -0.00013920851051807404, -0.00012644752860069275, -0.00011368654668331146, -0.00010092556476593018, -8.816458284854889e-05, -7.54036009311676e-05, -6.264261901378632e-05, -4.988163709640503e-05, -3.712065517902374e-05, -2.4359673261642456e-05, -1.159869134426117e-05, 1.1622905731201172e-06, 1.3923272490501404e-05, 2.668425440788269e-05, 3.944523632526398e-05, 5.2206218242645264e-05, 6.496720016002655e-05, 7.772818207740784e-05, 9.048916399478912e-05, 0.00010325014591217041, 0.0001160111278295517, 0.00012877210974693298, 0.00014153309166431427, 0.00015429407358169556, 0.00016705505549907684, 0.00017981603741645813, 0.00019257701933383942, 0.0002053380012512207, 0.000218098983168602, 0.00023085996508598328, 0.00024362094700336456, 0.00025638192892074585, 0.00026914291083812714, 0.0002819038927555084, 0.0002946648746728897, 0.000307425856590271, 0.0003201868385076523, 0.00033294782042503357, 0.00034570880234241486, 0.00035846978425979614, 0.00037123076617717743, 0.0003839917480945587, 0.00039675273001194, 0.0004095137119293213, 0.0004222746938467026, 0.00043503567576408386, 0.00044779665768146515, 0.00046055763959884644, 0.0004733186215162277, 0.000486079603433609, 0.0004988405853509903, 0.0005116015672683716, 0.0005243625491857529, 0.0005371235311031342, 0.0005498845130205154, 0.0005626454949378967, 0.000575406476855278, 0.0005881674587726593, 0.0006009284406900406, 0.0006136894226074219]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 9.0, 244.0, 733.0, 22.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001141307526268065, -0.0011142055736854672, -0.0010871035046875477, -0.00106000155210495, -0.0010328995995223522, -0.0010057975305244327, -0.000978695577941835, -0.0009515935671515763, -0.0009244915563613176, -0.000897389545571059, -0.0008702875347808003, -0.0008431855821982026, -0.000816083571407944, -0.0007889815606176853, -0.0007618796080350876, -0.0007347775972448289, -0.0007076755864545703, -0.0006805735756643116, -0.000653471564874053, -0.0006263696122914553, -0.0005992676015011966, -0.000572165590710938, -0.0005450636381283402, -0.0005179616273380816, -0.000490859616547823, -0.0004637576057575643, -0.0004366556240711361, -0.00040955364238470793, -0.0003824516315944493, -0.00035534962080419064, -0.00032824763911776245, -0.00030114565743133426, -0.0002740435884334147, -0.00024694157764315605, -0.00021983959595672786, -0.00019273759971838444, -0.00016563560348004103, -0.0001385336072416976, -0.00011143161100335419, -8.432961476501077e-05, -5.7227618526667356e-05, -3.012562228832394e-05, -3.023626049980521e-06, 2.4078370188362896e-05, 5.1180366426706314e-05, 7.828236266504973e-05, 0.00010538435890339315, 0.00013248635514173657, 0.00015958835138007998, 0.0001866903476184234, 0.00021379234385676682, 0.00024089434009511024, 0.00026799633633345366, 0.0002950983471237123, 0.0003222003288101405, 0.0003493023104965687, 0.0003764043212868273, 0.00040350633207708597, 0.00043060831376351416, 0.00045771029544994235, 0.000484812306240201, 0.0005119143170304596, 0.0005390163278207183, 0.000566118280403316, 0.0005932202911935747]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 5.0, 10.0, 27.0, 46.0, 66.0, 114.0, 153.0, 161.0, 126.0, 117.0, 77.0, 47.0, 26.0, 13.0, 7.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0013595819473266602, -0.0013292189687490463, -0.0012988559901714325, -0.0012684930115938187, -0.0012381300330162048, -0.001207767054438591, -0.0011774040758609772, -0.0011470410972833633, -0.0011166781187057495, -0.0010863151401281357, -0.0010559521615505219, -0.001025589182972908, -0.0009952262043952942, -0.0009648632258176804, -0.0009345002472400665, -0.0009041372686624527, -0.0008737742900848389, -0.000843411311507225, -0.0008130483329296112, -0.0007826853543519974, -0.0007523223757743835, -0.0007219593971967697, -0.0006915964186191559, -0.000661233440041542, -0.0006308704614639282, -0.0006005074828863144, -0.0005701445043087006, -0.0005397815257310867, -0.0005094185471534729, -0.00047905556857585907, -0.00044869258999824524, -0.0004183296114206314, -0.0003879666328430176, -0.00035760365426540375, -0.0003272406756877899, -0.0002968776971101761, -0.00026651471853256226, -0.00023615173995494843, -0.0002057887613773346, -0.00017542578279972076, -0.00014506280422210693, -0.0001146998256444931, -8.433684706687927e-05, -5.397386848926544e-05, -2.361088991165161e-05, 6.752088665962219e-06, 3.711506724357605e-05, 6.747804582118988e-05, 9.784102439880371e-05, 0.00012820400297641754, 0.00015856698155403137, 0.0001889299601316452, 0.00021929293870925903, 0.00024965591728687286, 0.0002800188958644867, 0.0003103818744421005, 0.00034074485301971436, 0.0003711078315973282, 0.000401470810174942, 0.00043183378875255585, 0.0004621967673301697, 0.0004925597459077835, 0.0005229227244853973, 0.0005532857030630112, 0.000583648681640625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 10.0, 10.0, 13.0, 7.0, 10.0, 21.0, 23.0, 23.0, 47.0, 57.0, 57.0, 109.0, 164.0, 309.0, 458.0, 874.0, 1733.0, 3964.0, 11264.0, 80638.0, 914859.0, 22315.0, 6302.0, 2517.0, 1164.0, 628.0, 319.0, 184.0, 135.0, 80.0, 51.0, 38.0, 34.0, 19.0, 24.0, 27.0, 11.0, 9.0, 9.0, 8.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.01837158203125, -0.01774311065673828, -0.017114639282226562, -0.016486167907714844, -0.015857696533203125, -0.015229225158691406, -0.014600753784179688, -0.013972282409667969, -0.01334381103515625, -0.012715339660644531, -0.012086868286132812, -0.011458396911621094, -0.010829925537109375, -0.010201454162597656, -0.009572982788085938, -0.008944511413574219, -0.0083160400390625, -0.007687568664550781, -0.0070590972900390625, -0.006430625915527344, -0.005802154541015625, -0.005173683166503906, -0.0045452117919921875, -0.003916740417480469, -0.00328826904296875, -0.0026597976684570312, -0.0020313262939453125, -0.0014028549194335938, -0.000774383544921875, -0.00014591217041015625, 0.0004825592041015625, 0.0011110305786132812, 0.001739501953125, 0.0023679733276367188, 0.0029964447021484375, 0.0036249160766601562, 0.004253387451171875, 0.004881858825683594, 0.0055103302001953125, 0.006138801574707031, 0.00676727294921875, 0.007395744323730469, 0.008024215698242188, 0.008652687072753906, 0.009281158447265625, 0.009909629821777344, 0.010538101196289062, 0.011166572570800781, 0.0117950439453125, 0.012423515319824219, 0.013051986694335938, 0.013680458068847656, 0.014308929443359375, 0.014937400817871094, 0.015565872192382812, 0.01619434356689453, 0.01682281494140625, 0.01745128631591797, 0.018079757690429688, 0.018708229064941406, 0.019336700439453125, 0.019965171813964844, 0.020593643188476562, 0.02122211456298828, 0.0218505859375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 4.0, 9.0, 16.0, 8.0, 9.0, 16.0, 45.0, 123.0, 269.0, 220.0, 118.0, 42.0, 11.0, 11.0, 11.0, 11.0, 8.0, 7.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 7.0, 5.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007162570953369141, -0.006909370422363281, -0.006656169891357422, -0.0064029693603515625, -0.006149768829345703, -0.005896568298339844, -0.005643367767333984, -0.005390167236328125, -0.005136966705322266, -0.004883766174316406, -0.004630565643310547, -0.0043773651123046875, -0.004124164581298828, -0.0038709640502929688, -0.0036177635192871094, -0.00336456298828125, -0.0031113624572753906, -0.0028581619262695312, -0.002604961395263672, -0.0023517608642578125, -0.002098560333251953, -0.0018453598022460938, -0.0015921592712402344, -0.001338958740234375, -0.0010857582092285156, -0.0008325576782226562, -0.0005793571472167969, -0.0003261566162109375, -7.295608520507812e-05, 0.00018024444580078125, 0.0004334449768066406, 0.0006866455078125, 0.0009398460388183594, 0.0011930465698242188, 0.0014462471008300781, 0.0016994476318359375, 0.0019526481628417969, 0.0022058486938476562, 0.0024590492248535156, 0.002712249755859375, 0.0029654502868652344, 0.0032186508178710938, 0.003471851348876953, 0.0037250518798828125, 0.003978252410888672, 0.004231452941894531, 0.004484653472900391, 0.00473785400390625, 0.004991054534912109, 0.005244255065917969, 0.005497455596923828, 0.0057506561279296875, 0.006003856658935547, 0.006257057189941406, 0.006510257720947266, 0.006763458251953125, 0.007016658782958984, 0.007269859313964844, 0.007523059844970703, 0.0077762603759765625, 0.008029460906982422, 0.008282661437988281, 0.00853586196899414, 0.0087890625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 4.0, 1.0, 4.0, 6.0, 5.0, 10.0, 17.0, 18.0, 9.0, 19.0, 24.0, 27.0, 21.0, 44.0, 38.0, 69.0, 140.0, 282.0, 709.0, 2291.0, 597852.0, 443244.0, 2288.0, 678.0, 281.0, 129.0, 86.0, 53.0, 33.0, 31.0, 27.0, 22.0, 14.0, 14.0, 15.0, 9.0, 5.0, 8.0, 4.0, 5.0, 9.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030914306640625, -0.029848098754882812, -0.028781890869140625, -0.027715682983398438, -0.02664947509765625, -0.025583267211914062, -0.024517059326171875, -0.023450851440429688, -0.0223846435546875, -0.021318435668945312, -0.020252227783203125, -0.019186019897460938, -0.01811981201171875, -0.017053604125976562, -0.015987396240234375, -0.014921188354492188, -0.01385498046875, -0.012788772583007812, -0.011722564697265625, -0.010656356811523438, -0.00959014892578125, -0.008523941040039062, -0.007457733154296875, -0.0063915252685546875, -0.0053253173828125, -0.0042591094970703125, -0.003192901611328125, -0.0021266937255859375, -0.00106048583984375, 5.7220458984375e-06, 0.001071929931640625, 0.0021381378173828125, 0.003204345703125, 0.0042705535888671875, 0.005336761474609375, 0.0064029693603515625, 0.00746917724609375, 0.008535385131835938, 0.009601593017578125, 0.010667800903320312, 0.0117340087890625, 0.012800216674804688, 0.013866424560546875, 0.014932632446289062, 0.01599884033203125, 0.017065048217773438, 0.018131256103515625, 0.019197463989257812, 0.020263671875, 0.021329879760742188, 0.022396087646484375, 0.023462295532226562, 0.02452850341796875, 0.025594711303710938, 0.026660919189453125, 0.027727127075195312, 0.0287933349609375, 0.029859542846679688, 0.030925750732421875, 0.03199195861816406, 0.03305816650390625, 0.03412437438964844, 0.035190582275390625, 0.03625679016113281, 0.037322998046875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 4.0, 2.0, 3.0, 6.0, 5.0, 10.0, 17.0, 18.0, 10.0, 18.0, 24.0, 28.0, 19.0, 39.0, 28.0, 31.0, 35.0, 42.0, 52.0, 51.0, 55.0, 59.0, 43.0, 39.0, 39.0, 40.0, 44.0, 40.0, 31.0, 30.0, 25.0, 23.0, 15.0, 13.0, 14.0, 10.0, 5.0, 8.0, 4.0, 5.0, 9.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0173187255859375, -0.016721248626708984, -0.01612377166748047, -0.015526294708251953, -0.014928817749023438, -0.014331340789794922, -0.013733863830566406, -0.01313638687133789, -0.012538909912109375, -0.01194143295288086, -0.011343955993652344, -0.010746479034423828, -0.010149002075195312, -0.009551525115966797, -0.008954048156738281, -0.008356571197509766, -0.00775909423828125, -0.007161617279052734, -0.006564140319824219, -0.005966663360595703, -0.0053691864013671875, -0.004771709442138672, -0.004174232482910156, -0.0035767555236816406, -0.002979278564453125, -0.0023818016052246094, -0.0017843246459960938, -0.0011868476867675781, -0.0005893707275390625, 8.106231689453125e-06, 0.0006055831909179688, 0.0012030601501464844, 0.001800537109375, 0.0023980140686035156, 0.0029954910278320312, 0.003592967987060547, 0.0041904449462890625, 0.004787921905517578, 0.005385398864746094, 0.005982875823974609, 0.006580352783203125, 0.007177829742431641, 0.007775306701660156, 0.008372783660888672, 0.008970260620117188, 0.009567737579345703, 0.010165214538574219, 0.010762691497802734, 0.01136016845703125, 0.011957645416259766, 0.012555122375488281, 0.013152599334716797, 0.013750076293945312, 0.014347553253173828, 0.014945030212402344, 0.01554250717163086, 0.016139984130859375, 0.01673746109008789, 0.017334938049316406, 0.017932415008544922, 0.018529891967773438, 0.019127368927001953, 0.01972484588623047, 0.020322322845458984, 0.0209197998046875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 7.0, 5.0, 11.0, 17.0, 14.0, 20.0, 46.0, 61.0, 111.0, 227.0, 531.0, 2243.0, 34725.0, 998807.0, 9618.0, 1303.0, 401.0, 156.0, 87.0, 54.0, 28.0, 22.0, 12.0, 14.0, 8.0, 5.0, 5.0, 2.0, 7.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1801719665527344e-05, -1.1458061635494232e-05, -1.111440360546112e-05, -1.0770745575428009e-05, -1.0427087545394897e-05, -1.0083429515361786e-05, -9.739771485328674e-06, -9.396113455295563e-06, -9.052455425262451e-06, -8.70879739522934e-06, -8.365139365196228e-06, -8.021481335163116e-06, -7.677823305130005e-06, -7.334165275096893e-06, -6.990507245063782e-06, -6.64684921503067e-06, -6.303191184997559e-06, -5.959533154964447e-06, -5.6158751249313354e-06, -5.272217094898224e-06, -4.928559064865112e-06, -4.584901034832001e-06, -4.241243004798889e-06, -3.897584974765778e-06, -3.553926944732666e-06, -3.2102689146995544e-06, -2.866610884666443e-06, -2.5229528546333313e-06, -2.1792948246002197e-06, -1.8356367945671082e-06, -1.4919787645339966e-06, -1.148320734500885e-06, -8.046627044677734e-07, -4.6100467443466187e-07, -1.1734664440155029e-07, 2.2631138563156128e-07, 5.699694156646729e-07, 9.136274456977844e-07, 1.257285475730896e-06, 1.6009435057640076e-06, 1.944601535797119e-06, 2.2882595658302307e-06, 2.6319175958633423e-06, 2.975575625896454e-06, 3.3192336559295654e-06, 3.662891685962677e-06, 4.0065497159957886e-06, 4.3502077460289e-06, 4.693865776062012e-06, 5.037523806095123e-06, 5.381181836128235e-06, 5.7248398661613464e-06, 6.068497896194458e-06, 6.41215592622757e-06, 6.755813956260681e-06, 7.099471986293793e-06, 7.443130016326904e-06, 7.786788046360016e-06, 8.130446076393127e-06, 8.474104106426239e-06, 8.81776213645935e-06, 9.161420166492462e-06, 9.505078196525574e-06, 9.848736226558685e-06, 1.0192394256591797e-05]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 5.0, 10.0, 10.0, 19.0, 19.0, 29.0, 38.0, 61.0, 53.0, 107.0, 91.0, 141.0, 112.0, 69.0, 56.0, 39.0, 28.0, 31.0, 16.0, 18.0, 7.0, 11.0, 4.0, 4.0, 4.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.318092346191406e-06, -6.1336904764175415e-06, -5.949288606643677e-06, -5.764886736869812e-06, -5.580484867095947e-06, -5.3960829973220825e-06, -5.211681127548218e-06, -5.027279257774353e-06, -4.842877388000488e-06, -4.6584755182266235e-06, -4.474073648452759e-06, -4.289671778678894e-06, -4.105269908905029e-06, -3.9208680391311646e-06, -3.7364661693573e-06, -3.552064299583435e-06, -3.3676624298095703e-06, -3.1832605600357056e-06, -2.998858690261841e-06, -2.814456820487976e-06, -2.6300549507141113e-06, -2.4456530809402466e-06, -2.261251211166382e-06, -2.076849341392517e-06, -1.8924474716186523e-06, -1.7080456018447876e-06, -1.5236437320709229e-06, -1.339241862297058e-06, -1.1548399925231934e-06, -9.704381227493286e-07, -7.860362529754639e-07, -6.016343832015991e-07, -4.172325134277344e-07, -2.3283064365386963e-07, -4.842877388000488e-08, 1.3597309589385986e-07, 3.203749656677246e-07, 5.047768354415894e-07, 6.891787052154541e-07, 8.735805749893188e-07, 1.0579824447631836e-06, 1.2423843145370483e-06, 1.426786184310913e-06, 1.6111880540847778e-06, 1.7955899238586426e-06, 1.9799917936325073e-06, 2.164393663406372e-06, 2.348795533180237e-06, 2.5331974029541016e-06, 2.7175992727279663e-06, 2.902001142501831e-06, 3.086403012275696e-06, 3.2708048820495605e-06, 3.4552067518234253e-06, 3.63960862159729e-06, 3.824010491371155e-06, 4.0084123611450195e-06, 4.192814230918884e-06, 4.377216100692749e-06, 4.561617970466614e-06, 4.7460198402404785e-06, 4.930421710014343e-06, 5.114823579788208e-06, 5.299225449562073e-06, 5.4836273193359375e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 5.0, 19.0, 26.0, 35.0, 80.0, 186.0, 880.0, 1032242.0, 14260.0, 490.0, 125.0, 72.0, 31.0, 33.0, 18.0, 12.0, 5.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-3.2961368560791016e-05, -3.206636756658554e-05, -3.1171366572380066e-05, -3.027636557817459e-05, -2.9381364583969116e-05, -2.848636358976364e-05, -2.7591362595558167e-05, -2.669636160135269e-05, -2.5801360607147217e-05, -2.4906359612941742e-05, -2.4011358618736267e-05, -2.3116357624530792e-05, -2.2221356630325317e-05, -2.1326355636119843e-05, -2.0431354641914368e-05, -1.9536353647708893e-05, -1.8641352653503418e-05, -1.7746351659297943e-05, -1.6851350665092468e-05, -1.5956349670886993e-05, -1.5061348676681519e-05, -1.4166347682476044e-05, -1.3271346688270569e-05, -1.2376345694065094e-05, -1.1481344699859619e-05, -1.0586343705654144e-05, -9.69134271144867e-06, -8.796341717243195e-06, -7.90134072303772e-06, -7.006339728832245e-06, -6.11133873462677e-06, -5.216337740421295e-06, -4.32133674621582e-06, -3.4263357520103455e-06, -2.5313347578048706e-06, -1.6363337635993958e-06, -7.413327693939209e-07, 1.5366822481155396e-07, 1.0486692190170288e-06, 1.9436702132225037e-06, 2.8386712074279785e-06, 3.7336722016334534e-06, 4.628673195838928e-06, 5.523674190044403e-06, 6.418675184249878e-06, 7.313676178455353e-06, 8.208677172660828e-06, 9.103678166866302e-06, 9.998679161071777e-06, 1.0893680155277252e-05, 1.1788681149482727e-05, 1.2683682143688202e-05, 1.3578683137893677e-05, 1.4473684132099152e-05, 1.5368685126304626e-05, 1.62636861205101e-05, 1.7158687114715576e-05, 1.805368810892105e-05, 1.8948689103126526e-05, 1.9843690097332e-05, 2.0738691091537476e-05, 2.163369208574295e-05, 2.2528693079948425e-05, 2.34236940741539e-05, 2.4318695068359375e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 3.0, 12.0, 14.0, 17.0, 31.0, 52.0, 67.0, 507.0, 72.0, 66.0, 32.0, 31.0, 19.0, 22.0, 11.0, 10.0, 5.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.8537044525146484e-05, -1.8034130334854126e-05, -1.7531216144561768e-05, -1.702830195426941e-05, -1.652538776397705e-05, -1.6022473573684692e-05, -1.5519559383392334e-05, -1.5016645193099976e-05, -1.4513731002807617e-05, -1.4010816812515259e-05, -1.35079026222229e-05, -1.3004988431930542e-05, -1.2502074241638184e-05, -1.1999160051345825e-05, -1.1496245861053467e-05, -1.0993331670761108e-05, -1.049041748046875e-05, -9.987503290176392e-06, -9.484589099884033e-06, -8.981674909591675e-06, -8.478760719299316e-06, -7.975846529006958e-06, -7.4729323387146e-06, -6.970018148422241e-06, -6.467103958129883e-06, -5.964189767837524e-06, -5.461275577545166e-06, -4.958361387252808e-06, -4.455447196960449e-06, -3.952533006668091e-06, -3.4496188163757324e-06, -2.946704626083374e-06, -2.4437904357910156e-06, -1.9408762454986572e-06, -1.4379620552062988e-06, -9.350478649139404e-07, -4.3213367462158203e-07, 7.078051567077637e-08, 5.736947059631348e-07, 1.0766088962554932e-06, 1.5795230865478516e-06, 2.08243727684021e-06, 2.5853514671325684e-06, 3.0882656574249268e-06, 3.591179847717285e-06, 4.0940940380096436e-06, 4.597008228302002e-06, 5.09992241859436e-06, 5.602836608886719e-06, 6.105750799179077e-06, 6.6086649894714355e-06, 7.111579179763794e-06, 7.614493370056152e-06, 8.11740756034851e-06, 8.620321750640869e-06, 9.123235940933228e-06, 9.626150131225586e-06, 1.0129064321517944e-05, 1.0631978511810303e-05, 1.1134892702102661e-05, 1.163780689239502e-05, 1.2140721082687378e-05, 1.2643635272979736e-05, 1.3146549463272095e-05, 1.3649463653564453e-05]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 9.0, 28.0, 133.0, 690.0, 120.0, 24.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10095751285552979, -0.09785737842321396, -0.09475723654031754, -0.09165710210800171, -0.08855696022510529, -0.08545682579278946, -0.08235669136047363, -0.07925654947757721, -0.07615640759468079, -0.07305627316236496, -0.06995613127946854, -0.06685599684715271, -0.06375585496425629, -0.06065572053194046, -0.057555582374334335, -0.05445544421672821, -0.051355309784412384, -0.04825517162680626, -0.045155033469200134, -0.04205489903688431, -0.038954757153987885, -0.03585462272167206, -0.03275448456406593, -0.02965434640645981, -0.026554208248853683, -0.02345407009124756, -0.020353931933641434, -0.017253795638680458, -0.014153657481074333, -0.011053519323468208, -0.007953383028507233, -0.004853244870901108, -0.001753106713294983, 0.0013470309786498547, 0.004447168670594692, 0.0075473058968782425, 0.010647444054484367, 0.013747582212090492, 0.016847718507051468, 0.019947856664657593, 0.023047994822263718, 0.026148132979869843, 0.029248271137475967, 0.03234840929508209, 0.03544854372739792, 0.03854868561029434, 0.04164882004261017, 0.04474895820021629, 0.04784909635782242, 0.05094923451542854, 0.05404937267303467, 0.057149507105350494, 0.06024964898824692, 0.06334978342056274, 0.06644992530345917, 0.069550059735775, 0.07265019416809082, 0.07575032860040665, 0.07885047048330307, 0.0819506049156189, 0.08505074679851532, 0.08815088123083115, 0.09125101566314697, 0.0943511575460434, 0.09745129942893982]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 3.0, 5.0, 11.0, 10.0, 10.0, 7.0, 21.0, 21.0, 21.0, 23.0, 24.0, 36.0, 34.0, 44.0, 47.0, 50.0, 47.0, 46.0, 41.0, 58.0, 48.0, 45.0, 33.0, 54.0, 37.0, 42.0, 30.0, 21.0, 17.0, 14.0, 17.0, 18.0, 12.0, 13.0, 7.0, 2.0, 7.0, 1.0, 2.0, 6.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.08758425712585449, -0.084969162940979, -0.08235406875610352, -0.07973897457122803, -0.07712388038635254, -0.07450878620147705, -0.07189369201660156, -0.06927859783172607, -0.06666350364685059, -0.0640484094619751, -0.06143331527709961, -0.05881822109222412, -0.05620312690734863, -0.053588032722473145, -0.050972938537597656, -0.04835784435272217, -0.04574275016784668, -0.04312765598297119, -0.0405125617980957, -0.037897467613220215, -0.03528237342834473, -0.03266727924346924, -0.03005218505859375, -0.02743709087371826, -0.024821996688842773, -0.022206902503967285, -0.019591808319091797, -0.01697671413421631, -0.01436161994934082, -0.011746525764465332, -0.009131431579589844, -0.0065163373947143555, -0.003901243209838867, -0.001286149024963379, 0.0013289451599121094, 0.003944039344787598, 0.006559133529663086, 0.009174227714538574, 0.011789321899414062, 0.01440441608428955, 0.01701951026916504, 0.019634604454040527, 0.022249698638916016, 0.024864792823791504, 0.027479887008666992, 0.03009498119354248, 0.03271007537841797, 0.03532516956329346, 0.037940263748168945, 0.040555357933044434, 0.04317045211791992, 0.04578554630279541, 0.0484006404876709, 0.05101573467254639, 0.053630828857421875, 0.05624592304229736, 0.05886101722717285, 0.06147611141204834, 0.06409120559692383, 0.06670629978179932, 0.0693213939666748, 0.07193648815155029, 0.07455158233642578, 0.07716667652130127, 0.07978177070617676]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 5.0, 3.0, 7.0, 6.0, 11.0, 11.0, 8.0, 14.0, 15.0, 18.0, 19.0, 27.0, 44.0, 63.0, 79.0, 137.0, 169.0, 383.0, 1254.0, 15528.0, 4172339.0, 2448.0, 680.0, 306.0, 180.0, 124.0, 77.0, 67.0, 37.0, 33.0, 37.0, 18.0, 29.0, 18.0, 14.0, 15.0, 12.0, 11.0, 3.0, 10.0, 6.0, 7.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0797119140625, -0.07698822021484375, -0.0742645263671875, -0.07154083251953125, -0.068817138671875, -0.06609344482421875, -0.0633697509765625, -0.06064605712890625, -0.05792236328125, -0.05519866943359375, -0.0524749755859375, -0.04975128173828125, -0.047027587890625, -0.04430389404296875, -0.0415802001953125, -0.03885650634765625, -0.0361328125, -0.03340911865234375, -0.0306854248046875, -0.02796173095703125, -0.025238037109375, -0.02251434326171875, -0.0197906494140625, -0.01706695556640625, -0.01434326171875, -0.01161956787109375, -0.0088958740234375, -0.00617218017578125, -0.003448486328125, -0.00072479248046875, 0.0019989013671875, 0.00472259521484375, 0.0074462890625, 0.01016998291015625, 0.0128936767578125, 0.01561737060546875, 0.018341064453125, 0.02106475830078125, 0.0237884521484375, 0.02651214599609375, 0.02923583984375, 0.03195953369140625, 0.0346832275390625, 0.03740692138671875, 0.040130615234375, 0.04285430908203125, 0.0455780029296875, 0.04830169677734375, 0.051025390625, 0.05374908447265625, 0.0564727783203125, 0.05919647216796875, 0.061920166015625, 0.06464385986328125, 0.0673675537109375, 0.07009124755859375, 0.07281494140625, 0.07553863525390625, 0.0782623291015625, 0.08098602294921875, 0.083709716796875, 0.08643341064453125, 0.0891571044921875, 0.09188079833984375, 0.0946044921875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 9.0, 15.0, 9.0, 9.0, 13.0, 45.0, 120.0, 257.0, 233.0, 122.0, 43.0, 11.0, 11.0, 11.0, 10.0, 9.0, 6.0, 4.0, 5.0, 1.0, 5.0, 3.0, 3.0, 5.0, 5.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007162809371948242, -0.006909847259521484, -0.0066568851470947266, -0.006403923034667969, -0.006150960922241211, -0.005897998809814453, -0.005645036697387695, -0.0053920745849609375, -0.00513911247253418, -0.004886150360107422, -0.004633188247680664, -0.004380226135253906, -0.0041272640228271484, -0.0038743019104003906, -0.003621339797973633, -0.003368377685546875, -0.003115415573120117, -0.0028624534606933594, -0.0026094913482666016, -0.0023565292358398438, -0.002103567123413086, -0.0018506050109863281, -0.0015976428985595703, -0.0013446807861328125, -0.0010917186737060547, -0.0008387565612792969, -0.0005857944488525391, -0.00033283233642578125, -7.987022399902344e-05, 0.00017309188842773438, 0.0004260540008544922, 0.00067901611328125, 0.0009319782257080078, 0.0011849403381347656, 0.0014379024505615234, 0.0016908645629882812, 0.001943826675415039, 0.002196788787841797, 0.0024497509002685547, 0.0027027130126953125, 0.0029556751251220703, 0.003208637237548828, 0.003461599349975586, 0.0037145614624023438, 0.0039675235748291016, 0.004220485687255859, 0.004473447799682617, 0.004726409912109375, 0.004979372024536133, 0.005232334136962891, 0.0054852962493896484, 0.005738258361816406, 0.005991220474243164, 0.006244182586669922, 0.00649714469909668, 0.0067501068115234375, 0.007003068923950195, 0.007256031036376953, 0.007508993148803711, 0.007761955261230469, 0.008014917373657227, 0.008267879486083984, 0.008520841598510742, 0.0087738037109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 2.0, 8.0, 4.0, 4.0, 11.0, 13.0, 17.0, 25.0, 22.0, 29.0, 51.0, 51.0, 58.0, 116.0, 362.0, 2306.0, 30882.0, 4146628.0, 11877.0, 1163.0, 215.0, 121.0, 62.0, 62.0, 38.0, 24.0, 13.0, 23.0, 17.0, 12.0, 6.0, 5.0, 11.0, 5.0, 7.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.0251617431640625, -0.024384021759033203, -0.023606300354003906, -0.02282857894897461, -0.022050857543945312, -0.021273136138916016, -0.02049541473388672, -0.019717693328857422, -0.018939971923828125, -0.018162250518798828, -0.01738452911376953, -0.016606807708740234, -0.015829086303710938, -0.01505136489868164, -0.014273643493652344, -0.013495922088623047, -0.01271820068359375, -0.011940479278564453, -0.011162757873535156, -0.01038503646850586, -0.009607315063476562, -0.008829593658447266, -0.008051872253417969, -0.007274150848388672, -0.006496429443359375, -0.005718708038330078, -0.004940986633300781, -0.004163265228271484, -0.0033855438232421875, -0.0026078224182128906, -0.0018301010131835938, -0.0010523796081542969, -0.000274658203125, 0.0005030632019042969, 0.0012807846069335938, 0.0020585060119628906, 0.0028362274169921875, 0.0036139488220214844, 0.004391670227050781, 0.005169391632080078, 0.005947113037109375, 0.006724834442138672, 0.007502555847167969, 0.008280277252197266, 0.009057998657226562, 0.00983572006225586, 0.010613441467285156, 0.011391162872314453, 0.01216888427734375, 0.012946605682373047, 0.013724327087402344, 0.01450204849243164, 0.015279769897460938, 0.016057491302490234, 0.01683521270751953, 0.017612934112548828, 0.018390655517578125, 0.019168376922607422, 0.01994609832763672, 0.020723819732666016, 0.021501541137695312, 0.02227926254272461, 0.023056983947753906, 0.023834705352783203, 0.0246124267578125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 4.0, 12.0, 12.0, 13.0, 14.0, 26.0, 55.0, 145.0, 600.0, 2208.0, 639.0, 189.0, 56.0, 12.0, 15.0, 7.0, 9.0, 7.0, 2.0, 2.0, 8.0, 4.0, 5.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01253509521484375, -0.012137889862060547, -0.011740684509277344, -0.01134347915649414, -0.010946273803710938, -0.010549068450927734, -0.010151863098144531, -0.009754657745361328, -0.009357452392578125, -0.008960247039794922, -0.008563041687011719, -0.008165836334228516, -0.0077686309814453125, -0.007371425628662109, -0.006974220275878906, -0.006577014923095703, -0.0061798095703125, -0.005782604217529297, -0.005385398864746094, -0.004988193511962891, -0.0045909881591796875, -0.004193782806396484, -0.0037965774536132812, -0.003399372100830078, -0.003002166748046875, -0.002604961395263672, -0.0022077560424804688, -0.0018105506896972656, -0.0014133453369140625, -0.0010161399841308594, -0.0006189346313476562, -0.00022172927856445312, 0.00017547607421875, 0.0005726814270019531, 0.0009698867797851562, 0.0013670921325683594, 0.0017642974853515625, 0.0021615028381347656, 0.0025587081909179688, 0.002955913543701172, 0.003353118896484375, 0.003750324249267578, 0.004147529602050781, 0.004544734954833984, 0.0049419403076171875, 0.005339145660400391, 0.005736351013183594, 0.006133556365966797, 0.00653076171875, 0.006927967071533203, 0.007325172424316406, 0.007722377777099609, 0.008119583129882812, 0.008516788482666016, 0.008913993835449219, 0.009311199188232422, 0.009708404541015625, 0.010105609893798828, 0.010502815246582031, 0.010900020599365234, 0.011297225952148438, 0.01169443130493164, 0.012091636657714844, 0.012488842010498047, 0.01288604736328125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 10.0, 22.0, 104.0, 586.0, 211.0, 41.0, 17.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014731462113559246, -0.013573849573731422, -0.012416237965226173, -0.01125862542539835, -0.010101012885570526, -0.008943401277065277, -0.0077857887372374535, -0.0066281771287322044, -0.005470564588904381, -0.0043129525147378445, -0.0031553402077406645, -0.0019977279007434845, -0.0008401158265769482, 0.00031749624758958817, 0.0014751087874174118, 0.002632720395922661, 0.0037903329357504845, 0.004947945009917021, 0.006105557084083557, 0.007263169623911381, 0.008420782163739204, 0.009578393772244453, 0.010736006312072277, 0.011893617920577526, 0.01305123046040535, 0.014208843000233173, 0.015366454608738422, 0.016524067148566246, 0.017681678757071495, 0.018839292228221893, 0.019996903836727142, 0.02115451544523239, 0.02231213077902794, 0.023469742387533188, 0.024627355858683586, 0.025784967467188835, 0.026942579075694084, 0.028100192546844482, 0.02925780415534973, 0.03041541576385498, 0.03157302737236023, 0.03273063898086548, 0.03388825058937073, 0.03504586219787598, 0.036203477531671524, 0.03736108914017677, 0.03851870074868202, 0.03967631235718727, 0.04083392769098282, 0.04199153929948807, 0.04314915090799332, 0.044306762516498566, 0.04546437785029411, 0.04662198945879936, 0.04777960106730461, 0.04893721267580986, 0.05009482428431511, 0.05125243589282036, 0.05241004750132561, 0.053567662835121155, 0.054725274443626404, 0.05588288605213165, 0.0570404976606369, 0.05819810926914215, 0.0593557208776474]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 3.0, 3.0, 5.0, 7.0, 9.0, 12.0, 20.0, 17.0, 28.0, 24.0, 16.0, 28.0, 28.0, 58.0, 43.0, 50.0, 42.0, 28.0, 45.0, 47.0, 55.0, 53.0, 45.0, 40.0, 53.0, 34.0, 26.0, 26.0, 24.0, 30.0, 18.0, 19.0, 15.0, 14.0, 9.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.03885149955749512, -0.0377403162419796, -0.03662913292646408, -0.03551795333623886, -0.03440677002072334, -0.033295586705207825, -0.032184407114982605, -0.031073223799467087, -0.02996204048395157, -0.02885085716843605, -0.02773967571556568, -0.026628494262695312, -0.025517310947179794, -0.024406127631664276, -0.023294946178793907, -0.022183764725923538, -0.02107258141040802, -0.019961398094892502, -0.018850216642022133, -0.017739035189151764, -0.016627851873636246, -0.015516669489443302, -0.014405487105250359, -0.013294304721057415, -0.012183122336864471, -0.011071939952671528, -0.009960757568478584, -0.00884957518428564, -0.007738392800092697, -0.006627210415899754, -0.00551602803170681, -0.004404845647513866, -0.003293663263320923, -0.0021824808791279793, -0.0010712984949350357, 3.988388925790787e-05, 0.0011510662734508514, 0.002262248657643795, 0.0033734310418367386, 0.004484613426029682, 0.005595795810222626, 0.006706978194415569, 0.007818160578608513, 0.008929342962801456, 0.0100405253469944, 0.011151707731187344, 0.012262890115380287, 0.01337407249957323, 0.014485254883766174, 0.015596437267959118, 0.01670761965215206, 0.01781880110502243, 0.01892998442053795, 0.020041167736053467, 0.021152349188923836, 0.022263530641794205, 0.023374713957309723, 0.02448589727282524, 0.02559707872569561, 0.02670826017856598, 0.027819443494081497, 0.028930626809597015, 0.030041808262467384, 0.031152989715337753, 0.03226417303085327]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 1.0, 8.0, 9.0, 10.0, 3.0, 20.0, 24.0, 26.0, 43.0, 51.0, 64.0, 99.0, 121.0, 203.0, 241.0, 333.0, 447.0, 691.0, 985.0, 1526.0, 2742.0, 5228.0, 14781.0, 174752.0, 813876.0, 18174.0, 5891.0, 2858.0, 1596.0, 1046.0, 756.0, 517.0, 401.0, 238.0, 214.0, 160.0, 103.0, 81.0, 66.0, 46.0, 28.0, 22.0, 27.0, 15.0, 13.0, 6.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.041656494140625, -0.04043436050415039, -0.03921222686767578, -0.03799009323120117, -0.03676795959472656, -0.03554582595825195, -0.034323692321777344, -0.033101558685302734, -0.031879425048828125, -0.030657291412353516, -0.029435157775878906, -0.028213024139404297, -0.026990890502929688, -0.025768756866455078, -0.02454662322998047, -0.02332448959350586, -0.02210235595703125, -0.02088022232055664, -0.01965808868408203, -0.018435955047607422, -0.017213821411132812, -0.015991687774658203, -0.014769554138183594, -0.013547420501708984, -0.012325286865234375, -0.011103153228759766, -0.009881019592285156, -0.008658885955810547, -0.0074367523193359375, -0.006214618682861328, -0.004992485046386719, -0.0037703514099121094, -0.0025482177734375, -0.0013260841369628906, -0.00010395050048828125, 0.0011181831359863281, 0.0023403167724609375, 0.003562450408935547, 0.004784584045410156, 0.006006717681884766, 0.007228851318359375, 0.008450984954833984, 0.009673118591308594, 0.010895252227783203, 0.012117385864257812, 0.013339519500732422, 0.014561653137207031, 0.01578378677368164, 0.01700592041015625, 0.01822805404663086, 0.01945018768310547, 0.020672321319580078, 0.021894454956054688, 0.023116588592529297, 0.024338722229003906, 0.025560855865478516, 0.026782989501953125, 0.028005123138427734, 0.029227256774902344, 0.030449390411376953, 0.03167152404785156, 0.03289365768432617, 0.03411579132080078, 0.03533792495727539, 0.03656005859375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 7.0, 16.0, 10.0, 8.0, 15.0, 43.0, 121.0, 252.0, 239.0, 122.0, 42.0, 11.0, 11.0, 12.0, 9.0, 9.0, 7.0, 3.0, 5.0, 1.0, 5.0, 3.0, 3.0, 5.0, 5.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007162928581237793, -0.006910085678100586, -0.006657242774963379, -0.006404399871826172, -0.006151556968688965, -0.005898714065551758, -0.005645871162414551, -0.005393028259277344, -0.005140185356140137, -0.00488734245300293, -0.004634499549865723, -0.004381656646728516, -0.004128813743591309, -0.0038759708404541016, -0.0036231279373168945, -0.0033702850341796875, -0.0031174421310424805, -0.0028645992279052734, -0.0026117563247680664, -0.0023589134216308594, -0.0021060705184936523, -0.0018532276153564453, -0.0016003847122192383, -0.0013475418090820312, -0.0010946989059448242, -0.0008418560028076172, -0.0005890130996704102, -0.0003361701965332031, -8.33272933959961e-05, 0.00016951560974121094, 0.00042235851287841797, 0.000675201416015625, 0.000928044319152832, 0.001180887222290039, 0.001433730125427246, 0.0016865730285644531, 0.0019394159317016602, 0.002192258834838867, 0.0024451017379760742, 0.0026979446411132812, 0.0029507875442504883, 0.0032036304473876953, 0.0034564733505249023, 0.0037093162536621094, 0.003962159156799316, 0.0042150020599365234, 0.0044678449630737305, 0.0047206878662109375, 0.0049735307693481445, 0.0052263736724853516, 0.005479216575622559, 0.005732059478759766, 0.005984902381896973, 0.00623774528503418, 0.006490588188171387, 0.006743431091308594, 0.006996273994445801, 0.007249116897583008, 0.007501959800720215, 0.007754802703857422, 0.008007645606994629, 0.008260488510131836, 0.008513331413269043, 0.00876617431640625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 6.0, 5.0, 13.0, 13.0, 16.0, 16.0, 24.0, 31.0, 46.0, 66.0, 85.0, 109.0, 143.0, 221.0, 352.0, 649.0, 1672.0, 41944.0, 997069.0, 3825.0, 886.0, 467.0, 255.0, 163.0, 130.0, 76.0, 60.0, 43.0, 52.0, 34.0, 29.0, 14.0, 11.0, 6.0, 9.0, 6.0, 1.0, 3.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039031982421875, -0.03769636154174805, -0.036360740661621094, -0.03502511978149414, -0.03368949890136719, -0.032353878021240234, -0.03101825714111328, -0.029682636260986328, -0.028347015380859375, -0.027011394500732422, -0.02567577362060547, -0.024340152740478516, -0.023004531860351562, -0.02166891098022461, -0.020333290100097656, -0.018997669219970703, -0.01766204833984375, -0.016326427459716797, -0.014990806579589844, -0.01365518569946289, -0.012319564819335938, -0.010983943939208984, -0.009648323059082031, -0.008312702178955078, -0.006977081298828125, -0.005641460418701172, -0.004305839538574219, -0.0029702186584472656, -0.0016345977783203125, -0.0002989768981933594, 0.0010366439819335938, 0.002372264862060547, 0.0037078857421875, 0.005043506622314453, 0.006379127502441406, 0.007714748382568359, 0.009050369262695312, 0.010385990142822266, 0.011721611022949219, 0.013057231903076172, 0.014392852783203125, 0.015728473663330078, 0.01706409454345703, 0.018399715423583984, 0.019735336303710938, 0.02107095718383789, 0.022406578063964844, 0.023742198944091797, 0.02507781982421875, 0.026413440704345703, 0.027749061584472656, 0.02908468246459961, 0.030420303344726562, 0.031755924224853516, 0.03309154510498047, 0.03442716598510742, 0.035762786865234375, 0.03709840774536133, 0.03843402862548828, 0.039769649505615234, 0.04110527038574219, 0.04244089126586914, 0.043776512145996094, 0.04511213302612305, 0.04644775390625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 5.0, 5.0, 11.0, 10.0, 9.0, 14.0, 16.0, 20.0, 25.0, 32.0, 35.0, 43.0, 45.0, 52.0, 45.0, 39.0, 35.0, 53.0, 64.0, 46.0, 46.0, 47.0, 42.0, 37.0, 38.0, 30.0, 23.0, 25.0, 31.0, 21.0, 20.0, 8.0, 6.0, 5.0, 9.0, 4.0, 1.0, 3.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0171051025390625, -0.016519784927368164, -0.015934467315673828, -0.015349149703979492, -0.014763832092285156, -0.01417851448059082, -0.013593196868896484, -0.013007879257202148, -0.012422561645507812, -0.011837244033813477, -0.01125192642211914, -0.010666608810424805, -0.010081291198730469, -0.009495973587036133, -0.008910655975341797, -0.008325338363647461, -0.007740020751953125, -0.007154703140258789, -0.006569385528564453, -0.005984067916870117, -0.005398750305175781, -0.004813432693481445, -0.004228115081787109, -0.0036427974700927734, -0.0030574798583984375, -0.0024721622467041016, -0.0018868446350097656, -0.0013015270233154297, -0.0007162094116210938, -0.0001308917999267578, 0.0004544258117675781, 0.001039743423461914, 0.00162506103515625, 0.002210378646850586, 0.002795696258544922, 0.003381013870239258, 0.003966331481933594, 0.00455164909362793, 0.005136966705322266, 0.0057222843170166016, 0.0063076019287109375, 0.0068929195404052734, 0.007478237152099609, 0.008063554763793945, 0.008648872375488281, 0.009234189987182617, 0.009819507598876953, 0.010404825210571289, 0.010990142822265625, 0.011575460433959961, 0.012160778045654297, 0.012746095657348633, 0.013331413269042969, 0.013916730880737305, 0.01450204849243164, 0.015087366104125977, 0.015672683715820312, 0.01625800132751465, 0.016843318939208984, 0.01742863655090332, 0.018013954162597656, 0.018599271774291992, 0.019184589385986328, 0.019769906997680664, 0.020355224609375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 4.0, 2.0, 5.0, 4.0, 6.0, 9.0, 9.0, 9.0, 11.0, 7.0, 16.0, 22.0, 29.0, 31.0, 37.0, 55.0, 58.0, 103.0, 141.0, 314.0, 455.0, 1007.0, 3273.0, 16442.0, 970193.0, 48851.0, 4466.0, 1402.0, 596.0, 362.0, 162.0, 120.0, 78.0, 66.0, 44.0, 36.0, 25.0, 21.0, 24.0, 12.0, 3.0, 12.0, 10.0, 7.0, 1.0, 7.0, 1.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8656253814697266e-05, -1.798197627067566e-05, -1.7307698726654053e-05, -1.6633421182632446e-05, -1.595914363861084e-05, -1.5284866094589233e-05, -1.4610588550567627e-05, -1.393631100654602e-05, -1.3262033462524414e-05, -1.2587755918502808e-05, -1.1913478374481201e-05, -1.1239200830459595e-05, -1.0564923286437988e-05, -9.890645742416382e-06, -9.216368198394775e-06, -8.542090654373169e-06, -7.867813110351562e-06, -7.193535566329956e-06, -6.51925802230835e-06, -5.844980478286743e-06, -5.170702934265137e-06, -4.49642539024353e-06, -3.822147846221924e-06, -3.1478703022003174e-06, -2.473592758178711e-06, -1.7993152141571045e-06, -1.125037670135498e-06, -4.507601261138916e-07, 2.2351741790771484e-07, 8.977949619293213e-07, 1.5720725059509277e-06, 2.246350049972534e-06, 2.9206275939941406e-06, 3.594905138015747e-06, 4.2691826820373535e-06, 4.94346022605896e-06, 5.617737770080566e-06, 6.292015314102173e-06, 6.966292858123779e-06, 7.640570402145386e-06, 8.314847946166992e-06, 8.989125490188599e-06, 9.663403034210205e-06, 1.0337680578231812e-05, 1.1011958122253418e-05, 1.1686235666275024e-05, 1.2360513210296631e-05, 1.3034790754318237e-05, 1.3709068298339844e-05, 1.438334584236145e-05, 1.5057623386383057e-05, 1.5731900930404663e-05, 1.640617847442627e-05, 1.7080456018447876e-05, 1.7754733562469482e-05, 1.842901110649109e-05, 1.9103288650512695e-05, 1.9777566194534302e-05, 2.0451843738555908e-05, 2.1126121282577515e-05, 2.180039882659912e-05, 2.2474676370620728e-05, 2.3148953914642334e-05, 2.382323145866394e-05, 2.4497509002685547e-05]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 3.0, 4.0, 5.0, 7.0, 6.0, 10.0, 5.0, 16.0, 14.0, 18.0, 21.0, 20.0, 38.0, 25.0, 53.0, 96.0, 96.0, 140.0, 91.0, 79.0, 45.0, 33.0, 32.0, 18.0, 25.0, 20.0, 18.0, 11.0, 5.0, 7.0, 6.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.927417755126953e-06, -7.636845111846924e-06, -7.3462724685668945e-06, -7.055699825286865e-06, -6.765127182006836e-06, -6.474554538726807e-06, -6.183981895446777e-06, -5.893409252166748e-06, -5.602836608886719e-06, -5.3122639656066895e-06, -5.02169132232666e-06, -4.731118679046631e-06, -4.4405460357666016e-06, -4.149973392486572e-06, -3.859400749206543e-06, -3.5688281059265137e-06, -3.2782554626464844e-06, -2.987682819366455e-06, -2.6971101760864258e-06, -2.4065375328063965e-06, -2.115964889526367e-06, -1.8253922462463379e-06, -1.5348196029663086e-06, -1.2442469596862793e-06, -9.5367431640625e-07, -6.631016731262207e-07, -3.725290298461914e-07, -8.195638656616211e-08, 2.086162567138672e-07, 4.991888999938965e-07, 7.897615432739258e-07, 1.080334186553955e-06, 1.3709068298339844e-06, 1.6614794731140137e-06, 1.952052116394043e-06, 2.2426247596740723e-06, 2.5331974029541016e-06, 2.823770046234131e-06, 3.11434268951416e-06, 3.4049153327941895e-06, 3.6954879760742188e-06, 3.986060619354248e-06, 4.276633262634277e-06, 4.567205905914307e-06, 4.857778549194336e-06, 5.148351192474365e-06, 5.4389238357543945e-06, 5.729496479034424e-06, 6.020069122314453e-06, 6.310641765594482e-06, 6.601214408874512e-06, 6.891787052154541e-06, 7.18235969543457e-06, 7.4729323387146e-06, 7.763504981994629e-06, 8.054077625274658e-06, 8.344650268554688e-06, 8.635222911834717e-06, 8.925795555114746e-06, 9.216368198394775e-06, 9.506940841674805e-06, 9.797513484954834e-06, 1.0088086128234863e-05, 1.0378658771514893e-05, 1.0669231414794922e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 2.0, 3.0, 7.0, 8.0, 13.0, 17.0, 21.0, 22.0, 43.0, 58.0, 97.0, 160.0, 406.0, 2040.0, 1034552.0, 9792.0, 715.0, 223.0, 128.0, 65.0, 56.0, 30.0, 23.0, 16.0, 6.0, 10.0, 9.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-8.761882781982422e-05, -8.52951779961586e-05, -8.297152817249298e-05, -8.064787834882736e-05, -7.832422852516174e-05, -7.600057870149612e-05, -7.36769288778305e-05, -7.135327905416489e-05, -6.902962923049927e-05, -6.670597940683365e-05, -6.438232958316803e-05, -6.205867975950241e-05, -5.973502993583679e-05, -5.741138011217117e-05, -5.5087730288505554e-05, -5.2764080464839935e-05, -5.0440430641174316e-05, -4.81167808175087e-05, -4.579313099384308e-05, -4.346948117017746e-05, -4.114583134651184e-05, -3.882218152284622e-05, -3.64985316991806e-05, -3.4174881875514984e-05, -3.1851232051849365e-05, -2.9527582228183746e-05, -2.7203932404518127e-05, -2.488028258085251e-05, -2.255663275718689e-05, -2.023298293352127e-05, -1.7909333109855652e-05, -1.5585683286190033e-05, -1.3262033462524414e-05, -1.0938383638858795e-05, -8.614733815193176e-06, -6.291083991527557e-06, -3.9674341678619385e-06, -1.6437843441963196e-06, 6.798654794692993e-07, 3.0035153031349182e-06, 5.327165126800537e-06, 7.650814950466156e-06, 9.974464774131775e-06, 1.2298114597797394e-05, 1.4621764421463013e-05, 1.694541424512863e-05, 1.926906406879425e-05, 2.159271389245987e-05, 2.3916363716125488e-05, 2.6240013539791107e-05, 2.8563663363456726e-05, 3.0887313187122345e-05, 3.3210963010787964e-05, 3.553461283445358e-05, 3.78582626581192e-05, 4.018191248178482e-05, 4.250556230545044e-05, 4.482921212911606e-05, 4.715286195278168e-05, 4.9476511776447296e-05, 5.1800161600112915e-05, 5.4123811423778534e-05, 5.644746124744415e-05, 5.877111107110977e-05, 6.109476089477539e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 7.0, 2.0, 5.0, 8.0, 8.0, 8.0, 21.0, 16.0, 23.0, 22.0, 44.0, 120.0, 346.0, 120.0, 81.0, 40.0, 35.0, 22.0, 14.0, 17.0, 8.0, 7.0, 4.0, 4.0, 4.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.844499588012695e-05, -3.745127469301224e-05, -3.645755350589752e-05, -3.5463832318782806e-05, -3.447011113166809e-05, -3.3476389944553375e-05, -3.248266875743866e-05, -3.1488947570323944e-05, -3.049522638320923e-05, -2.9501505196094513e-05, -2.8507784008979797e-05, -2.7514062821865082e-05, -2.6520341634750366e-05, -2.552662044763565e-05, -2.4532899260520935e-05, -2.353917807340622e-05, -2.2545456886291504e-05, -2.155173569917679e-05, -2.0558014512062073e-05, -1.9564293324947357e-05, -1.857057213783264e-05, -1.7576850950717926e-05, -1.658312976360321e-05, -1.5589408576488495e-05, -1.459568738937378e-05, -1.3601966202259064e-05, -1.2608245015144348e-05, -1.1614523828029633e-05, -1.0620802640914917e-05, -9.627081453800201e-06, -8.633360266685486e-06, -7.63963907957077e-06, -6.645917892456055e-06, -5.652196705341339e-06, -4.6584755182266235e-06, -3.664754331111908e-06, -2.6710331439971924e-06, -1.6773119568824768e-06, -6.835907697677612e-07, 3.1013041734695435e-07, 1.30385160446167e-06, 2.2975727915763855e-06, 3.291293978691101e-06, 4.285015165805817e-06, 5.278736352920532e-06, 6.272457540035248e-06, 7.266178727149963e-06, 8.259899914264679e-06, 9.253621101379395e-06, 1.024734228849411e-05, 1.1241063475608826e-05, 1.2234784662723541e-05, 1.3228505849838257e-05, 1.4222227036952972e-05, 1.5215948224067688e-05, 1.6209669411182404e-05, 1.720339059829712e-05, 1.8197111785411835e-05, 1.919083297252655e-05, 2.0184554159641266e-05, 2.117827534675598e-05, 2.2171996533870697e-05, 2.3165717720985413e-05, 2.4159438908100128e-05, 2.5153160095214844e-05]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 30.0, 921.0, 62.0], "bins": [-0.558448314666748, -0.5495374798774719, -0.5406267046928406, -0.5317158699035645, -0.5228050947189331, -0.513894259929657, -0.5049834847450256, -0.4960726499557495, -0.4871618449687958, -0.47825103998184204, -0.4693402349948883, -0.46042943000793457, -0.45151859521865845, -0.4426077902317047, -0.433696985244751, -0.42478618025779724, -0.4158753752708435, -0.40696457028388977, -0.39805376529693604, -0.3891429603099823, -0.38023215532302856, -0.37132132053375244, -0.3624105155467987, -0.35349971055984497, -0.34458890557289124, -0.3356781005859375, -0.32676729559898376, -0.31785649061203003, -0.3089456558227539, -0.30003485083580017, -0.29112404584884644, -0.2822132408618927, -0.2733024060726166, -0.26439160108566284, -0.2554807960987091, -0.24656997621059418, -0.23765917122364044, -0.2287483662366867, -0.21983754634857178, -0.21092674136161804, -0.2020159512758255, -0.19310514628887177, -0.18419432640075684, -0.1752835214138031, -0.16637271642684937, -0.15746191143989563, -0.1485511064529419, -0.13964028656482697, -0.13072948157787323, -0.1218186765909195, -0.11290786415338516, -0.10399705171585083, -0.0950862467288971, -0.08617544174194336, -0.07726462930440903, -0.0683538168668747, -0.05944300442934036, -0.05053219571709633, -0.041621387004852295, -0.03271057829260826, -0.023799769580364227, -0.014888960868120193, -0.00597815215587616, 0.002932656556367874, 0.011843464337289333]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 7.0, 5.0, 12.0, 10.0, 11.0, 17.0, 17.0, 22.0, 23.0, 22.0, 44.0, 32.0, 36.0, 38.0, 39.0, 66.0, 53.0, 65.0, 54.0, 59.0, 51.0, 41.0, 51.0, 32.0, 33.0, 31.0, 21.0, 17.0, 16.0, 13.0, 17.0, 11.0, 3.0, 10.0, 3.0, 2.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.08399641513824463, -0.08156851679086685, -0.07914061099290848, -0.0767127126455307, -0.07428480684757233, -0.07185690850019455, -0.06942901015281677, -0.0670011043548584, -0.06457320600748062, -0.062145303934812546, -0.05971740186214447, -0.05728950351476669, -0.05486160144209862, -0.05243369936943054, -0.050005801022052765, -0.04757789894938469, -0.045149996876716614, -0.04272209480404854, -0.04029419273138046, -0.037866294384002686, -0.03543839231133461, -0.033010490238666534, -0.030582590028643608, -0.028154689818620682, -0.025726787745952606, -0.02329888567328453, -0.020870985463261604, -0.018443085253238678, -0.016015183180570602, -0.013587282039225101, -0.0111593808978796, -0.008731480687856674, -0.006303578615188599, -0.0038756774738430977, -0.0014477763324975967, 0.0009801248088479042, 0.003408025950193405, 0.005835927091538906, 0.008263828232884407, 0.010691728442907333, 0.013119630515575409, 0.01554753165692091, 0.01797543279826641, 0.020403333008289337, 0.022831235080957413, 0.02525913715362549, 0.027687037363648415, 0.03011493757367134, 0.032542839646339417, 0.03497074171900749, 0.03739864379167557, 0.039826542139053345, 0.04225444421172142, 0.044682346284389496, 0.04711024463176727, 0.04953814670443535, 0.051966048777103424, 0.0543939508497715, 0.056821852922439575, 0.05924975126981735, 0.06167765334248543, 0.0641055554151535, 0.06653345376253128, 0.06896135210990906, 0.07138925790786743]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 5.0, 8.0, 7.0, 8.0, 5.0, 9.0, 15.0, 27.0, 24.0, 28.0, 44.0, 78.0, 274.0, 1536.0, 4191353.0, 497.0, 104.0, 44.0, 35.0, 34.0, 20.0, 19.0, 17.0, 14.0, 11.0, 5.0, 8.0, 8.0, 6.0, 5.0, 7.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.095703125, -2.024200439453125, -1.95269775390625, -1.881195068359375, -1.8096923828125, -1.738189697265625, -1.66668701171875, -1.595184326171875, -1.523681640625, -1.452178955078125, -1.38067626953125, -1.309173583984375, -1.2376708984375, -1.166168212890625, -1.09466552734375, -1.023162841796875, -0.95166015625, -0.880157470703125, -0.80865478515625, -0.737152099609375, -0.6656494140625, -0.594146728515625, -0.52264404296875, -0.451141357421875, -0.379638671875, -0.308135986328125, -0.23663330078125, -0.165130615234375, -0.0936279296875, -0.022125244140625, 0.04937744140625, 0.120880126953125, 0.1923828125, 0.263885498046875, 0.33538818359375, 0.406890869140625, 0.4783935546875, 0.549896240234375, 0.62139892578125, 0.692901611328125, 0.764404296875, 0.835906982421875, 0.90740966796875, 0.978912353515625, 1.0504150390625, 1.121917724609375, 1.19342041015625, 1.264923095703125, 1.33642578125, 1.407928466796875, 1.47943115234375, 1.550933837890625, 1.6224365234375, 1.693939208984375, 1.76544189453125, 1.836944580078125, 1.908447265625, 1.979949951171875, 2.05145263671875, 2.122955322265625, 2.1944580078125, 2.265960693359375, 2.33746337890625, 2.408966064453125, 2.48046875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 4.0, 7.0, 12.0, 15.0, 5.0, 16.0, 39.0, 112.0, 216.0, 259.0, 145.0, 47.0, 14.0, 11.0, 13.0, 7.0, 10.0, 6.0, 4.0, 5.0, 1.0, 5.0, 3.0, 2.0, 6.0, 4.0, 3.0, 0.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007163882255554199, -0.0069119930267333984, -0.006660103797912598, -0.006408214569091797, -0.006156325340270996, -0.005904436111450195, -0.0056525468826293945, -0.005400657653808594, -0.005148768424987793, -0.004896879196166992, -0.004644989967346191, -0.004393100738525391, -0.00414121150970459, -0.003889322280883789, -0.0036374330520629883, -0.0033855438232421875, -0.0031336545944213867, -0.002881765365600586, -0.002629876136779785, -0.0023779869079589844, -0.0021260976791381836, -0.0018742084503173828, -0.001622319221496582, -0.0013704299926757812, -0.0011185407638549805, -0.0008666515350341797, -0.0006147623062133789, -0.0003628730773925781, -0.00011098384857177734, 0.00014090538024902344, 0.0003927946090698242, 0.000644683837890625, 0.0008965730667114258, 0.0011484622955322266, 0.0014003515243530273, 0.0016522407531738281, 0.001904129981994629, 0.0021560192108154297, 0.0024079084396362305, 0.0026597976684570312, 0.002911686897277832, 0.003163576126098633, 0.0034154653549194336, 0.0036673545837402344, 0.003919243812561035, 0.004171133041381836, 0.004423022270202637, 0.0046749114990234375, 0.004926800727844238, 0.005178689956665039, 0.00543057918548584, 0.005682468414306641, 0.005934357643127441, 0.006186246871948242, 0.006438136100769043, 0.006690025329589844, 0.0069419145584106445, 0.007193803787231445, 0.007445693016052246, 0.007697582244873047, 0.007949471473693848, 0.008201360702514648, 0.00845324993133545, 0.00870513916015625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 8.0, 10.0, 11.0, 19.0, 18.0, 35.0, 49.0, 101.0, 145.0, 267.0, 603.0, 1485.0, 4477.0, 26272.0, 4135100.0, 19698.0, 3598.0, 1217.0, 497.0, 269.0, 132.0, 84.0, 51.0, 33.0, 29.0, 19.0, 13.0, 8.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.04852294921875, -0.046929359436035156, -0.04533576965332031, -0.04374217987060547, -0.042148590087890625, -0.04055500030517578, -0.03896141052246094, -0.037367820739746094, -0.03577423095703125, -0.034180641174316406, -0.03258705139160156, -0.03099346160888672, -0.029399871826171875, -0.02780628204345703, -0.026212692260742188, -0.024619102478027344, -0.0230255126953125, -0.021431922912597656, -0.019838333129882812, -0.01824474334716797, -0.016651153564453125, -0.015057563781738281, -0.013463973999023438, -0.011870384216308594, -0.01027679443359375, -0.008683204650878906, -0.0070896148681640625, -0.005496025085449219, -0.003902435302734375, -0.0023088455200195312, -0.0007152557373046875, 0.0008783340454101562, 0.002471923828125, 0.004065513610839844, 0.0056591033935546875, 0.007252693176269531, 0.008846282958984375, 0.010439872741699219, 0.012033462524414062, 0.013627052307128906, 0.01522064208984375, 0.016814231872558594, 0.018407821655273438, 0.02000141143798828, 0.021595001220703125, 0.02318859100341797, 0.024782180786132812, 0.026375770568847656, 0.0279693603515625, 0.029562950134277344, 0.031156539916992188, 0.03275012969970703, 0.034343719482421875, 0.03593730926513672, 0.03753089904785156, 0.039124488830566406, 0.04071807861328125, 0.042311668395996094, 0.04390525817871094, 0.04549884796142578, 0.047092437744140625, 0.04868602752685547, 0.05027961730957031, 0.051873207092285156, 0.053466796875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 4.0, 1.0, 6.0, 6.0, 10.0, 5.0, 9.0, 10.0, 26.0, 60.0, 252.0, 3067.0, 407.0, 96.0, 35.0, 14.0, 9.0, 7.0, 7.0, 3.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.01409149169921875, -0.013717055320739746, -0.013342618942260742, -0.012968182563781738, -0.012593746185302734, -0.01221930980682373, -0.011844873428344727, -0.011470437049865723, -0.011096000671386719, -0.010721564292907715, -0.010347127914428711, -0.009972691535949707, -0.009598255157470703, -0.0092238187789917, -0.008849382400512695, -0.008474946022033691, -0.008100509643554688, -0.007726073265075684, -0.00735163688659668, -0.006977200508117676, -0.006602764129638672, -0.006228327751159668, -0.005853891372680664, -0.00547945499420166, -0.005105018615722656, -0.004730582237243652, -0.0043561458587646484, -0.0039817094802856445, -0.0036072731018066406, -0.0032328367233276367, -0.002858400344848633, -0.002483963966369629, -0.002109527587890625, -0.001735091209411621, -0.0013606548309326172, -0.0009862184524536133, -0.0006117820739746094, -0.00023734569549560547, 0.00013709068298339844, 0.0005115270614624023, 0.0008859634399414062, 0.0012603998184204102, 0.001634836196899414, 0.002009272575378418, 0.002383708953857422, 0.0027581453323364258, 0.0031325817108154297, 0.0035070180892944336, 0.0038814544677734375, 0.004255890846252441, 0.004630327224731445, 0.005004763603210449, 0.005379199981689453, 0.005753636360168457, 0.006128072738647461, 0.006502509117126465, 0.006876945495605469, 0.007251381874084473, 0.0076258182525634766, 0.00800025463104248, 0.008374691009521484, 0.008749127388000488, 0.009123563766479492, 0.009498000144958496, 0.0098724365234375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 18.0, 111.0, 628.0, 153.0, 47.0, 22.0, 14.0, 8.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055271510034799576, -0.048703815788030624, -0.04213612154126167, -0.03556842729449272, -0.02900073304772377, -0.02243303880095482, -0.015865344554185867, -0.009297650307416916, -0.0027299560606479645, 0.003837738186120987, 0.010405432432889938, 0.01697312667965889, 0.02354082092642784, 0.030108515173196793, 0.036676209419965744, 0.043243903666734695, 0.04981159791350365, 0.0563792921602726, 0.06294699013233185, 0.0695146769285202, 0.07608237862586975, 0.0826500654220581, 0.08921776711940765, 0.09578545391559601, 0.10235315561294556, 0.10892084985971451, 0.11548854410648346, 0.12205623835325241, 0.12862393260002136, 0.13519161939620972, 0.14175932109355927, 0.1483270227909088, 0.15489470958709717, 0.16146239638328552, 0.16803009808063507, 0.17459779977798462, 0.18116548657417297, 0.18773317337036133, 0.19430087506771088, 0.20086857676506042, 0.20743626356124878, 0.21400395035743713, 0.22057165205478668, 0.22713935375213623, 0.23370704054832458, 0.24027472734451294, 0.2468424290418625, 0.25341013073921204, 0.2599778175354004, 0.26654550433158875, 0.2731131911277771, 0.27968090772628784, 0.2862485945224762, 0.29281628131866455, 0.2993839979171753, 0.30595168471336365, 0.312519371509552, 0.31908705830574036, 0.3256547451019287, 0.33222246170043945, 0.3387901484966278, 0.34535783529281616, 0.3519255518913269, 0.35849323868751526, 0.3650609254837036]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 6.0, 3.0, 7.0, 8.0, 12.0, 11.0, 20.0, 16.0, 35.0, 35.0, 36.0, 40.0, 56.0, 52.0, 44.0, 49.0, 53.0, 51.0, 71.0, 60.0, 48.0, 46.0, 40.0, 47.0, 37.0, 22.0, 22.0, 15.0, 15.0, 11.0, 11.0, 6.0, 9.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.035768866539001465, -0.0345376580953598, -0.03330644965171814, -0.03207524120807648, -0.030844032764434814, -0.029612824320793152, -0.02838161587715149, -0.027150407433509827, -0.025919198989868164, -0.0246879905462265, -0.02345678210258484, -0.022225573658943176, -0.020994365215301514, -0.01976315677165985, -0.01853194832801819, -0.017300739884376526, -0.016069531440734863, -0.0148383229970932, -0.013607114553451538, -0.012375906109809875, -0.011144697666168213, -0.00991348922252655, -0.008682280778884888, -0.007451072335243225, -0.0062198638916015625, -0.0049886554479599, -0.0037574470043182373, -0.0025262385606765747, -0.0012950301170349121, -6.382167339324951e-05, 0.001167386770248413, 0.0023985952138900757, 0.0036298036575317383, 0.004861012101173401, 0.0060922205448150635, 0.007323428988456726, 0.008554637432098389, 0.009785845875740051, 0.011017054319381714, 0.012248262763023376, 0.013479471206665039, 0.014710679650306702, 0.015941888093948364, 0.017173096537590027, 0.01840430498123169, 0.019635513424873352, 0.020866721868515015, 0.022097930312156677, 0.02332913875579834, 0.024560347199440002, 0.025791555643081665, 0.027022764086723328, 0.02825397253036499, 0.029485180974006653, 0.030716389417648315, 0.03194759786128998, 0.03317880630493164, 0.0344100147485733, 0.035641223192214966, 0.03687243163585663, 0.03810364007949829, 0.039334848523139954, 0.040566056966781616, 0.04179726541042328, 0.04302847385406494]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 7.0, 6.0, 11.0, 11.0, 20.0, 33.0, 38.0, 74.0, 128.0, 196.0, 376.0, 896.0, 2119.0, 6072.0, 26431.0, 954107.0, 44849.0, 8121.0, 2785.0, 1128.0, 536.0, 241.0, 138.0, 87.0, 43.0, 31.0, 12.0, 16.0, 11.0, 4.0, 3.0, 6.0, 1.0, 2.0, 5.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0655517578125, -0.0633382797241211, -0.06112480163574219, -0.05891132354736328, -0.056697845458984375, -0.05448436737060547, -0.05227088928222656, -0.050057411193847656, -0.04784393310546875, -0.045630455017089844, -0.04341697692871094, -0.04120349884033203, -0.038990020751953125, -0.03677654266357422, -0.03456306457519531, -0.032349586486816406, -0.0301361083984375, -0.027922630310058594, -0.025709152221679688, -0.02349567413330078, -0.021282196044921875, -0.01906871795654297, -0.016855239868164062, -0.014641761779785156, -0.01242828369140625, -0.010214805603027344, -0.008001327514648438, -0.005787849426269531, -0.003574371337890625, -0.0013608932495117188, 0.0008525848388671875, 0.0030660629272460938, 0.005279541015625, 0.007493019104003906, 0.009706497192382812, 0.011919975280761719, 0.014133453369140625, 0.01634693145751953, 0.018560409545898438, 0.020773887634277344, 0.02298736572265625, 0.025200843811035156, 0.027414321899414062, 0.02962779998779297, 0.031841278076171875, 0.03405475616455078, 0.03626823425292969, 0.038481712341308594, 0.0406951904296875, 0.042908668518066406, 0.04512214660644531, 0.04733562469482422, 0.049549102783203125, 0.05176258087158203, 0.05397605895996094, 0.056189537048339844, 0.05840301513671875, 0.060616493225097656, 0.06282997131347656, 0.06504344940185547, 0.06725692749023438, 0.06947040557861328, 0.07168388366699219, 0.0738973617553711, 0.07611083984375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 2.0, 3.0, 10.0, 12.0, 12.0, 15.0, 14.0, 67.0, 136.0, 233.0, 216.0, 116.0, 46.0, 16.0, 11.0, 10.0, 11.0, 8.0, 5.0, 4.0, 3.0, 1.0, 6.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007381439208984375, -0.007128655910491943, -0.006875872611999512, -0.00662308931350708, -0.0063703060150146484, -0.006117522716522217, -0.005864739418029785, -0.0056119561195373535, -0.005359172821044922, -0.00510638952255249, -0.004853606224060059, -0.004600822925567627, -0.004348039627075195, -0.004095256328582764, -0.003842473030090332, -0.0035896897315979004, -0.0033369064331054688, -0.003084123134613037, -0.0028313398361206055, -0.002578556537628174, -0.002325773239135742, -0.0020729899406433105, -0.001820206642150879, -0.0015674233436584473, -0.0013146400451660156, -0.001061856746673584, -0.0008090734481811523, -0.0005562901496887207, -0.00030350685119628906, -5.072355270385742e-05, 0.00020205974578857422, 0.00045484304428100586, 0.0007076263427734375, 0.0009604096412658691, 0.0012131929397583008, 0.0014659762382507324, 0.001718759536743164, 0.0019715428352355957, 0.0022243261337280273, 0.002477109432220459, 0.0027298927307128906, 0.0029826760292053223, 0.003235459327697754, 0.0034882426261901855, 0.003741025924682617, 0.003993809223175049, 0.0042465925216674805, 0.004499375820159912, 0.004752159118652344, 0.005004942417144775, 0.005257725715637207, 0.005510509014129639, 0.00576329231262207, 0.006016075611114502, 0.006268858909606934, 0.006521642208099365, 0.006774425506591797, 0.0070272088050842285, 0.00727999210357666, 0.007532775402069092, 0.0077855587005615234, 0.008038341999053955, 0.008291125297546387, 0.008543908596038818, 0.00879669189453125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 0.0, 5.0, 5.0, 8.0, 6.0, 13.0, 20.0, 23.0, 30.0, 34.0, 47.0, 51.0, 81.0, 130.0, 189.0, 275.0, 440.0, 776.0, 1612.0, 3682.0, 10355.0, 38986.0, 416877.0, 515853.0, 40892.0, 10645.0, 3739.0, 1571.0, 817.0, 473.0, 274.0, 199.0, 116.0, 86.0, 68.0, 43.0, 30.0, 21.0, 24.0, 17.0, 12.0, 9.0, 7.0, 9.0, 4.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0298309326171875, -0.028927326202392578, -0.028023719787597656, -0.027120113372802734, -0.026216506958007812, -0.02531290054321289, -0.02440929412841797, -0.023505687713623047, -0.022602081298828125, -0.021698474884033203, -0.02079486846923828, -0.01989126205444336, -0.018987655639648438, -0.018084049224853516, -0.017180442810058594, -0.016276836395263672, -0.01537322998046875, -0.014469623565673828, -0.013566017150878906, -0.012662410736083984, -0.011758804321289062, -0.01085519790649414, -0.009951591491699219, -0.009047985076904297, -0.008144378662109375, -0.007240772247314453, -0.006337165832519531, -0.005433559417724609, -0.0045299530029296875, -0.0036263465881347656, -0.0027227401733398438, -0.0018191337585449219, -0.00091552734375, -1.1920928955078125e-05, 0.0008916854858398438, 0.0017952919006347656, 0.0026988983154296875, 0.0036025047302246094, 0.004506111145019531, 0.005409717559814453, 0.006313323974609375, 0.007216930389404297, 0.008120536804199219, 0.00902414321899414, 0.009927749633789062, 0.010831356048583984, 0.011734962463378906, 0.012638568878173828, 0.01354217529296875, 0.014445781707763672, 0.015349388122558594, 0.016252994537353516, 0.017156600952148438, 0.01806020736694336, 0.01896381378173828, 0.019867420196533203, 0.020771026611328125, 0.021674633026123047, 0.02257823944091797, 0.02348184585571289, 0.024385452270507812, 0.025289058685302734, 0.026192665100097656, 0.027096271514892578, 0.0279998779296875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 9.0, 9.0, 8.0, 9.0, 8.0, 7.0, 16.0, 20.0, 18.0, 29.0, 40.0, 34.0, 34.0, 35.0, 46.0, 53.0, 52.0, 45.0, 55.0, 46.0, 44.0, 53.0, 26.0, 44.0, 35.0, 46.0, 23.0, 21.0, 25.0, 14.0, 26.0, 15.0, 8.0, 8.0, 8.0, 7.0, 1.0, 3.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01538848876953125, -0.01487743854522705, -0.014366388320922852, -0.013855338096618652, -0.013344287872314453, -0.012833237648010254, -0.012322187423706055, -0.011811137199401855, -0.011300086975097656, -0.010789036750793457, -0.010277986526489258, -0.009766936302185059, -0.00925588607788086, -0.00874483585357666, -0.008233785629272461, -0.007722735404968262, -0.0072116851806640625, -0.006700634956359863, -0.006189584732055664, -0.005678534507751465, -0.005167484283447266, -0.004656434059143066, -0.004145383834838867, -0.003634333610534668, -0.0031232833862304688, -0.0026122331619262695, -0.0021011829376220703, -0.001590132713317871, -0.0010790824890136719, -0.0005680322647094727, -5.698204040527344e-05, 0.0004540681838989258, 0.000965118408203125, 0.0014761686325073242, 0.0019872188568115234, 0.0024982690811157227, 0.003009319305419922, 0.003520369529724121, 0.00403141975402832, 0.0045424699783325195, 0.005053520202636719, 0.005564570426940918, 0.006075620651245117, 0.006586670875549316, 0.007097721099853516, 0.007608771324157715, 0.008119821548461914, 0.008630871772766113, 0.009141921997070312, 0.009652972221374512, 0.010164022445678711, 0.01067507266998291, 0.01118612289428711, 0.011697173118591309, 0.012208223342895508, 0.012719273567199707, 0.013230323791503906, 0.013741374015808105, 0.014252424240112305, 0.014763474464416504, 0.015274524688720703, 0.015785574913024902, 0.0162966251373291, 0.0168076753616333, 0.0173187255859375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 10.0, 8.0, 15.0, 23.0, 35.0, 57.0, 72.0, 106.0, 153.0, 278.0, 465.0, 831.0, 1750.0, 3743.0, 9810.0, 36135.0, 616434.0, 331763.0, 31021.0, 8824.0, 3425.0, 1628.0, 826.0, 391.0, 269.0, 151.0, 111.0, 61.0, 45.0, 28.0, 21.0, 16.0, 8.0, 7.0, 6.0, 7.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012264251708984375, -0.001188039779663086, -0.0011496543884277344, -0.0011112689971923828, -0.0010728836059570312, -0.0010344982147216797, -0.0009961128234863281, -0.0009577274322509766, -0.000919342041015625, -0.0008809566497802734, -0.0008425712585449219, -0.0008041858673095703, -0.0007658004760742188, -0.0007274150848388672, -0.0006890296936035156, -0.0006506443023681641, -0.0006122589111328125, -0.0005738735198974609, -0.0005354881286621094, -0.0004971027374267578, -0.00045871734619140625, -0.0004203319549560547, -0.0003819465637207031, -0.00034356117248535156, -0.00030517578125, -0.00026679039001464844, -0.00022840499877929688, -0.0001900196075439453, -0.00015163421630859375, -0.00011324882507324219, -7.486343383789062e-05, -3.647804260253906e-05, 1.9073486328125e-06, 4.029273986816406e-05, 7.867813110351562e-05, 0.00011706352233886719, 0.00015544891357421875, 0.0001938343048095703, 0.00023221969604492188, 0.00027060508728027344, 0.000308990478515625, 0.00034737586975097656, 0.0003857612609863281, 0.0004241466522216797, 0.00046253204345703125, 0.0005009174346923828, 0.0005393028259277344, 0.0005776882171630859, 0.0006160736083984375, 0.0006544589996337891, 0.0006928443908691406, 0.0007312297821044922, 0.0007696151733398438, 0.0008080005645751953, 0.0008463859558105469, 0.0008847713470458984, 0.00092315673828125, 0.0009615421295166016, 0.0009999275207519531, 0.0010383129119873047, 0.0010766983032226562, 0.0011150836944580078, 0.0011534690856933594, 0.001191854476928711, 0.0012302398681640625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 1.0, 8.0, 5.0, 8.0, 6.0, 22.0, 123.0, 502.0, 232.0, 33.0, 12.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.073713302612305e-05, -5.881674587726593e-05, -5.6896358728408813e-05, -5.49759715795517e-05, -5.305558443069458e-05, -5.113519728183746e-05, -4.921481013298035e-05, -4.729442298412323e-05, -4.537403583526611e-05, -4.3453648686408997e-05, -4.153326153755188e-05, -3.961287438869476e-05, -3.7692487239837646e-05, -3.577210009098053e-05, -3.385171294212341e-05, -3.1931325793266296e-05, -3.001093864440918e-05, -2.8090551495552063e-05, -2.6170164346694946e-05, -2.424977719783783e-05, -2.2329390048980713e-05, -2.0409002900123596e-05, -1.848861575126648e-05, -1.6568228602409363e-05, -1.4647841453552246e-05, -1.272745430469513e-05, -1.0807067155838013e-05, -8.886680006980896e-06, -6.966292858123779e-06, -5.045905709266663e-06, -3.125518560409546e-06, -1.2051314115524292e-06, 7.152557373046875e-07, 2.635642886161804e-06, 4.556030035018921e-06, 6.476417183876038e-06, 8.396804332733154e-06, 1.0317191481590271e-05, 1.2237578630447388e-05, 1.4157965779304504e-05, 1.607835292816162e-05, 1.7998740077018738e-05, 1.9919127225875854e-05, 2.183951437473297e-05, 2.3759901523590088e-05, 2.5680288672447205e-05, 2.760067582130432e-05, 2.9521062970161438e-05, 3.1441450119018555e-05, 3.336183726787567e-05, 3.528222441673279e-05, 3.7202611565589905e-05, 3.912299871444702e-05, 4.104338586330414e-05, 4.2963773012161255e-05, 4.488416016101837e-05, 4.680454730987549e-05, 4.8724934458732605e-05, 5.064532160758972e-05, 5.256570875644684e-05, 5.4486095905303955e-05, 5.640648305416107e-05, 5.832687020301819e-05, 6.0247257351875305e-05, 6.216764450073242e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 9.0, 11.0, 17.0, 11.0, 19.0, 17.0, 29.0, 39.0, 58.0, 94.0, 135.0, 180.0, 322.0, 584.0, 1201.0, 2511.0, 7219.0, 28643.0, 629008.0, 341937.0, 24906.0, 6571.0, 2396.0, 1133.0, 560.0, 307.0, 187.0, 135.0, 92.0, 52.0, 40.0, 30.0, 24.0, 14.0, 12.0, 14.0, 6.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0012083053588867188, -0.0011692792177200317, -0.0011302530765533447, -0.0010912269353866577, -0.0010522007942199707, -0.0010131746530532837, -0.0009741485118865967, -0.0009351223707199097, -0.0008960962295532227, -0.0008570700883865356, -0.0008180439472198486, -0.0007790178060531616, -0.0007399916648864746, -0.0007009655237197876, -0.0006619393825531006, -0.0006229132413864136, -0.0005838871002197266, -0.0005448609590530396, -0.0005058348178863525, -0.00046680867671966553, -0.0004277825355529785, -0.0003887563943862915, -0.0003497302532196045, -0.0003107041120529175, -0.00027167797088623047, -0.00023265182971954346, -0.00019362568855285645, -0.00015459954738616943, -0.00011557340621948242, -7.654726505279541e-05, -3.75211238861084e-05, 1.5050172805786133e-06, 4.0531158447265625e-05, 7.955729961395264e-05, 0.00011858344078063965, 0.00015760958194732666, 0.00019663572311401367, 0.00023566186428070068, 0.0002746880054473877, 0.0003137141466140747, 0.0003527402877807617, 0.00039176642894744873, 0.00043079257011413574, 0.00046981871128082275, 0.0005088448524475098, 0.0005478709936141968, 0.0005868971347808838, 0.0006259232759475708, 0.0006649494171142578, 0.0007039755582809448, 0.0007430016994476318, 0.0007820278406143188, 0.0008210539817810059, 0.0008600801229476929, 0.0008991062641143799, 0.0009381324052810669, 0.000977158546447754, 0.001016184687614441, 0.001055210828781128, 0.001094236969947815, 0.001133263111114502, 0.001172289252281189, 0.001211315393447876, 0.001250341534614563, 0.00128936767578125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 6.0, 10.0, 10.0, 7.0, 15.0, 23.0, 18.0, 18.0, 27.0, 41.0, 42.0, 64.0, 86.0, 75.0, 95.0, 92.0, 69.0, 49.0, 44.0, 52.0, 27.0, 22.0, 18.0, 20.0, 8.0, 11.0, 10.0, 4.0, 6.0, 4.0, 2.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007576942443847656, -0.000734962522983551, -0.0007122308015823364, -0.0006894990801811218, -0.0006667673587799072, -0.0006440356373786926, -0.000621303915977478, -0.0005985721945762634, -0.0005758404731750488, -0.0005531087517738342, -0.0005303770303726196, -0.000507645308971405, -0.00048491358757019043, -0.00046218186616897583, -0.00043945014476776123, -0.00041671842336654663, -0.00039398670196533203, -0.00037125498056411743, -0.00034852325916290283, -0.00032579153776168823, -0.00030305981636047363, -0.00028032809495925903, -0.00025759637355804443, -0.00023486465215682983, -0.00021213293075561523, -0.00018940120935440063, -0.00016666948795318604, -0.00014393776655197144, -0.00012120604515075684, -9.847432374954224e-05, -7.574260234832764e-05, -5.301088094711304e-05, -3.0279159545898438e-05, -7.547438144683838e-06, 1.5184283256530762e-05, 3.791600465774536e-05, 6.064772605895996e-05, 8.337944746017456e-05, 0.00010611116886138916, 0.00012884289026260376, 0.00015157461166381836, 0.00017430633306503296, 0.00019703805446624756, 0.00021976977586746216, 0.00024250149726867676, 0.00026523321866989136, 0.00028796494007110596, 0.00031069666147232056, 0.00033342838287353516, 0.00035616010427474976, 0.00037889182567596436, 0.00040162354707717896, 0.00042435526847839355, 0.00044708698987960815, 0.00046981871128082275, 0.0004925504326820374, 0.000515282154083252, 0.0005380138754844666, 0.0005607455968856812, 0.0005834773182868958, 0.0006062090396881104, 0.000628940761089325, 0.0006516724824905396, 0.0006744042038917542, 0.0006971359252929688]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 7.0, 10.0, 16.0, 22.0, 30.0, 76.0, 159.0, 247.0, 197.0, 99.0, 43.0, 36.0, 24.0, 10.0, 8.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1494062840938568, -0.14543524384498596, -0.1414642184972763, -0.13749317824840546, -0.1335221529006958, -0.12955111265182495, -0.1255800873041153, -0.12160904705524445, -0.11763802170753479, -0.11366698890924454, -0.10969595611095428, -0.10572492331266403, -0.10175389051437378, -0.09778285771608353, -0.09381182491779327, -0.08984078466892242, -0.08586975187063217, -0.08189871907234192, -0.07792768627405167, -0.07395665347576141, -0.06998562067747116, -0.06601458787918091, -0.06204355135560036, -0.058072518557310104, -0.05410148575901985, -0.0501304529607296, -0.046159420162439346, -0.042188383638858795, -0.03821735084056854, -0.03424631804227829, -0.030275285243988037, -0.026304252445697784, -0.02233322709798813, -0.018362194299697876, -0.014391160570085049, -0.010420126840472221, -0.006449094042181969, -0.002478061243891716, 0.001492973417043686, 0.005464006215333939, 0.009435039013624191, 0.013406071811914444, 0.017377104610204697, 0.0213481392711401, 0.02531917206943035, 0.029290204867720604, 0.033261239528656006, 0.03723227232694626, 0.04120330512523651, 0.045174337923526764, 0.04914537072181702, 0.05311640352010727, 0.05708743631839752, 0.061058469116687775, 0.06502950191497803, 0.06900054216384888, 0.07297156751155853, 0.07694260030984879, 0.08091363310813904, 0.08488466590642929, 0.08885569870471954, 0.0928267315030098, 0.09679776430130005, 0.1007688045501709, 0.10473983734846115]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 6.0, 10.0, 4.0, 9.0, 17.0, 18.0, 15.0, 21.0, 19.0, 24.0, 33.0, 46.0, 39.0, 52.0, 64.0, 57.0, 65.0, 67.0, 59.0, 46.0, 45.0, 39.0, 27.0, 29.0, 29.0, 33.0, 19.0, 26.0, 22.0, 15.0, 5.0, 9.0, 6.0, 5.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.07515132427215576, -0.07287157326936722, -0.07059182226657867, -0.06831207126379013, -0.06603232026100159, -0.06375257670879364, -0.061472825706005096, -0.05919307470321655, -0.05691332370042801, -0.054633572697639465, -0.05235382169485092, -0.050074074417352676, -0.04779432341456413, -0.04551457241177559, -0.043234825134277344, -0.0409550741314888, -0.038675323128700256, -0.03639557212591171, -0.03411582112312317, -0.031836073845624924, -0.02955632284283638, -0.027276571840047836, -0.024996822699904442, -0.022717073559761047, -0.020437322556972504, -0.01815757155418396, -0.015877822414040565, -0.013598072342574596, -0.011318322271108627, -0.009038572199642658, -0.006758822128176689, -0.004479072988033295, -0.002199321985244751, 8.042808622121811e-05, 0.002360178157687187, 0.004639928229153156, 0.006919678300619125, 0.009199428372085094, 0.011479178443551064, 0.013758927583694458, 0.016038678586483, 0.018318429589271545, 0.02059817872941494, 0.022877927869558334, 0.025157678872346878, 0.027437429875135422, 0.029717179015278816, 0.03199692815542221, 0.034276679158210754, 0.0365564301609993, 0.03883618116378784, 0.04111592844128609, 0.04339567944407463, 0.045675430446863174, 0.04795517772436142, 0.05023492872714996, 0.05251467972993851, 0.05479443073272705, 0.057074181735515594, 0.05935392901301384, 0.06163368001580238, 0.06391342729330063, 0.06619317829608917, 0.06847292929887772, 0.07075268030166626]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 3.0, 17.0, 16.0, 27.0, 47.0, 64.0, 178.0, 365.0, 24806.0, 4167989.0, 334.0, 158.0, 78.0, 51.0, 31.0, 26.0, 10.0, 9.0, 10.0, 5.0, 7.0, 8.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.197021484375, -0.19024276733398438, -0.18346405029296875, -0.17668533325195312, -0.1699066162109375, -0.16312789916992188, -0.15634918212890625, -0.14957046508789062, -0.142791748046875, -0.13601303100585938, -0.12923431396484375, -0.12245559692382812, -0.1156768798828125, -0.10889816284179688, -0.10211944580078125, -0.09534072875976562, -0.08856201171875, -0.08178329467773438, -0.07500457763671875, -0.06822586059570312, -0.0614471435546875, -0.054668426513671875, -0.04788970947265625, -0.041110992431640625, -0.034332275390625, -0.027553558349609375, -0.02077484130859375, -0.013996124267578125, -0.0072174072265625, -0.000438690185546875, 0.00634002685546875, 0.013118743896484375, 0.0198974609375, 0.026676177978515625, 0.03345489501953125, 0.040233612060546875, 0.0470123291015625, 0.053791046142578125, 0.06056976318359375, 0.06734848022460938, 0.074127197265625, 0.08090591430664062, 0.08768463134765625, 0.09446334838867188, 0.1012420654296875, 0.10802078247070312, 0.11479949951171875, 0.12157821655273438, 0.12835693359375, 0.13513565063476562, 0.14191436767578125, 0.14869308471679688, 0.1554718017578125, 0.16225051879882812, 0.16902923583984375, 0.17580795288085938, 0.182586669921875, 0.18936538696289062, 0.19614410400390625, 0.20292282104492188, 0.2097015380859375, 0.21648025512695312, 0.22325897216796875, 0.23003768920898438, 0.23681640625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 10.0, 11.0, 10.0, 27.0, 34.0, 91.0, 127.0, 187.0, 190.0, 108.0, 65.0, 34.0, 17.0, 13.0, 6.0, 9.0, 7.0, 6.0, 4.0, 3.0, 7.0, 2.0, 2.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007343292236328125, -0.007091224193572998, -0.006839156150817871, -0.006587088108062744, -0.006335020065307617, -0.00608295202255249, -0.005830883979797363, -0.005578815937042236, -0.005326747894287109, -0.005074679851531982, -0.0048226118087768555, -0.0045705437660217285, -0.0043184757232666016, -0.004066407680511475, -0.0038143396377563477, -0.0035622715950012207, -0.0033102035522460938, -0.003058135509490967, -0.00280606746673584, -0.002553999423980713, -0.002301931381225586, -0.002049863338470459, -0.001797795295715332, -0.001545727252960205, -0.0012936592102050781, -0.0010415911674499512, -0.0007895231246948242, -0.0005374550819396973, -0.0002853870391845703, -3.331899642944336e-05, 0.0002187490463256836, 0.00047081708908081055, 0.0007228851318359375, 0.0009749531745910645, 0.0012270212173461914, 0.0014790892601013184, 0.0017311573028564453, 0.0019832253456115723, 0.0022352933883666992, 0.002487361431121826, 0.002739429473876953, 0.00299149751663208, 0.003243565559387207, 0.003495633602142334, 0.003747701644897461, 0.003999769687652588, 0.004251837730407715, 0.004503905773162842, 0.004755973815917969, 0.005008041858673096, 0.005260109901428223, 0.00551217794418335, 0.0057642459869384766, 0.0060163140296936035, 0.0062683820724487305, 0.006520450115203857, 0.006772518157958984, 0.007024586200714111, 0.007276654243469238, 0.007528722286224365, 0.007780790328979492, 0.00803285837173462, 0.008284926414489746, 0.008536994457244873, 0.0087890625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 10.0, 13.0, 23.0, 30.0, 44.0, 78.0, 121.0, 227.0, 361.0, 668.0, 1237.0, 2546.0, 5282.0, 13430.0, 44260.0, 813420.0, 3219677.0, 62861.0, 16543.0, 6500.0, 3004.0, 1545.0, 896.0, 551.0, 319.0, 210.0, 143.0, 91.0, 58.0, 40.0, 27.0, 20.0, 17.0, 9.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.008575439453125, -0.008331239223480225, -0.00808703899383545, -0.007842838764190674, -0.0075986385345458984, -0.007354438304901123, -0.007110238075256348, -0.006866037845611572, -0.006621837615966797, -0.0063776373863220215, -0.006133437156677246, -0.005889236927032471, -0.005645036697387695, -0.00540083646774292, -0.0051566362380981445, -0.004912436008453369, -0.004668235778808594, -0.004424035549163818, -0.004179835319519043, -0.003935635089874268, -0.003691434860229492, -0.003447234630584717, -0.0032030344009399414, -0.002958834171295166, -0.0027146339416503906, -0.0024704337120056152, -0.00222623348236084, -0.0019820332527160645, -0.001737833023071289, -0.0014936327934265137, -0.0012494325637817383, -0.0010052323341369629, -0.0007610321044921875, -0.0005168318748474121, -0.0002726316452026367, -2.8431415557861328e-05, 0.00021576881408691406, 0.00045996904373168945, 0.0007041692733764648, 0.0009483695030212402, 0.0011925697326660156, 0.001436769962310791, 0.0016809701919555664, 0.0019251704216003418, 0.002169370651245117, 0.0024135708808898926, 0.002657771110534668, 0.0029019713401794434, 0.0031461715698242188, 0.003390371799468994, 0.0036345720291137695, 0.003878772258758545, 0.00412297248840332, 0.004367172718048096, 0.004611372947692871, 0.0048555731773376465, 0.005099773406982422, 0.005343973636627197, 0.005588173866271973, 0.005832374095916748, 0.0060765743255615234, 0.006320774555206299, 0.006564974784851074, 0.00680917501449585, 0.007053375244140625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 1.0, 2.0, 7.0, 5.0, 6.0, 7.0, 7.0, 14.0, 16.0, 19.0, 22.0, 37.0, 52.0, 131.0, 368.0, 1107.0, 1390.0, 501.0, 172.0, 58.0, 27.0, 22.0, 18.0, 21.0, 5.0, 11.0, 8.0, 8.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007122039794921875, -0.0068686604499816895, -0.006615281105041504, -0.006361901760101318, -0.006108522415161133, -0.005855143070220947, -0.005601763725280762, -0.005348384380340576, -0.005095005035400391, -0.004841625690460205, -0.0045882463455200195, -0.004334867000579834, -0.0040814876556396484, -0.003828108310699463, -0.0035747289657592773, -0.003321349620819092, -0.0030679702758789062, -0.0028145909309387207, -0.002561211585998535, -0.0023078322410583496, -0.002054452896118164, -0.0018010735511779785, -0.001547694206237793, -0.0012943148612976074, -0.0010409355163574219, -0.0007875561714172363, -0.0005341768264770508, -0.00028079748153686523, -2.7418136596679688e-05, 0.00022596120834350586, 0.0004793405532836914, 0.000732719898223877, 0.0009860992431640625, 0.001239478588104248, 0.0014928579330444336, 0.0017462372779846191, 0.0019996166229248047, 0.0022529959678649902, 0.0025063753128051758, 0.0027597546577453613, 0.003013134002685547, 0.0032665133476257324, 0.003519892692565918, 0.0037732720375061035, 0.004026651382446289, 0.004280030727386475, 0.00453341007232666, 0.004786789417266846, 0.005040168762207031, 0.005293548107147217, 0.005546927452087402, 0.005800306797027588, 0.0060536861419677734, 0.006307065486907959, 0.0065604448318481445, 0.00681382417678833, 0.007067203521728516, 0.007320582866668701, 0.007573962211608887, 0.007827341556549072, 0.008080720901489258, 0.008334100246429443, 0.008587479591369629, 0.008840858936309814, 0.00909423828125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 9.0, 7.0, 15.0, 47.0, 85.0, 205.0, 257.0, 157.0, 78.0, 53.0, 32.0, 10.0, 19.0, 16.0, 4.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0763329565525055, -0.07402196526527405, -0.0717109739780426, -0.06939999014139175, -0.06708899885416031, -0.06477800756692886, -0.06246701627969742, -0.06015602499246597, -0.057845037430524826, -0.05553404614329338, -0.053223058581352234, -0.05091206729412079, -0.04860107600688934, -0.046290088444948196, -0.04397909715771675, -0.041668109595775604, -0.03935711830854416, -0.037046127021312714, -0.03473513945937157, -0.03242414817214012, -0.030113158747553825, -0.02780216932296753, -0.025491178035736084, -0.023180188611149788, -0.020869199186563492, -0.018558209761977196, -0.0162472203373909, -0.013936229050159454, -0.011625239625573158, -0.009314250200986862, -0.0070032598450779915, -0.004692269489169121, -0.002381272614002228, -7.02827237546444e-05, 0.002240707166492939, 0.004551697056740522, 0.006862686946988106, 0.009173676371574402, 0.011484666727483273, 0.013795657083392143, 0.01610664650797844, 0.018417635932564735, 0.02072862535715103, 0.023039616644382477, 0.025350606068968773, 0.02766159549355507, 0.029972586780786514, 0.03228357434272766, 0.034594565629959106, 0.03690555691719055, 0.0392165444791317, 0.041527535766363144, 0.04383852332830429, 0.046149514615535736, 0.04846050590276718, 0.05077149718999863, 0.053082484751939774, 0.05539347603917122, 0.057704463601112366, 0.06001545488834381, 0.062326446175575256, 0.0646374374628067, 0.06694842129945755, 0.069259412586689, 0.07157040387392044]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 10.0, 6.0, 11.0, 7.0, 17.0, 18.0, 20.0, 11.0, 23.0, 33.0, 30.0, 41.0, 35.0, 49.0, 60.0, 49.0, 55.0, 48.0, 64.0, 57.0, 48.0, 38.0, 35.0, 46.0, 33.0, 24.0, 26.0, 29.0, 16.0, 11.0, 13.0, 10.0, 8.0, 6.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031122207641601562, -0.0300825834274292, -0.029042961075901985, -0.02800333872437477, -0.026963714510202408, -0.025924090296030045, -0.02488446794450283, -0.023844845592975616, -0.022805221378803253, -0.02176559716463089, -0.020725974813103676, -0.019686352461576462, -0.0186467282474041, -0.017607104033231735, -0.01656748168170452, -0.015527858398854733, -0.014488235116004944, -0.013448611833155155, -0.012408988550305367, -0.011369365267455578, -0.01032974198460579, -0.009290118701756, -0.008250495418906212, -0.007210872136056423, -0.0061712488532066345, -0.005131625570356846, -0.004092002287507057, -0.0030523790046572685, -0.00201275572180748, -0.0009731324389576912, 6.649084389209747e-05, 0.0011061141267418861, 0.002145737409591675, 0.0031853606924414635, 0.004224983975291252, 0.005264607258141041, 0.0063042305409908295, 0.007343853823840618, 0.008383477106690407, 0.009423100389540195, 0.010462723672389984, 0.011502346955239773, 0.012541970238089561, 0.01358159352093935, 0.014621216803789139, 0.015660841017961502, 0.016700463369488716, 0.01774008572101593, 0.018779709935188293, 0.019819334149360657, 0.02085895650088787, 0.021898578852415085, 0.022938203066587448, 0.02397782728075981, 0.025017449632287025, 0.02605707198381424, 0.027096696197986603, 0.028136320412158966, 0.02917594276368618, 0.030215565115213394, 0.03125518932938576, 0.03229481354355812, 0.033334434032440186, 0.03437405824661255, 0.03541368246078491]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 7.0, 8.0, 11.0, 9.0, 20.0, 29.0, 34.0, 49.0, 80.0, 85.0, 134.0, 188.0, 260.0, 408.0, 616.0, 950.0, 1478.0, 2593.0, 4866.0, 10977.0, 32896.0, 297758.0, 619453.0, 48792.0, 13367.0, 5621.0, 2880.0, 1720.0, 1054.0, 643.0, 462.0, 307.0, 220.0, 149.0, 120.0, 75.0, 65.0, 45.0, 34.0, 22.0, 25.0, 9.0, 5.0, 13.0, 4.0, 8.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01190948486328125, -0.01150059700012207, -0.01109170913696289, -0.010682821273803711, -0.010273933410644531, -0.009865045547485352, -0.009456157684326172, -0.009047269821166992, -0.008638381958007812, -0.008229494094848633, -0.007820606231689453, -0.0074117183685302734, -0.007002830505371094, -0.006593942642211914, -0.006185054779052734, -0.005776166915893555, -0.005367279052734375, -0.004958391189575195, -0.004549503326416016, -0.004140615463256836, -0.0037317276000976562, -0.0033228397369384766, -0.002913951873779297, -0.002505064010620117, -0.0020961761474609375, -0.0016872882843017578, -0.0012784004211425781, -0.0008695125579833984, -0.00046062469482421875, -5.173683166503906e-05, 0.0003571510314941406, 0.0007660388946533203, 0.0011749267578125, 0.0015838146209716797, 0.0019927024841308594, 0.002401590347290039, 0.0028104782104492188, 0.0032193660736083984, 0.003628253936767578, 0.004037141799926758, 0.0044460296630859375, 0.004854917526245117, 0.005263805389404297, 0.0056726932525634766, 0.006081581115722656, 0.006490468978881836, 0.006899356842041016, 0.007308244705200195, 0.007717132568359375, 0.008126020431518555, 0.008534908294677734, 0.008943796157836914, 0.009352684020996094, 0.009761571884155273, 0.010170459747314453, 0.010579347610473633, 0.010988235473632812, 0.011397123336791992, 0.011806011199951172, 0.012214899063110352, 0.012623786926269531, 0.013032674789428711, 0.01344156265258789, 0.01385045051574707, 0.01425933837890625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 6.0, 8.0, 16.0, 22.0, 52.0, 85.0, 136.0, 173.0, 153.0, 139.0, 77.0, 37.0, 12.0, 12.0, 8.0, 6.0, 7.0, 6.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007404327392578125, -0.007149875164031982, -0.00689542293548584, -0.006640970706939697, -0.006386518478393555, -0.006132066249847412, -0.0058776140213012695, -0.005623161792755127, -0.005368709564208984, -0.005114257335662842, -0.004859805107116699, -0.004605352878570557, -0.004350900650024414, -0.0040964484214782715, -0.003841996192932129, -0.0035875439643859863, -0.0033330917358398438, -0.003078639507293701, -0.0028241872787475586, -0.002569735050201416, -0.0023152828216552734, -0.002060830593109131, -0.0018063783645629883, -0.0015519261360168457, -0.0012974739074707031, -0.0010430216789245605, -0.000788569450378418, -0.0005341172218322754, -0.0002796649932861328, -2.5212764739990234e-05, 0.00022923946380615234, 0.0004836916923522949, 0.0007381439208984375, 0.00099259614944458, 0.0012470483779907227, 0.0015015006065368652, 0.0017559528350830078, 0.0020104050636291504, 0.002264857292175293, 0.0025193095207214355, 0.002773761749267578, 0.0030282139778137207, 0.0032826662063598633, 0.003537118434906006, 0.0037915706634521484, 0.004046022891998291, 0.004300475120544434, 0.004554927349090576, 0.004809379577636719, 0.005063831806182861, 0.005318284034729004, 0.0055727362632751465, 0.005827188491821289, 0.006081640720367432, 0.006336092948913574, 0.006590545177459717, 0.006844997406005859, 0.007099449634552002, 0.0073539018630981445, 0.007608354091644287, 0.00786280632019043, 0.008117258548736572, 0.008371710777282715, 0.008626163005828857, 0.008880615234375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 10.0, 3.0, 9.0, 8.0, 6.0, 9.0, 13.0, 29.0, 34.0, 55.0, 73.0, 93.0, 123.0, 174.0, 261.0, 362.0, 532.0, 958.0, 1805.0, 3726.0, 9992.0, 38042.0, 259903.0, 629901.0, 75074.0, 16282.0, 5278.0, 2407.0, 1221.0, 700.0, 439.0, 306.0, 186.0, 140.0, 106.0, 72.0, 61.0, 46.0, 18.0, 17.0, 20.0, 14.0, 11.0, 9.0, 6.0, 12.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.01168060302734375, -0.011339068412780762, -0.010997533798217773, -0.010655999183654785, -0.010314464569091797, -0.009972929954528809, -0.00963139533996582, -0.009289860725402832, -0.008948326110839844, -0.008606791496276855, -0.008265256881713867, -0.007923722267150879, -0.007582187652587891, -0.007240653038024902, -0.006899118423461914, -0.006557583808898926, -0.0062160491943359375, -0.005874514579772949, -0.005532979965209961, -0.005191445350646973, -0.004849910736083984, -0.004508376121520996, -0.004166841506958008, -0.0038253068923950195, -0.0034837722778320312, -0.003142237663269043, -0.0028007030487060547, -0.0024591684341430664, -0.002117633819580078, -0.0017760992050170898, -0.0014345645904541016, -0.0010930299758911133, -0.000751495361328125, -0.0004099607467651367, -6.842613220214844e-05, 0.00027310848236083984, 0.0006146430969238281, 0.0009561777114868164, 0.0012977123260498047, 0.001639246940612793, 0.0019807815551757812, 0.0023223161697387695, 0.002663850784301758, 0.003005385398864746, 0.0033469200134277344, 0.0036884546279907227, 0.004029989242553711, 0.004371523857116699, 0.0047130584716796875, 0.005054593086242676, 0.005396127700805664, 0.005737662315368652, 0.006079196929931641, 0.006420731544494629, 0.006762266159057617, 0.0071038007736206055, 0.007445335388183594, 0.007786870002746582, 0.00812840461730957, 0.008469939231872559, 0.008811473846435547, 0.009153008460998535, 0.009494543075561523, 0.009836077690124512, 0.0101776123046875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 2.0, 12.0, 13.0, 15.0, 22.0, 28.0, 23.0, 27.0, 23.0, 25.0, 51.0, 37.0, 46.0, 45.0, 55.0, 42.0, 53.0, 40.0, 44.0, 41.0, 36.0, 33.0, 39.0, 47.0, 31.0, 29.0, 19.0, 21.0, 18.0, 14.0, 13.0, 14.0, 4.0, 4.0, 3.0, 5.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.016937255859375, -0.016460657119750977, -0.015984058380126953, -0.01550745964050293, -0.015030860900878906, -0.014554262161254883, -0.01407766342163086, -0.013601064682006836, -0.013124465942382812, -0.012647867202758789, -0.012171268463134766, -0.011694669723510742, -0.011218070983886719, -0.010741472244262695, -0.010264873504638672, -0.009788274765014648, -0.009311676025390625, -0.008835077285766602, -0.008358478546142578, -0.007881879806518555, -0.007405281066894531, -0.006928682327270508, -0.006452083587646484, -0.005975484848022461, -0.0054988861083984375, -0.005022287368774414, -0.004545688629150391, -0.004069089889526367, -0.0035924911499023438, -0.0031158924102783203, -0.002639293670654297, -0.0021626949310302734, -0.00168609619140625, -0.0012094974517822266, -0.0007328987121582031, -0.0002562999725341797, 0.00022029876708984375, 0.0006968975067138672, 0.0011734962463378906, 0.001650094985961914, 0.0021266937255859375, 0.002603292465209961, 0.0030798912048339844, 0.003556489944458008, 0.004033088684082031, 0.004509687423706055, 0.004986286163330078, 0.0054628849029541016, 0.005939483642578125, 0.0064160823822021484, 0.006892681121826172, 0.007369279861450195, 0.007845878601074219, 0.008322477340698242, 0.008799076080322266, 0.009275674819946289, 0.009752273559570312, 0.010228872299194336, 0.01070547103881836, 0.011182069778442383, 0.011658668518066406, 0.01213526725769043, 0.012611865997314453, 0.013088464736938477, 0.0135650634765625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 5.0, 11.0, 7.0, 13.0, 17.0, 18.0, 46.0, 63.0, 123.0, 216.0, 490.0, 1072.0, 2793.0, 8046.0, 40662.0, 840008.0, 133517.0, 14357.0, 4132.0, 1614.0, 650.0, 312.0, 132.0, 85.0, 49.0, 38.0, 14.0, 18.0, 11.0, 12.0, 5.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0029125213623046875, -0.002826124429702759, -0.00273972749710083, -0.0026533305644989014, -0.0025669336318969727, -0.002480536699295044, -0.0023941397666931152, -0.0023077428340911865, -0.002221345901489258, -0.002134948968887329, -0.0020485520362854004, -0.0019621551036834717, -0.001875758171081543, -0.0017893612384796143, -0.0017029643058776855, -0.0016165673732757568, -0.0015301704406738281, -0.0014437735080718994, -0.0013573765754699707, -0.001270979642868042, -0.0011845827102661133, -0.0010981857776641846, -0.0010117888450622559, -0.0009253919124603271, -0.0008389949798583984, -0.0007525980472564697, -0.000666201114654541, -0.0005798041820526123, -0.0004934072494506836, -0.0004070103168487549, -0.00032061338424682617, -0.00023421645164489746, -0.00014781951904296875, -6.142258644104004e-05, 2.4974346160888672e-05, 0.00011137127876281738, 0.0001977682113647461, 0.0002841651439666748, 0.0003705620765686035, 0.0004569590091705322, 0.0005433559417724609, 0.0006297528743743896, 0.0007161498069763184, 0.0008025467395782471, 0.0008889436721801758, 0.0009753406047821045, 0.0010617375373840332, 0.001148134469985962, 0.0012345314025878906, 0.0013209283351898193, 0.001407325267791748, 0.0014937222003936768, 0.0015801191329956055, 0.0016665160655975342, 0.0017529129981994629, 0.0018393099308013916, 0.0019257068634033203, 0.002012103796005249, 0.0020985007286071777, 0.0021848976612091064, 0.002271294593811035, 0.002357691526412964, 0.0024440884590148926, 0.0025304853916168213, 0.00261688232421875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 2.0, 6.0, 4.0, 9.0, 4.0, 7.0, 13.0, 17.0, 12.0, 8.0, 23.0, 22.0, 13.0, 45.0, 19.0, 24.0, 32.0, 42.0, 49.0, 26.0, 42.0, 50.0, 19.0, 46.0, 44.0, 51.0, 21.0, 54.0, 42.0, 13.0, 37.0, 37.0, 20.0, 28.0, 18.0, 25.0, 12.0, 11.0, 10.0, 6.0, 14.0, 3.0, 2.0, 4.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-3.4570693969726562e-06, -3.355555236339569e-06, -3.254041075706482e-06, -3.1525269150733948e-06, -3.0510127544403076e-06, -2.9494985938072205e-06, -2.8479844331741333e-06, -2.746470272541046e-06, -2.644956111907959e-06, -2.543441951274872e-06, -2.4419277906417847e-06, -2.3404136300086975e-06, -2.2388994693756104e-06, -2.137385308742523e-06, -2.035871148109436e-06, -1.934356987476349e-06, -1.8328428268432617e-06, -1.7313286662101746e-06, -1.6298145055770874e-06, -1.5283003449440002e-06, -1.426786184310913e-06, -1.325272023677826e-06, -1.2237578630447388e-06, -1.1222437024116516e-06, -1.0207295417785645e-06, -9.192153811454773e-07, -8.177012205123901e-07, -7.16187059879303e-07, -6.146728992462158e-07, -5.131587386131287e-07, -4.116445779800415e-07, -3.1013041734695435e-07, -2.086162567138672e-07, -1.0710209608078003e-07, -5.587935447692871e-09, 9.592622518539429e-08, 1.9744038581848145e-07, 2.989545464515686e-07, 4.0046870708465576e-07, 5.019828677177429e-07, 6.034970283508301e-07, 7.050111889839172e-07, 8.065253496170044e-07, 9.080395102500916e-07, 1.0095536708831787e-06, 1.1110678315162659e-06, 1.212581992149353e-06, 1.3140961527824402e-06, 1.4156103134155273e-06, 1.5171244740486145e-06, 1.6186386346817017e-06, 1.7201527953147888e-06, 1.821666955947876e-06, 1.923181116580963e-06, 2.0246952772140503e-06, 2.1262094378471375e-06, 2.2277235984802246e-06, 2.3292377591133118e-06, 2.430751919746399e-06, 2.532266080379486e-06, 2.6337802410125732e-06, 2.7352944016456604e-06, 2.8368085622787476e-06, 2.9383227229118347e-06, 3.039836883544922e-06]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 8.0, 5.0, 6.0, 16.0, 14.0, 30.0, 47.0, 52.0, 78.0, 128.0, 190.0, 294.0, 614.0, 1287.0, 3043.0, 9196.0, 47904.0, 810208.0, 150891.0, 16280.0, 4482.0, 1810.0, 822.0, 397.0, 301.0, 130.0, 92.0, 58.0, 45.0, 29.0, 34.0, 16.0, 13.0, 8.0, 9.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00278472900390625, -0.0027067363262176514, -0.0026287436485290527, -0.002550750970840454, -0.0024727582931518555, -0.002394765615463257, -0.002316772937774658, -0.0022387802600860596, -0.002160787582397461, -0.0020827949047088623, -0.0020048022270202637, -0.001926809549331665, -0.0018488168716430664, -0.0017708241939544678, -0.0016928315162658691, -0.0016148388385772705, -0.0015368461608886719, -0.0014588534832000732, -0.0013808608055114746, -0.001302868127822876, -0.0012248754501342773, -0.0011468827724456787, -0.00106889009475708, -0.0009908974170684814, -0.0009129047393798828, -0.0008349120616912842, -0.0007569193840026855, -0.0006789267063140869, -0.0006009340286254883, -0.0005229413509368896, -0.000444948673248291, -0.0003669559955596924, -0.00028896331787109375, -0.00021097064018249512, -0.00013297796249389648, -5.498528480529785e-05, 2.300739288330078e-05, 0.00010100007057189941, 0.00017899274826049805, 0.0002569854259490967, 0.0003349781036376953, 0.00041297078132629395, 0.0004909634590148926, 0.0005689561367034912, 0.0006469488143920898, 0.0007249414920806885, 0.0008029341697692871, 0.0008809268474578857, 0.0009589195251464844, 0.001036912202835083, 0.0011149048805236816, 0.0011928975582122803, 0.001270890235900879, 0.0013488829135894775, 0.0014268755912780762, 0.0015048682689666748, 0.0015828609466552734, 0.001660853624343872, 0.0017388463020324707, 0.0018168389797210693, 0.001894831657409668, 0.0019728243350982666, 0.0020508170127868652, 0.002128809690475464, 0.0022068023681640625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 7.0, 0.0, 4.0, 11.0, 8.0, 4.0, 13.0, 22.0, 30.0, 40.0, 49.0, 107.0, 105.0, 104.0, 116.0, 97.0, 79.0, 57.0, 41.0, 28.0, 16.0, 17.0, 14.0, 8.0, 6.0, 3.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032978057861328125, -0.0032031238079071045, -0.0031084418296813965, -0.0030137598514556885, -0.0029190778732299805, -0.0028243958950042725, -0.0027297139167785645, -0.0026350319385528564, -0.0025403499603271484, -0.0024456679821014404, -0.0023509860038757324, -0.0022563040256500244, -0.0021616220474243164, -0.0020669400691986084, -0.0019722580909729004, -0.0018775761127471924, -0.0017828941345214844, -0.0016882121562957764, -0.0015935301780700684, -0.0014988481998443604, -0.0014041662216186523, -0.0013094842433929443, -0.0012148022651672363, -0.0011201202869415283, -0.0010254383087158203, -0.0009307563304901123, -0.0008360743522644043, -0.0007413923740386963, -0.0006467103958129883, -0.0005520284175872803, -0.00045734643936157227, -0.00036266446113586426, -0.00026798248291015625, -0.00017330050468444824, -7.861852645874023e-05, 1.6063451766967773e-05, 0.00011074542999267578, 0.0002054274082183838, 0.0003001093864440918, 0.0003947913646697998, 0.0004894733428955078, 0.0005841553211212158, 0.0006788372993469238, 0.0007735192775726318, 0.0008682012557983398, 0.0009628832340240479, 0.0010575652122497559, 0.0011522471904754639, 0.0012469291687011719, 0.0013416111469268799, 0.0014362931251525879, 0.001530975103378296, 0.001625657081604004, 0.001720339059829712, 0.00181502103805542, 0.001909703016281128, 0.002004384994506836, 0.002099066972732544, 0.002193748950958252, 0.00228843092918396, 0.002383112907409668, 0.002477794885635376, 0.002572476863861084, 0.002667158842086792, 0.0027618408203125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 4.0, 4.0, 23.0, 38.0, 152.0, 391.0, 231.0, 77.0, 42.0, 16.0, 11.0, 7.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10761038213968277, -0.10356015712022781, -0.09950992465019226, -0.0954596996307373, -0.09140946716070175, -0.0873592421412468, -0.08330900967121124, -0.07925878465175629, -0.07520855963230133, -0.07115833461284637, -0.06710810214281082, -0.06305787712335587, -0.05900764465332031, -0.054957419633865356, -0.0509071908891201, -0.04685696214437485, -0.042806729674339294, -0.03875650092959404, -0.034706272184848785, -0.03065604530274868, -0.026605816558003426, -0.02255558781325817, -0.018505360931158066, -0.014455132186412811, -0.010404903441667557, -0.0063546751625835896, -0.0023044468834996223, 0.0017457809299230576, 0.005796009674668312, 0.009846238419413567, 0.013896465301513672, 0.017946694046258926, 0.021996930241584778, 0.026047158986330032, 0.030097387731075287, 0.03414761275053024, 0.038197845220565796, 0.04224807024002075, 0.046298298984766006, 0.05034852772951126, 0.054398756474256516, 0.05844898521900177, 0.062499213963747025, 0.06654944270849228, 0.07059966772794724, 0.07464990019798279, 0.07870012521743774, 0.0827503502368927, 0.08680058270692825, 0.09085080772638321, 0.09490104019641876, 0.09895126521587372, 0.10300149768590927, 0.10705172270536423, 0.11110195517539978, 0.11515218019485474, 0.11920240521430969, 0.12325263023376465, 0.1273028552532196, 0.13135309517383575, 0.1354033201932907, 0.13945354521274567, 0.14350377023220062, 0.14755401015281677, 0.15160423517227173]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 4.0, 7.0, 3.0, 4.0, 7.0, 13.0, 10.0, 13.0, 11.0, 15.0, 12.0, 20.0, 18.0, 22.0, 28.0, 31.0, 35.0, 37.0, 40.0, 39.0, 50.0, 60.0, 66.0, 61.0, 53.0, 38.0, 36.0, 41.0, 31.0, 20.0, 24.0, 24.0, 21.0, 16.0, 19.0, 10.0, 14.0, 14.0, 5.0, 7.0, 3.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056395113468170166, -0.05458729341626167, -0.05277947336435318, -0.050971657037734985, -0.04916383698582649, -0.047356016933918, -0.045548200607299805, -0.04374038055539131, -0.04193256050348282, -0.040124740451574326, -0.03831692039966583, -0.03650910407304764, -0.034701284021139145, -0.03289346396923065, -0.031085645779967308, -0.029277827590703964, -0.02747000753879547, -0.025662187486886978, -0.023854369297623634, -0.02204655110836029, -0.020238731056451797, -0.018430911004543304, -0.01662309281527996, -0.014815273694694042, -0.013007454574108124, -0.011199635453522205, -0.009391816332936287, -0.0075839972123503685, -0.00577617809176445, -0.003968358971178532, -0.0021605398505926132, -0.0003527207300066948, 0.0014550983905792236, 0.003262917511165142, 0.0050707366317510605, 0.006878555752336979, 0.008686374872922897, 0.010494193993508816, 0.012302013114094734, 0.014109832234680653, 0.01591765135526657, 0.017725471407175064, 0.019533289596438408, 0.02134110778570175, 0.023148927837610245, 0.024956747889518738, 0.02676456607878208, 0.028572384268045425, 0.03038020431995392, 0.03218802437186241, 0.033995844423770905, 0.0358036607503891, 0.03761148080229759, 0.039419300854206085, 0.04122711718082428, 0.04303493723273277, 0.044842757284641266, 0.04665057733654976, 0.04845839738845825, 0.05026621371507645, 0.05207403376698494, 0.05388185381889343, 0.05568967014551163, 0.05749749019742012, 0.05930531024932861]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 9.0, 16.0, 25.0, 36.0, 49.0, 94.0, 212.0, 568.0, 1558.0, 4551.0, 16145.0, 87498.0, 1683851.0, 2298952.0, 80493.0, 14010.0, 3870.0, 1354.0, 492.0, 196.0, 106.0, 64.0, 42.0, 28.0, 21.0, 10.0, 4.0, 8.0, 6.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004486083984375, -0.004331529140472412, -0.004176974296569824, -0.004022419452667236, -0.0038678646087646484, -0.0037133097648620605, -0.0035587549209594727, -0.0034042000770568848, -0.003249645233154297, -0.003095090389251709, -0.002940535545349121, -0.002785980701446533, -0.0026314258575439453, -0.0024768710136413574, -0.0023223161697387695, -0.0021677613258361816, -0.0020132064819335938, -0.0018586516380310059, -0.001704096794128418, -0.00154954195022583, -0.0013949871063232422, -0.0012404322624206543, -0.0010858774185180664, -0.0009313225746154785, -0.0007767677307128906, -0.0006222128868103027, -0.00046765804290771484, -0.00031310319900512695, -0.00015854835510253906, -3.993511199951172e-06, 0.00015056133270263672, 0.0003051161766052246, 0.0004596710205078125, 0.0006142258644104004, 0.0007687807083129883, 0.0009233355522155762, 0.001077890396118164, 0.001232445240020752, 0.0013870000839233398, 0.0015415549278259277, 0.0016961097717285156, 0.0018506646156311035, 0.0020052194595336914, 0.0021597743034362793, 0.002314329147338867, 0.002468883991241455, 0.002623438835144043, 0.002777993679046631, 0.0029325485229492188, 0.0030871033668518066, 0.0032416582107543945, 0.0033962130546569824, 0.0035507678985595703, 0.003705322742462158, 0.003859877586364746, 0.004014432430267334, 0.004168987274169922, 0.00432354211807251, 0.004478096961975098, 0.0046326518058776855, 0.0047872066497802734, 0.004941761493682861, 0.005096316337585449, 0.005250871181488037, 0.005405426025390625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 9.0, 11.0, 28.0, 46.0, 58.0, 79.0, 106.0, 140.0, 129.0, 108.0, 86.0, 46.0, 40.0, 34.0, 20.0, 8.0, 10.0, 10.0, 8.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007427215576171875, -0.007173478603363037, -0.006919741630554199, -0.006666004657745361, -0.0064122676849365234, -0.0061585307121276855, -0.005904793739318848, -0.00565105676651001, -0.005397319793701172, -0.005143582820892334, -0.004889845848083496, -0.004636108875274658, -0.00438237190246582, -0.004128634929656982, -0.0038748979568481445, -0.0036211609840393066, -0.0033674240112304688, -0.003113687038421631, -0.002859950065612793, -0.002606213092803955, -0.002352476119995117, -0.0020987391471862793, -0.0018450021743774414, -0.0015912652015686035, -0.0013375282287597656, -0.0010837912559509277, -0.0008300542831420898, -0.000576317310333252, -0.00032258033752441406, -6.884336471557617e-05, 0.00018489360809326172, 0.0004386305809020996, 0.0006923675537109375, 0.0009461045265197754, 0.0011998414993286133, 0.0014535784721374512, 0.001707315444946289, 0.001961052417755127, 0.002214789390563965, 0.0024685263633728027, 0.0027222633361816406, 0.0029760003089904785, 0.0032297372817993164, 0.0034834742546081543, 0.003737211227416992, 0.00399094820022583, 0.004244685173034668, 0.004498422145843506, 0.004752159118652344, 0.005005896091461182, 0.0052596330642700195, 0.005513370037078857, 0.005767107009887695, 0.006020843982696533, 0.006274580955505371, 0.006528317928314209, 0.006782054901123047, 0.007035791873931885, 0.007289528846740723, 0.0075432658195495605, 0.0077970027923583984, 0.008050739765167236, 0.008304476737976074, 0.008558213710784912, 0.00881195068359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 10.0, 14.0, 15.0, 23.0, 45.0, 70.0, 128.0, 224.0, 398.0, 840.0, 1920.0, 5238.0, 17486.0, 90010.0, 3655546.0, 374765.0, 31616.0, 9429.0, 3482.0, 1412.0, 686.0, 339.0, 183.0, 135.0, 92.0, 65.0, 37.0, 23.0, 14.0, 10.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0050811767578125, -0.004915714263916016, -0.004750251770019531, -0.004584789276123047, -0.0044193267822265625, -0.004253864288330078, -0.004088401794433594, -0.003922939300537109, -0.003757476806640625, -0.0035920143127441406, -0.0034265518188476562, -0.003261089324951172, -0.0030956268310546875, -0.002930164337158203, -0.0027647018432617188, -0.0025992393493652344, -0.00243377685546875, -0.0022683143615722656, -0.0021028518676757812, -0.0019373893737792969, -0.0017719268798828125, -0.0016064643859863281, -0.0014410018920898438, -0.0012755393981933594, -0.001110076904296875, -0.0009446144104003906, -0.0007791519165039062, -0.0006136894226074219, -0.0004482269287109375, -0.0002827644348144531, -0.00011730194091796875, 4.8160552978515625e-05, 0.000213623046875, 0.0003790855407714844, 0.0005445480346679688, 0.0007100105285644531, 0.0008754730224609375, 0.0010409355163574219, 0.0012063980102539062, 0.0013718605041503906, 0.001537322998046875, 0.0017027854919433594, 0.0018682479858398438, 0.002033710479736328, 0.0021991729736328125, 0.002364635467529297, 0.0025300979614257812, 0.0026955604553222656, 0.00286102294921875, 0.0030264854431152344, 0.0031919479370117188, 0.003357410430908203, 0.0035228729248046875, 0.003688335418701172, 0.0038537979125976562, 0.004019260406494141, 0.004184722900390625, 0.004350185394287109, 0.004515647888183594, 0.004681110382080078, 0.0048465728759765625, 0.005012035369873047, 0.005177497863769531, 0.005342960357666016, 0.0055084228515625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 5.0, 6.0, 8.0, 13.0, 19.0, 12.0, 26.0, 58.0, 136.0, 353.0, 960.0, 1305.0, 717.0, 235.0, 82.0, 35.0, 17.0, 11.0, 13.0, 10.0, 10.0, 7.0, 13.0, 3.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006290435791015625, -0.006067931652069092, -0.005845427513122559, -0.005622923374176025, -0.005400419235229492, -0.005177915096282959, -0.004955410957336426, -0.004732906818389893, -0.004510402679443359, -0.004287898540496826, -0.004065394401550293, -0.0038428902626037598, -0.0036203861236572266, -0.0033978819847106934, -0.00317537784576416, -0.002952873706817627, -0.0027303695678710938, -0.0025078654289245605, -0.0022853612899780273, -0.002062857151031494, -0.001840353012084961, -0.0016178488731384277, -0.0013953447341918945, -0.0011728405952453613, -0.0009503364562988281, -0.0007278323173522949, -0.0005053281784057617, -0.0002828240394592285, -6.031990051269531e-05, 0.0001621842384338379, 0.0003846883773803711, 0.0006071925163269043, 0.0008296966552734375, 0.0010522007942199707, 0.001274704933166504, 0.0014972090721130371, 0.0017197132110595703, 0.0019422173500061035, 0.0021647214889526367, 0.00238722562789917, 0.002609729766845703, 0.0028322339057922363, 0.0030547380447387695, 0.0032772421836853027, 0.003499746322631836, 0.003722250461578369, 0.003944754600524902, 0.0041672587394714355, 0.004389762878417969, 0.004612267017364502, 0.004834771156311035, 0.005057275295257568, 0.0052797794342041016, 0.005502283573150635, 0.005724787712097168, 0.005947291851043701, 0.006169795989990234, 0.006392300128936768, 0.006614804267883301, 0.006837308406829834, 0.007059812545776367, 0.0072823166847229, 0.007504820823669434, 0.007727324962615967, 0.0079498291015625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 10.0, 7.0, 34.0, 58.0, 140.0, 223.0, 236.0, 154.0, 57.0, 41.0, 9.0, 9.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046362124383449554, -0.04495404660701752, -0.04354596510529518, -0.042137887328863144, -0.04072980582714081, -0.03932172805070877, -0.03791365027427673, -0.036505572497844696, -0.03509749099612236, -0.03368941321969032, -0.03228133171796799, -0.03087325394153595, -0.029465174302458763, -0.028057094663381577, -0.02664901688694954, -0.025240937247872353, -0.023832857608795166, -0.02242477796971798, -0.021016698330640793, -0.019608620554208755, -0.01820054091513157, -0.016792461276054382, -0.01538438256829977, -0.013976303860545158, -0.012568224221467972, -0.011160144582390785, -0.009752065874636173, -0.008343987166881561, -0.006935907527804375, -0.005527828354388475, -0.004119749180972576, -0.002711670473217964, -0.0013035908341407776, 0.00010448833927512169, 0.001512567512691021, 0.0029206466861069202, 0.0043287258595228195, 0.005736805032938719, 0.007144884206354618, 0.00855296291410923, 0.009961042553186417, 0.011369122192263603, 0.012777200900018215, 0.014185279607772827, 0.015593359246850014, 0.0170014388859272, 0.018409516662359238, 0.019817596301436424, 0.02122567594051361, 0.022633755579590797, 0.024041835218667984, 0.02544991299510002, 0.026857992634177208, 0.028266072273254395, 0.029674150049686432, 0.03108222968876362, 0.032490309327840805, 0.03389838710427284, 0.03530646860599518, 0.036714546382427216, 0.03812262415885925, 0.03953070566058159, 0.040938783437013626, 0.04234686493873596, 0.043754942715168]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 8.0, 4.0, 7.0, 9.0, 11.0, 8.0, 8.0, 18.0, 17.0, 29.0, 31.0, 32.0, 31.0, 39.0, 39.0, 36.0, 46.0, 37.0, 51.0, 56.0, 47.0, 50.0, 47.0, 33.0, 40.0, 34.0, 44.0, 27.0, 24.0, 37.0, 17.0, 10.0, 9.0, 20.0, 7.0, 8.0, 6.0, 4.0, 5.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.023339927196502686, -0.022639479488134384, -0.021939033642411232, -0.02123858779668808, -0.02053814008831978, -0.019837692379951477, -0.019137246534228325, -0.018436800688505173, -0.01773635298013687, -0.01703590527176857, -0.016335459426045418, -0.015635013580322266, -0.014934565871953964, -0.014234119094908237, -0.01353367231786251, -0.012833225540816784, -0.012132778763771057, -0.01143233198672533, -0.010731885209679604, -0.010031438432633877, -0.00933099165558815, -0.008630544878542423, -0.007930098101496696, -0.00722965132445097, -0.006529204547405243, -0.005828757770359516, -0.005128310993313789, -0.004427864216268063, -0.003727417439222336, -0.003026970662176609, -0.0023265238851308823, -0.0016260771080851555, -0.0009256303310394287, -0.00022518355399370193, 0.00047526322305202484, 0.0011757100000977516, 0.0018761567771434784, 0.002576603554189205, 0.003277050331234932, 0.003977497108280659, 0.0046779438853263855, 0.005378390662372112, 0.006078837439417839, 0.006779284216463566, 0.007479730993509293, 0.00818017777055502, 0.008880624547600746, 0.009581071324646473, 0.0102815181016922, 0.010981964878737926, 0.011682411655783653, 0.01238285843282938, 0.013083305209875107, 0.013783751986920834, 0.01448419876396656, 0.015184645541012287, 0.015885092318058014, 0.016585540026426315, 0.017285985872149467, 0.01798643171787262, 0.01868687942624092, 0.019387327134609222, 0.020087772980332375, 0.020788218826055527, 0.021488666534423828]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 8.0, 9.0, 20.0, 26.0, 24.0, 40.0, 57.0, 84.0, 126.0, 201.0, 356.0, 593.0, 1006.0, 1925.0, 3839.0, 8772.0, 24460.0, 92561.0, 441373.0, 363249.0, 74155.0, 20746.0, 7617.0, 3453.0, 1582.0, 877.0, 525.0, 294.0, 196.0, 139.0, 79.0, 53.0, 20.0, 26.0, 20.0, 14.0, 7.0, 7.0, 2.0, 2.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0053863525390625, -0.00520634651184082, -0.005026340484619141, -0.004846334457397461, -0.004666328430175781, -0.0044863224029541016, -0.004306316375732422, -0.004126310348510742, -0.0039463043212890625, -0.003766298294067383, -0.003586292266845703, -0.0034062862396240234, -0.0032262802124023438, -0.003046274185180664, -0.0028662681579589844, -0.0026862621307373047, -0.002506256103515625, -0.0023262500762939453, -0.0021462440490722656, -0.001966238021850586, -0.0017862319946289062, -0.0016062259674072266, -0.0014262199401855469, -0.0012462139129638672, -0.0010662078857421875, -0.0008862018585205078, -0.0007061958312988281, -0.0005261898040771484, -0.00034618377685546875, -0.00016617774963378906, 1.3828277587890625e-05, 0.0001938343048095703, 0.00037384033203125, 0.0005538463592529297, 0.0007338523864746094, 0.0009138584136962891, 0.0010938644409179688, 0.0012738704681396484, 0.0014538764953613281, 0.0016338825225830078, 0.0018138885498046875, 0.001993894577026367, 0.002173900604248047, 0.0023539066314697266, 0.0025339126586914062, 0.002713918685913086, 0.0028939247131347656, 0.0030739307403564453, 0.003253936767578125, 0.0034339427947998047, 0.0036139488220214844, 0.003793954849243164, 0.003973960876464844, 0.0041539669036865234, 0.004333972930908203, 0.004513978958129883, 0.0046939849853515625, 0.004873991012573242, 0.005053997039794922, 0.0052340030670166016, 0.005414009094238281, 0.005594015121459961, 0.005774021148681641, 0.00595402717590332, 0.006134033203125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 8.0, 23.0, 34.0, 45.0, 76.0, 77.0, 122.0, 146.0, 121.0, 102.0, 70.0, 45.0, 33.0, 28.0, 15.0, 9.0, 7.0, 12.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00734710693359375, -0.007092714309692383, -0.006838321685791016, -0.0065839290618896484, -0.006329536437988281, -0.006075143814086914, -0.005820751190185547, -0.00556635856628418, -0.0053119659423828125, -0.005057573318481445, -0.004803180694580078, -0.004548788070678711, -0.004294395446777344, -0.0040400028228759766, -0.0037856101989746094, -0.003531217575073242, -0.003276824951171875, -0.003022432327270508, -0.0027680397033691406, -0.0025136470794677734, -0.0022592544555664062, -0.002004861831665039, -0.0017504692077636719, -0.0014960765838623047, -0.0012416839599609375, -0.0009872913360595703, -0.0007328987121582031, -0.00047850608825683594, -0.00022411346435546875, 3.0279159545898438e-05, 0.0002846717834472656, 0.0005390644073486328, 0.00079345703125, 0.0010478496551513672, 0.0013022422790527344, 0.0015566349029541016, 0.0018110275268554688, 0.002065420150756836, 0.002319812774658203, 0.0025742053985595703, 0.0028285980224609375, 0.0030829906463623047, 0.003337383270263672, 0.003591775894165039, 0.0038461685180664062, 0.0041005611419677734, 0.004354953765869141, 0.004609346389770508, 0.004863739013671875, 0.005118131637573242, 0.005372524261474609, 0.0056269168853759766, 0.005881309509277344, 0.006135702133178711, 0.006390094757080078, 0.006644487380981445, 0.0068988800048828125, 0.00715327262878418, 0.007407665252685547, 0.007662057876586914, 0.007916450500488281, 0.008170843124389648, 0.008425235748291016, 0.008679628372192383, 0.00893402099609375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 11.0, 5.0, 8.0, 9.0, 13.0, 20.0, 17.0, 24.0, 33.0, 55.0, 61.0, 89.0, 103.0, 154.0, 231.0, 298.0, 514.0, 821.0, 1668.0, 4014.0, 14785.0, 92369.0, 679633.0, 213660.0, 28349.0, 6279.0, 2154.0, 1079.0, 687.0, 395.0, 272.0, 202.0, 144.0, 86.0, 80.0, 67.0, 48.0, 31.0, 28.0, 18.0, 9.0, 8.0, 8.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.01020050048828125, -0.009914755821228027, -0.009629011154174805, -0.009343266487121582, -0.00905752182006836, -0.008771777153015137, -0.008486032485961914, -0.008200287818908691, -0.007914543151855469, -0.007628798484802246, -0.0073430538177490234, -0.007057309150695801, -0.006771564483642578, -0.0064858198165893555, -0.006200075149536133, -0.00591433048248291, -0.0056285858154296875, -0.005342841148376465, -0.005057096481323242, -0.0047713518142700195, -0.004485607147216797, -0.004199862480163574, -0.0039141178131103516, -0.003628373146057129, -0.0033426284790039062, -0.0030568838119506836, -0.002771139144897461, -0.0024853944778442383, -0.0021996498107910156, -0.001913905143737793, -0.0016281604766845703, -0.0013424158096313477, -0.001056671142578125, -0.0007709264755249023, -0.0004851818084716797, -0.00019943714141845703, 8.630752563476562e-05, 0.0003720521926879883, 0.0006577968597412109, 0.0009435415267944336, 0.0012292861938476562, 0.001515030860900879, 0.0018007755279541016, 0.0020865201950073242, 0.002372264862060547, 0.0026580095291137695, 0.002943754196166992, 0.003229498863220215, 0.0035152435302734375, 0.00380098819732666, 0.004086732864379883, 0.0043724775314331055, 0.004658222198486328, 0.004943966865539551, 0.0052297115325927734, 0.005515456199645996, 0.005801200866699219, 0.006086945533752441, 0.006372690200805664, 0.006658434867858887, 0.006944179534912109, 0.007229924201965332, 0.007515668869018555, 0.007801413536071777, 0.008087158203125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 7.0, 2.0, 4.0, 8.0, 7.0, 11.0, 9.0, 7.0, 9.0, 12.0, 17.0, 16.0, 24.0, 34.0, 33.0, 28.0, 34.0, 36.0, 36.0, 50.0, 48.0, 32.0, 45.0, 35.0, 47.0, 42.0, 41.0, 38.0, 40.0, 42.0, 28.0, 26.0, 26.0, 17.0, 21.0, 16.0, 11.0, 16.0, 13.0, 7.0, 5.0, 7.0, 4.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.013458251953125, -0.013055801391601562, -0.012653350830078125, -0.012250900268554688, -0.01184844970703125, -0.011445999145507812, -0.011043548583984375, -0.010641098022460938, -0.0102386474609375, -0.009836196899414062, -0.009433746337890625, -0.009031295776367188, -0.00862884521484375, -0.008226394653320312, -0.007823944091796875, -0.0074214935302734375, -0.00701904296875, -0.0066165924072265625, -0.006214141845703125, -0.0058116912841796875, -0.00540924072265625, -0.0050067901611328125, -0.004604339599609375, -0.0042018890380859375, -0.0037994384765625, -0.0033969879150390625, -0.002994537353515625, -0.0025920867919921875, -0.00218963623046875, -0.0017871856689453125, -0.001384735107421875, -0.0009822845458984375, -0.000579833984375, -0.0001773834228515625, 0.000225067138671875, 0.0006275177001953125, 0.00102996826171875, 0.0014324188232421875, 0.001834869384765625, 0.0022373199462890625, 0.0026397705078125, 0.0030422210693359375, 0.003444671630859375, 0.0038471221923828125, 0.00424957275390625, 0.0046520233154296875, 0.005054473876953125, 0.0054569244384765625, 0.005859375, 0.0062618255615234375, 0.006664276123046875, 0.0070667266845703125, 0.00746917724609375, 0.007871627807617188, 0.008274078369140625, 0.008676528930664062, 0.0090789794921875, 0.009481430053710938, 0.009883880615234375, 0.010286331176757812, 0.01068878173828125, 0.011091232299804688, 0.011493682861328125, 0.011896133422851562, 0.012298583984375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 9.0, 5.0, 11.0, 15.0, 18.0, 31.0, 32.0, 57.0, 77.0, 158.0, 304.0, 491.0, 1044.0, 2156.0, 5361.0, 16416.0, 68258.0, 506544.0, 358539.0, 63820.0, 15737.0, 5242.0, 2087.0, 967.0, 483.0, 254.0, 157.0, 104.0, 59.0, 40.0, 30.0, 15.0, 13.0, 11.0, 11.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001148223876953125, -0.0011071860790252686, -0.0010661482810974121, -0.0010251104831695557, -0.0009840726852416992, -0.0009430348873138428, -0.0009019970893859863, -0.0008609592914581299, -0.0008199214935302734, -0.000778883695602417, -0.0007378458976745605, -0.0006968080997467041, -0.0006557703018188477, -0.0006147325038909912, -0.0005736947059631348, -0.0005326569080352783, -0.0004916191101074219, -0.00045058131217956543, -0.000409543514251709, -0.00036850571632385254, -0.0003274679183959961, -0.00028643012046813965, -0.0002453923225402832, -0.00020435452461242676, -0.0001633167266845703, -0.00012227892875671387, -8.124113082885742e-05, -4.0203332901000977e-05, 8.344650268554688e-07, 4.1872262954711914e-05, 8.291006088256836e-05, 0.0001239478588104248, 0.00016498565673828125, 0.0002060234546661377, 0.00024706125259399414, 0.0002880990505218506, 0.00032913684844970703, 0.0003701746463775635, 0.0004112124443054199, 0.00045225024223327637, 0.0004932880401611328, 0.0005343258380889893, 0.0005753636360168457, 0.0006164014339447021, 0.0006574392318725586, 0.000698477029800415, 0.0007395148277282715, 0.0007805526256561279, 0.0008215904235839844, 0.0008626282215118408, 0.0009036660194396973, 0.0009447038173675537, 0.0009857416152954102, 0.0010267794132232666, 0.001067817211151123, 0.0011088550090789795, 0.001149892807006836, 0.0011909306049346924, 0.0012319684028625488, 0.0012730062007904053, 0.0013140439987182617, 0.0013550817966461182, 0.0013961195945739746, 0.001437157392501831, 0.0014781951904296875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 12.0, 9.0, 9.0, 16.0, 11.0, 12.0, 29.0, 20.0, 30.0, 27.0, 30.0, 47.0, 35.0, 60.0, 56.0, 41.0, 74.0, 45.0, 67.0, 75.0, 35.0, 56.0, 26.0, 39.0, 35.0, 20.0, 8.0, 14.0, 19.0, 7.0, 8.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5299530029296875e-06, -4.374422132968903e-06, -4.218891263008118e-06, -4.063360393047333e-06, -3.907829523086548e-06, -3.752298653125763e-06, -3.596767783164978e-06, -3.441236913204193e-06, -3.285706043243408e-06, -3.1301751732826233e-06, -2.9746443033218384e-06, -2.8191134333610535e-06, -2.6635825634002686e-06, -2.5080516934394836e-06, -2.3525208234786987e-06, -2.196989953517914e-06, -2.041459083557129e-06, -1.885928213596344e-06, -1.730397343635559e-06, -1.5748664736747742e-06, -1.4193356037139893e-06, -1.2638047337532043e-06, -1.1082738637924194e-06, -9.527429938316345e-07, -7.972121238708496e-07, -6.416812539100647e-07, -4.861503839492798e-07, -3.3061951398849487e-07, -1.7508864402770996e-07, -1.955777406692505e-08, 1.3597309589385986e-07, 2.915039658546448e-07, 4.470348358154297e-07, 6.025657057762146e-07, 7.580965757369995e-07, 9.136274456977844e-07, 1.0691583156585693e-06, 1.2246891856193542e-06, 1.3802200555801392e-06, 1.535750925540924e-06, 1.691281795501709e-06, 1.846812665462494e-06, 2.002343535423279e-06, 2.1578744053840637e-06, 2.3134052753448486e-06, 2.4689361453056335e-06, 2.6244670152664185e-06, 2.7799978852272034e-06, 2.9355287551879883e-06, 3.091059625148773e-06, 3.246590495109558e-06, 3.402121365070343e-06, 3.557652235031128e-06, 3.713183104991913e-06, 3.868713974952698e-06, 4.024244844913483e-06, 4.179775714874268e-06, 4.3353065848350525e-06, 4.490837454795837e-06, 4.646368324756622e-06, 4.801899194717407e-06, 4.957430064678192e-06, 5.112960934638977e-06, 5.268491804599762e-06, 5.424022674560547e-06]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 5.0, 9.0, 9.0, 19.0, 35.0, 36.0, 49.0, 73.0, 111.0, 200.0, 303.0, 526.0, 1106.0, 2675.0, 8850.0, 43072.0, 317762.0, 591945.0, 63822.0, 11787.0, 3329.0, 1261.0, 619.0, 350.0, 194.0, 126.0, 68.0, 55.0, 45.0, 39.0, 14.0, 12.0, 7.0, 12.0, 4.0, 7.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001293182373046875, -0.0012454688549041748, -0.0011977553367614746, -0.0011500418186187744, -0.0011023283004760742, -0.001054614782333374, -0.0010069012641906738, -0.0009591877460479736, -0.0009114742279052734, -0.0008637607097625732, -0.000816047191619873, -0.0007683336734771729, -0.0007206201553344727, -0.0006729066371917725, -0.0006251931190490723, -0.0005774796009063721, -0.0005297660827636719, -0.0004820525646209717, -0.0004343390464782715, -0.0003866255283355713, -0.0003389120101928711, -0.0002911984920501709, -0.0002434849739074707, -0.0001957714557647705, -0.0001480579376220703, -0.00010034441947937012, -5.263090133666992e-05, -4.9173831939697266e-06, 4.279613494873047e-05, 9.050965309143066e-05, 0.00013822317123413086, 0.00018593668937683105, 0.00023365020751953125, 0.00028136372566223145, 0.00032907724380493164, 0.00037679076194763184, 0.00042450428009033203, 0.0004722177982330322, 0.0005199313163757324, 0.0005676448345184326, 0.0006153583526611328, 0.000663071870803833, 0.0007107853889465332, 0.0007584989070892334, 0.0008062124252319336, 0.0008539259433746338, 0.000901639461517334, 0.0009493529796600342, 0.0009970664978027344, 0.0010447800159454346, 0.0010924935340881348, 0.001140207052230835, 0.0011879205703735352, 0.0012356340885162354, 0.0012833476066589355, 0.0013310611248016357, 0.001378774642944336, 0.0014264881610870361, 0.0014742016792297363, 0.0015219151973724365, 0.0015696287155151367, 0.001617342233657837, 0.0016650557518005371, 0.0017127692699432373, 0.0017604827880859375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 10.0, 11.0, 19.0, 19.0, 21.0, 34.0, 42.0, 64.0, 67.0, 72.0, 82.0, 93.0, 78.0, 84.0, 57.0, 57.0, 39.0, 34.0, 20.0, 21.0, 14.0, 13.0, 18.0, 3.0, 5.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002040863037109375, -0.00197407603263855, -0.0019072890281677246, -0.0018405020236968994, -0.0017737150192260742, -0.001706928014755249, -0.0016401410102844238, -0.0015733540058135986, -0.0015065670013427734, -0.0014397799968719482, -0.001372992992401123, -0.0013062059879302979, -0.0012394189834594727, -0.0011726319789886475, -0.0011058449745178223, -0.001039057970046997, -0.0009722709655761719, -0.0009054839611053467, -0.0008386969566345215, -0.0007719099521636963, -0.0007051229476928711, -0.0006383359432220459, -0.0005715489387512207, -0.0005047619342803955, -0.0004379749298095703, -0.0003711879253387451, -0.0003044009208679199, -0.00023761391639709473, -0.00017082691192626953, -0.00010403990745544434, -3.725290298461914e-05, 2.9534101486206055e-05, 9.632110595703125e-05, 0.00016310811042785645, 0.00022989511489868164, 0.00029668211936950684, 0.00036346912384033203, 0.0004302561283111572, 0.0004970431327819824, 0.0005638301372528076, 0.0006306171417236328, 0.000697404146194458, 0.0007641911506652832, 0.0008309781551361084, 0.0008977651596069336, 0.0009645521640777588, 0.001031339168548584, 0.0010981261730194092, 0.0011649131774902344, 0.0012317001819610596, 0.0012984871864318848, 0.00136527419090271, 0.0014320611953735352, 0.0014988481998443604, 0.0015656352043151855, 0.0016324222087860107, 0.001699209213256836, 0.0017659962177276611, 0.0018327832221984863, 0.0018995702266693115, 0.0019663572311401367, 0.002033144235610962, 0.002099931240081787, 0.0021667182445526123, 0.0022335052490234375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 14.0, 24.0, 59.0, 131.0, 237.0, 297.0, 130.0, 46.0, 29.0, 12.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062259502708911896, -0.059788286685943604, -0.05731707066297531, -0.05484585091471672, -0.05237463489174843, -0.049903418868780136, -0.047432199120521545, -0.04496098309755325, -0.04248976707458496, -0.04001855105161667, -0.037547335028648376, -0.035076115280389786, -0.032604899257421494, -0.0301336832344532, -0.02766246534883976, -0.02519124746322632, -0.022720031440258026, -0.020248815417289734, -0.017777597531676292, -0.015306380577385426, -0.012835163623094559, -0.010363946668803692, -0.007892729714512825, -0.0054215118288993835, -0.0029502958059310913, -0.00047907885164022446, 0.0019921381026506424, 0.004463355056941509, 0.006934572011232376, 0.009405788965523243, 0.01187700591981411, 0.014348223805427551, 0.016819432377815247, 0.01929064840078354, 0.02176186628639698, 0.024233084172010422, 0.026704300194978714, 0.029175516217947006, 0.0316467359662056, 0.03411795198917389, 0.03658916801214218, 0.039060384035110474, 0.041531600058078766, 0.04400281980633736, 0.04647403582930565, 0.04894525185227394, 0.05141647160053253, 0.053887687623500824, 0.056358903646469116, 0.05883011966943741, 0.0613013356924057, 0.06377255171537399, 0.06624376773834229, 0.06871499121189117, 0.07118620723485947, 0.07365742325782776, 0.07612863928079605, 0.07859985530376434, 0.08107107132673264, 0.08354228734970093, 0.08601351082324982, 0.08848472684621811, 0.0909559428691864, 0.0934271588921547, 0.09589837491512299]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 8.0, 3.0, 5.0, 10.0, 16.0, 8.0, 15.0, 18.0, 19.0, 17.0, 30.0, 26.0, 21.0, 29.0, 37.0, 47.0, 58.0, 64.0, 72.0, 93.0, 61.0, 51.0, 38.0, 36.0, 34.0, 34.0, 20.0, 20.0, 16.0, 12.0, 16.0, 11.0, 8.0, 7.0, 8.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.06331872940063477, -0.0614977590739727, -0.05967678874731064, -0.057855818420648575, -0.05603484809398651, -0.05421387776732445, -0.052392907440662384, -0.05057193711400032, -0.04875096678733826, -0.04692999646067619, -0.04510902613401413, -0.043288055807352066, -0.04146708548069, -0.03964611515402794, -0.037825144827365875, -0.03600417450070381, -0.03418320417404175, -0.032362233847379684, -0.03054126352071762, -0.028720293194055557, -0.026899322867393494, -0.02507835254073143, -0.023257382214069366, -0.021436411887407303, -0.01961544156074524, -0.017794471234083176, -0.015973500907421112, -0.014152530580759048, -0.012331560254096985, -0.010510589927434921, -0.008689619600772858, -0.006868649274110794, -0.0050476789474487305, -0.003226708620786667, -0.0014057382941246033, 0.00041523203253746033, 0.002236202359199524, 0.0040571726858615875, 0.005878143012523651, 0.007699113339185715, 0.009520083665847778, 0.011341053992509842, 0.013162024319171906, 0.014982994645833969, 0.016803964972496033, 0.018624935299158096, 0.02044590562582016, 0.022266875952482224, 0.024087846279144287, 0.02590881660580635, 0.027729786932468414, 0.029550757259130478, 0.03137172758579254, 0.033192697912454605, 0.03501366823911667, 0.03683463856577873, 0.038655608892440796, 0.04047657921910286, 0.04229754954576492, 0.04411851987242699, 0.04593949019908905, 0.047760460525751114, 0.04958143085241318, 0.05140240117907524, 0.053223371505737305]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 2.0, 13.0, 5.0, 19.0, 45.0, 41.0, 85.0, 160.0, 299.0, 698.0, 1813.0, 4740.0, 15642.0, 97897.0, 2179245.0, 1789983.0, 84968.0, 12716.0, 3573.0, 1348.0, 436.0, 228.0, 113.0, 57.0, 48.0, 33.0, 18.0, 15.0, 12.0, 7.0, 7.0, 1.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004108428955078125, -0.0039560794830322266, -0.003803730010986328, -0.0036513805389404297, -0.0034990310668945312, -0.003346681594848633, -0.0031943321228027344, -0.003041982650756836, -0.0028896331787109375, -0.002737283706665039, -0.0025849342346191406, -0.002432584762573242, -0.0022802352905273438, -0.0021278858184814453, -0.001975536346435547, -0.0018231868743896484, -0.00167083740234375, -0.0015184879302978516, -0.0013661384582519531, -0.0012137889862060547, -0.0010614395141601562, -0.0009090900421142578, -0.0007567405700683594, -0.0006043910980224609, -0.0004520416259765625, -0.00029969215393066406, -0.00014734268188476562, 5.0067901611328125e-06, 0.00015735626220703125, 0.0003097057342529297, 0.0004620552062988281, 0.0006144046783447266, 0.000766754150390625, 0.0009191036224365234, 0.0010714530944824219, 0.0012238025665283203, 0.0013761520385742188, 0.0015285015106201172, 0.0016808509826660156, 0.001833200454711914, 0.0019855499267578125, 0.002137899398803711, 0.0022902488708496094, 0.002442598342895508, 0.0025949478149414062, 0.0027472972869873047, 0.002899646759033203, 0.0030519962310791016, 0.003204345703125, 0.0033566951751708984, 0.003509044647216797, 0.0036613941192626953, 0.0038137435913085938, 0.003966093063354492, 0.004118442535400391, 0.004270792007446289, 0.0044231414794921875, 0.004575490951538086, 0.004727840423583984, 0.004880189895629883, 0.005032539367675781, 0.00518488883972168, 0.005337238311767578, 0.0054895877838134766, 0.005641937255859375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 7.0, 13.0, 20.0, 30.0, 52.0, 67.0, 92.0, 104.0, 138.0, 132.0, 103.0, 84.0, 49.0, 35.0, 26.0, 11.0, 7.0, 10.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007305145263671875, -0.007050931453704834, -0.006796717643737793, -0.006542503833770752, -0.006288290023803711, -0.00603407621383667, -0.005779862403869629, -0.005525648593902588, -0.005271434783935547, -0.005017220973968506, -0.004763007164001465, -0.004508793354034424, -0.004254579544067383, -0.004000365734100342, -0.0037461519241333008, -0.0034919381141662598, -0.0032377243041992188, -0.0029835104942321777, -0.0027292966842651367, -0.0024750828742980957, -0.0022208690643310547, -0.0019666552543640137, -0.0017124414443969727, -0.0014582276344299316, -0.0012040138244628906, -0.0009498000144958496, -0.0006955862045288086, -0.0004413723945617676, -0.00018715858459472656, 6.705522537231445e-05, 0.00032126903533935547, 0.0005754828453063965, 0.0008296966552734375, 0.0010839104652404785, 0.0013381242752075195, 0.0015923380851745605, 0.0018465518951416016, 0.0021007657051086426, 0.0023549795150756836, 0.0026091933250427246, 0.0028634071350097656, 0.0031176209449768066, 0.0033718347549438477, 0.0036260485649108887, 0.0038802623748779297, 0.004134476184844971, 0.004388689994812012, 0.004642903804779053, 0.004897117614746094, 0.005151331424713135, 0.005405545234680176, 0.005659759044647217, 0.005913972854614258, 0.006168186664581299, 0.00642240047454834, 0.006676614284515381, 0.006930828094482422, 0.007185041904449463, 0.007439255714416504, 0.007693469524383545, 0.007947683334350586, 0.008201897144317627, 0.008456110954284668, 0.008710324764251709, 0.00896453857421875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 6.0, 9.0, 10.0, 15.0, 22.0, 42.0, 67.0, 162.0, 309.0, 571.0, 1288.0, 4493.0, 39978.0, 3992024.0, 143401.0, 8374.0, 1905.0, 743.0, 378.0, 196.0, 122.0, 56.0, 51.0, 22.0, 12.0, 10.0, 6.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00928497314453125, -0.009009122848510742, -0.008733272552490234, -0.008457422256469727, -0.008181571960449219, -0.007905721664428711, -0.007629871368408203, -0.007354021072387695, -0.0070781707763671875, -0.00680232048034668, -0.006526470184326172, -0.006250619888305664, -0.005974769592285156, -0.0056989192962646484, -0.005423069000244141, -0.005147218704223633, -0.004871368408203125, -0.004595518112182617, -0.004319667816162109, -0.0040438175201416016, -0.0037679672241210938, -0.003492116928100586, -0.003216266632080078, -0.0029404163360595703, -0.0026645660400390625, -0.0023887157440185547, -0.002112865447998047, -0.001837015151977539, -0.0015611648559570312, -0.0012853145599365234, -0.0010094642639160156, -0.0007336139678955078, -0.000457763671875, -0.0001819133758544922, 9.393692016601562e-05, 0.00036978721618652344, 0.0006456375122070312, 0.0009214878082275391, 0.0011973381042480469, 0.0014731884002685547, 0.0017490386962890625, 0.0020248889923095703, 0.002300739288330078, 0.002576589584350586, 0.0028524398803710938, 0.0031282901763916016, 0.0034041404724121094, 0.003679990768432617, 0.003955841064453125, 0.004231691360473633, 0.004507541656494141, 0.0047833919525146484, 0.005059242248535156, 0.005335092544555664, 0.005610942840576172, 0.00588679313659668, 0.0061626434326171875, 0.006438493728637695, 0.006714344024658203, 0.006990194320678711, 0.007266044616699219, 0.0075418949127197266, 0.007817745208740234, 0.008093595504760742, 0.00836944580078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 11.0, 9.0, 15.0, 31.0, 141.0, 665.0, 1562.0, 1166.0, 308.0, 75.0, 34.0, 18.0, 21.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00934600830078125, -0.009009361267089844, -0.008672714233398438, -0.008336067199707031, -0.007999420166015625, -0.007662773132324219, -0.0073261260986328125, -0.006989479064941406, -0.00665283203125, -0.006316184997558594, -0.0059795379638671875, -0.005642890930175781, -0.005306243896484375, -0.004969596862792969, -0.0046329498291015625, -0.004296302795410156, -0.00395965576171875, -0.0036230087280273438, -0.0032863616943359375, -0.0029497146606445312, -0.002613067626953125, -0.0022764205932617188, -0.0019397735595703125, -0.0016031265258789062, -0.0012664794921875, -0.0009298324584960938, -0.0005931854248046875, -0.00025653839111328125, 8.0108642578125e-05, 0.00041675567626953125, 0.0007534027099609375, 0.0010900497436523438, 0.00142669677734375, 0.0017633438110351562, 0.0020999908447265625, 0.0024366378784179688, 0.002773284912109375, 0.0031099319458007812, 0.0034465789794921875, 0.0037832260131835938, 0.004119873046875, 0.004456520080566406, 0.0047931671142578125, 0.005129814147949219, 0.005466461181640625, 0.005803108215332031, 0.0061397552490234375, 0.006476402282714844, 0.00681304931640625, 0.007149696350097656, 0.0074863433837890625, 0.007822990417480469, 0.008159637451171875, 0.008496284484863281, 0.008832931518554688, 0.009169578552246094, 0.0095062255859375, 0.009842872619628906, 0.010179519653320312, 0.010516166687011719, 0.010852813720703125, 0.011189460754394531, 0.011526107788085938, 0.011862754821777344, 0.01219940185546875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 12.0, 72.0, 310.0, 428.0, 124.0, 25.0, 16.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05934443697333336, -0.056237686425447464, -0.05313093960285187, -0.05002418905496597, -0.04691743850708008, -0.04381069168448448, -0.04070394113659859, -0.03759719431400299, -0.034490443766117096, -0.0313836932182312, -0.028276946395635605, -0.02517019584774971, -0.022063447162508965, -0.01895669847726822, -0.015849947929382324, -0.012743199244141579, -0.009636450558900833, -0.0065297014079988, -0.0034229522570967674, -0.00031620264053344727, 0.0027905460447072983, 0.005897294729948044, 0.009004045277833939, 0.012110793963074684, 0.01521754264831543, 0.018324291333556175, 0.02143104001879692, 0.024537790566682816, 0.02764453925192356, 0.030751287937164307, 0.0338580384850502, 0.036964789032936096, 0.040071532130241394, 0.04317828267812729, 0.046285029500722885, 0.04939178004860878, 0.052498526871204376, 0.05560527741909027, 0.058712027966976166, 0.06181877851486206, 0.06492552161216736, 0.06803227216005325, 0.07113902270793915, 0.07424576580524445, 0.07735251635313034, 0.08045926690101624, 0.08356601744890213, 0.08667276799678802, 0.08977951854467392, 0.09288626909255981, 0.09599301964044571, 0.0990997701883316, 0.1022065132856369, 0.1053132638335228, 0.10842001438140869, 0.11152676492929459, 0.11463351547718048, 0.11774026602506638, 0.12084701657295227, 0.12395375967025757, 0.12706051766872406, 0.13016726076602936, 0.13327401876449585, 0.13638076186180115, 0.13948750495910645]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 4.0, 4.0, 9.0, 7.0, 8.0, 9.0, 9.0, 12.0, 13.0, 31.0, 28.0, 23.0, 25.0, 26.0, 25.0, 30.0, 35.0, 43.0, 40.0, 48.0, 53.0, 44.0, 47.0, 50.0, 42.0, 47.0, 36.0, 38.0, 33.0, 28.0, 15.0, 21.0, 25.0, 15.0, 10.0, 17.0, 12.0, 7.0, 8.0, 8.0, 3.0, 4.0, 2.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.020757019519805908, -0.020089566707611084, -0.01942211575806141, -0.018754664808511734, -0.01808721199631691, -0.017419759184122086, -0.01675230823457241, -0.016084857285022736, -0.015417404472827911, -0.014749952591955662, -0.014082500711083412, -0.013415048830211163, -0.012747596949338913, -0.012080145068466663, -0.011412693187594414, -0.010745241306722164, -0.010077789425849915, -0.009410337544977665, -0.008742885664105415, -0.008075433783233166, -0.007407981902360916, -0.0067405300214886665, -0.006073078140616417, -0.005405626259744167, -0.004738174378871918, -0.004070722497999668, -0.0034032706171274185, -0.002735818736255169, -0.0020683668553829193, -0.0014009149745106697, -0.0007334630936384201, -6.60112127661705e-05, 0.0006014406681060791, 0.0012688925489783287, 0.0019363444298505783, 0.002603796310722828, 0.0032712481915950775, 0.003938700072467327, 0.004606151953339577, 0.005273603834211826, 0.005941055715084076, 0.0066085075959563255, 0.007275959476828575, 0.007943411357700825, 0.008610863238573074, 0.009278315119445324, 0.009945767000317574, 0.010613218881189823, 0.011280670762062073, 0.011948122642934322, 0.012615574523806572, 0.013283026404678822, 0.013950478285551071, 0.01461793016642332, 0.01528538204729557, 0.015952832996845245, 0.01662028580904007, 0.017287738621234894, 0.01795518957078457, 0.018622640520334244, 0.019290093332529068, 0.019957546144723892, 0.020624997094273567, 0.021292448043823242, 0.021959900856018066]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 2.0, 7.0, 5.0, 13.0, 9.0, 17.0, 19.0, 37.0, 36.0, 66.0, 77.0, 113.0, 165.0, 258.0, 339.0, 556.0, 915.0, 1493.0, 2569.0, 4973.0, 10781.0, 26944.0, 78453.0, 238079.0, 392982.0, 187874.0, 60600.0, 21765.0, 9061.0, 4294.0, 2247.0, 1330.0, 808.0, 529.0, 334.0, 228.0, 150.0, 105.0, 91.0, 63.0, 48.0, 28.0, 23.0, 16.0, 15.0, 10.0, 13.0, 6.0, 1.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0037708282470703125, -0.0036506950855255127, -0.003530561923980713, -0.003410428762435913, -0.0032902956008911133, -0.0031701624393463135, -0.0030500292778015137, -0.002929896116256714, -0.002809762954711914, -0.0026896297931671143, -0.0025694966316223145, -0.0024493634700775146, -0.002329230308532715, -0.002209097146987915, -0.0020889639854431152, -0.0019688308238983154, -0.0018486976623535156, -0.0017285645008087158, -0.001608431339263916, -0.0014882981777191162, -0.0013681650161743164, -0.0012480318546295166, -0.0011278986930847168, -0.001007765531539917, -0.0008876323699951172, -0.0007674992084503174, -0.0006473660469055176, -0.0005272328853607178, -0.00040709972381591797, -0.00028696656227111816, -0.00016683340072631836, -4.6700239181518555e-05, 7.343292236328125e-05, 0.00019356608390808105, 0.00031369924545288086, 0.00043383240699768066, 0.0005539655685424805, 0.0006740987300872803, 0.0007942318916320801, 0.0009143650531768799, 0.0010344982147216797, 0.0011546313762664795, 0.0012747645378112793, 0.001394897699356079, 0.001515030860900879, 0.0016351640224456787, 0.0017552971839904785, 0.0018754303455352783, 0.001995563507080078, 0.002115696668624878, 0.0022358298301696777, 0.0023559629917144775, 0.0024760961532592773, 0.002596229314804077, 0.002716362476348877, 0.0028364956378936768, 0.0029566287994384766, 0.0030767619609832764, 0.003196895122528076, 0.003317028284072876, 0.0034371614456176758, 0.0035572946071624756, 0.0036774277687072754, 0.003797560930252075, 0.003917694091796875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 18.0, 21.0, 34.0, 52.0, 65.0, 106.0, 131.0, 129.0, 141.0, 104.0, 68.0, 33.0, 32.0, 21.0, 11.0, 6.0, 11.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00725555419921875, -0.007000565528869629, -0.006745576858520508, -0.006490588188171387, -0.006235599517822266, -0.0059806108474731445, -0.0057256221771240234, -0.005470633506774902, -0.005215644836425781, -0.00496065616607666, -0.004705667495727539, -0.004450678825378418, -0.004195690155029297, -0.003940701484680176, -0.0036857128143310547, -0.0034307241439819336, -0.0031757354736328125, -0.0029207468032836914, -0.0026657581329345703, -0.0024107694625854492, -0.002155780792236328, -0.001900792121887207, -0.001645803451538086, -0.0013908147811889648, -0.0011358261108398438, -0.0008808374404907227, -0.0006258487701416016, -0.00037086009979248047, -0.00011587142944335938, 0.00013911724090576172, 0.0003941059112548828, 0.0006490945816040039, 0.000904083251953125, 0.001159071922302246, 0.0014140605926513672, 0.0016690492630004883, 0.0019240379333496094, 0.0021790266036987305, 0.0024340152740478516, 0.0026890039443969727, 0.0029439926147460938, 0.003198981285095215, 0.003453969955444336, 0.003708958625793457, 0.003963947296142578, 0.004218935966491699, 0.00447392463684082, 0.004728913307189941, 0.0049839019775390625, 0.005238890647888184, 0.005493879318237305, 0.005748867988586426, 0.006003856658935547, 0.006258845329284668, 0.006513833999633789, 0.00676882266998291, 0.007023811340332031, 0.007278800010681152, 0.0075337886810302734, 0.0077887773513793945, 0.008043766021728516, 0.008298754692077637, 0.008553743362426758, 0.008808732032775879, 0.009063720703125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 9.0, 3.0, 7.0, 6.0, 13.0, 14.0, 19.0, 25.0, 30.0, 48.0, 71.0, 69.0, 122.0, 165.0, 236.0, 390.0, 690.0, 1205.0, 2461.0, 5405.0, 13299.0, 34592.0, 96284.0, 232401.0, 442292.0, 136232.0, 49525.0, 18374.0, 7333.0, 3313.0, 1633.0, 825.0, 464.0, 325.0, 198.0, 136.0, 95.0, 72.0, 40.0, 35.0, 27.0, 15.0, 17.0, 11.0, 10.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0043487548828125, -0.004221528768539429, -0.004094302654266357, -0.003967076539993286, -0.003839850425720215, -0.0037126243114471436, -0.0035853981971740723, -0.003458172082901001, -0.0033309459686279297, -0.0032037198543548584, -0.003076493740081787, -0.002949267625808716, -0.0028220415115356445, -0.0026948153972625732, -0.002567589282989502, -0.0024403631687164307, -0.0023131370544433594, -0.002185910940170288, -0.002058684825897217, -0.0019314587116241455, -0.0018042325973510742, -0.001677006483078003, -0.0015497803688049316, -0.0014225542545318604, -0.001295328140258789, -0.0011681020259857178, -0.0010408759117126465, -0.0009136497974395752, -0.0007864236831665039, -0.0006591975688934326, -0.0005319714546203613, -0.00040474534034729004, -0.00027751922607421875, -0.00015029311180114746, -2.3066997528076172e-05, 0.00010415911674499512, 0.0002313852310180664, 0.0003586113452911377, 0.000485837459564209, 0.0006130635738372803, 0.0007402896881103516, 0.0008675158023834229, 0.0009947419166564941, 0.0011219680309295654, 0.0012491941452026367, 0.001376420259475708, 0.0015036463737487793, 0.0016308724880218506, 0.0017580986022949219, 0.0018853247165679932, 0.0020125508308410645, 0.0021397769451141357, 0.002267003059387207, 0.0023942291736602783, 0.0025214552879333496, 0.002648681402206421, 0.002775907516479492, 0.0029031336307525635, 0.0030303597450256348, 0.003157585859298706, 0.0032848119735717773, 0.0034120380878448486, 0.00353926420211792, 0.003666490316390991, 0.0037937164306640625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 11.0, 3.0, 11.0, 9.0, 8.0, 12.0, 11.0, 11.0, 19.0, 20.0, 24.0, 24.0, 21.0, 35.0, 40.0, 36.0, 42.0, 44.0, 47.0, 49.0, 51.0, 42.0, 43.0, 38.0, 29.0, 31.0, 35.0, 40.0, 33.0, 27.0, 20.0, 16.0, 20.0, 17.0, 20.0, 10.0, 6.0, 8.0, 16.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.01067352294921875, -0.010328173637390137, -0.009982824325561523, -0.00963747501373291, -0.009292125701904297, -0.008946776390075684, -0.00860142707824707, -0.008256077766418457, -0.007910728454589844, -0.0075653791427612305, -0.007220029830932617, -0.006874680519104004, -0.006529331207275391, -0.006183981895446777, -0.005838632583618164, -0.005493283271789551, -0.0051479339599609375, -0.004802584648132324, -0.004457235336303711, -0.004111886024475098, -0.0037665367126464844, -0.003421187400817871, -0.003075838088989258, -0.0027304887771606445, -0.0023851394653320312, -0.002039790153503418, -0.0016944408416748047, -0.0013490915298461914, -0.0010037422180175781, -0.0006583929061889648, -0.00031304359436035156, 3.230571746826172e-05, 0.000377655029296875, 0.0007230043411254883, 0.0010683536529541016, 0.0014137029647827148, 0.0017590522766113281, 0.0021044015884399414, 0.0024497509002685547, 0.002795100212097168, 0.0031404495239257812, 0.0034857988357543945, 0.003831148147583008, 0.004176497459411621, 0.004521846771240234, 0.004867196083068848, 0.005212545394897461, 0.005557894706726074, 0.0059032440185546875, 0.006248593330383301, 0.006593942642211914, 0.006939291954040527, 0.007284641265869141, 0.007629990577697754, 0.007975339889526367, 0.00832068920135498, 0.008666038513183594, 0.009011387825012207, 0.00935673713684082, 0.009702086448669434, 0.010047435760498047, 0.01039278507232666, 0.010738134384155273, 0.011083483695983887, 0.0114288330078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 13.0, 10.0, 14.0, 22.0, 46.0, 63.0, 89.0, 148.0, 243.0, 383.0, 663.0, 1264.0, 2450.0, 5363.0, 12850.0, 36830.0, 135403.0, 596869.0, 180712.0, 47304.0, 15473.0, 6353.0, 2747.0, 1373.0, 757.0, 405.0, 270.0, 149.0, 80.0, 81.0, 45.0, 30.0, 18.0, 12.0, 7.0, 7.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0013113021850585938, -0.0012684464454650879, -0.001225590705871582, -0.0011827349662780762, -0.0011398792266845703, -0.0010970234870910645, -0.0010541677474975586, -0.0010113120079040527, -0.0009684562683105469, -0.000925600528717041, -0.0008827447891235352, -0.0008398890495300293, -0.0007970333099365234, -0.0007541775703430176, -0.0007113218307495117, -0.0006684660911560059, -0.0006256103515625, -0.0005827546119689941, -0.0005398988723754883, -0.0004970431327819824, -0.00045418739318847656, -0.0004113316535949707, -0.00036847591400146484, -0.000325620174407959, -0.0002827644348144531, -0.00023990869522094727, -0.0001970529556274414, -0.00015419721603393555, -0.00011134147644042969, -6.848573684692383e-05, -2.562999725341797e-05, 1.722574234008789e-05, 6.008148193359375e-05, 0.00010293722152709961, 0.00014579296112060547, 0.00018864870071411133, 0.0002315044403076172, 0.00027436017990112305, 0.0003172159194946289, 0.00036007165908813477, 0.0004029273986816406, 0.0004457831382751465, 0.0004886388778686523, 0.0005314946174621582, 0.0005743503570556641, 0.0006172060966491699, 0.0006600618362426758, 0.0007029175758361816, 0.0007457733154296875, 0.0007886290550231934, 0.0008314847946166992, 0.0008743405342102051, 0.0009171962738037109, 0.0009600520133972168, 0.0010029077529907227, 0.0010457634925842285, 0.0010886192321777344, 0.0011314749717712402, 0.001174330711364746, 0.001217186450958252, 0.0012600421905517578, 0.0013028979301452637, 0.0013457536697387695, 0.0013886094093322754, 0.0014314651489257812]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 1.0, 5.0, 13.0, 15.0, 17.0, 11.0, 22.0, 11.0, 27.0, 34.0, 37.0, 33.0, 42.0, 44.0, 23.0, 51.0, 50.0, 51.0, 63.0, 48.0, 50.0, 22.0, 55.0, 32.0, 32.0, 41.0, 23.0, 25.0, 12.0, 29.0, 19.0, 8.0, 11.0, 8.0, 4.0, 2.0, 7.0, 2.0, 6.0, 6.0, 1.0, 6.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.516674041748047e-06, -3.405846655368805e-06, -3.295019268989563e-06, -3.184191882610321e-06, -3.073364496231079e-06, -2.962537109851837e-06, -2.8517097234725952e-06, -2.7408823370933533e-06, -2.6300549507141113e-06, -2.5192275643348694e-06, -2.4084001779556274e-06, -2.2975727915763855e-06, -2.1867454051971436e-06, -2.0759180188179016e-06, -1.9650906324386597e-06, -1.8542632460594177e-06, -1.7434358596801758e-06, -1.6326084733009338e-06, -1.521781086921692e-06, -1.41095370054245e-06, -1.300126314163208e-06, -1.189298927783966e-06, -1.0784715414047241e-06, -9.676441550254822e-07, -8.568167686462402e-07, -7.459893822669983e-07, -6.351619958877563e-07, -5.243346095085144e-07, -4.1350722312927246e-07, -3.026798367500305e-07, -1.9185245037078857e-07, -8.102506399154663e-08, 2.9802322387695312e-08, 1.4062970876693726e-07, 2.514570951461792e-07, 3.6228448152542114e-07, 4.731118679046631e-07, 5.83939254283905e-07, 6.94766640663147e-07, 8.055940270423889e-07, 9.164214134216309e-07, 1.0272487998008728e-06, 1.1380761861801147e-06, 1.2489035725593567e-06, 1.3597309589385986e-06, 1.4705583453178406e-06, 1.5813857316970825e-06, 1.6922131180763245e-06, 1.8030405044555664e-06, 1.9138678908348083e-06, 2.0246952772140503e-06, 2.1355226635932922e-06, 2.246350049972534e-06, 2.357177436351776e-06, 2.468004822731018e-06, 2.57883220911026e-06, 2.689659595489502e-06, 2.800486981868744e-06, 2.911314368247986e-06, 3.0221417546272278e-06, 3.1329691410064697e-06, 3.2437965273857117e-06, 3.3546239137649536e-06, 3.4654513001441956e-06, 3.5762786865234375e-06]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 8.0, 9.0, 18.0, 16.0, 29.0, 32.0, 93.0, 148.0, 338.0, 736.0, 1945.0, 6300.0, 26188.0, 161684.0, 688880.0, 131252.0, 22221.0, 5483.0, 1798.0, 716.0, 308.0, 129.0, 82.0, 39.0, 32.0, 17.0, 16.0, 9.0, 7.0, 4.0, 4.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00225830078125, -0.002202466130256653, -0.0021466314792633057, -0.0020907968282699585, -0.0020349621772766113, -0.001979127526283264, -0.001923292875289917, -0.0018674582242965698, -0.0018116235733032227, -0.0017557889223098755, -0.0016999542713165283, -0.0016441196203231812, -0.001588284969329834, -0.0015324503183364868, -0.0014766156673431396, -0.0014207810163497925, -0.0013649463653564453, -0.0013091117143630981, -0.001253277063369751, -0.0011974424123764038, -0.0011416077613830566, -0.0010857731103897095, -0.0010299384593963623, -0.0009741038084030151, -0.000918269157409668, -0.0008624345064163208, -0.0008065998554229736, -0.0007507652044296265, -0.0006949305534362793, -0.0006390959024429321, -0.000583261251449585, -0.0005274266004562378, -0.0004715919494628906, -0.00041575729846954346, -0.0003599226474761963, -0.0003040879964828491, -0.00024825334548950195, -0.00019241869449615479, -0.00013658404350280762, -8.074939250946045e-05, -2.491474151611328e-05, 3.091990947723389e-05, 8.675456047058105e-05, 0.00014258921146392822, 0.0001984238624572754, 0.00025425851345062256, 0.0003100931644439697, 0.0003659278154373169, 0.00042176246643066406, 0.00047759711742401123, 0.0005334317684173584, 0.0005892664194107056, 0.0006451010704040527, 0.0007009357213973999, 0.0007567703723907471, 0.0008126050233840942, 0.0008684396743774414, 0.0009242743253707886, 0.0009801089763641357, 0.001035943627357483, 0.00109177827835083, 0.0011476129293441772, 0.0012034475803375244, 0.0012592822313308716, 0.0013151168823242188]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 10.0, 9.0, 17.0, 21.0, 21.0, 17.0, 26.0, 48.0, 56.0, 75.0, 84.0, 82.0, 89.0, 98.0, 78.0, 72.0, 50.0, 38.0, 33.0, 17.0, 15.0, 10.0, 14.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002483367919921875, -0.0024108588695526123, -0.0023383498191833496, -0.002265840768814087, -0.0021933317184448242, -0.0021208226680755615, -0.002048313617706299, -0.001975804567337036, -0.0019032955169677734, -0.0018307864665985107, -0.001758277416229248, -0.0016857683658599854, -0.0016132593154907227, -0.00154075026512146, -0.0014682412147521973, -0.0013957321643829346, -0.0013232231140136719, -0.0012507140636444092, -0.0011782050132751465, -0.0011056959629058838, -0.001033186912536621, -0.0009606778621673584, -0.0008881688117980957, -0.000815659761428833, -0.0007431507110595703, -0.0006706416606903076, -0.0005981326103210449, -0.0005256235599517822, -0.00045311450958251953, -0.00038060545921325684, -0.00030809640884399414, -0.00023558735847473145, -0.00016307830810546875, -9.056925773620605e-05, -1.806020736694336e-05, 5.4448843002319336e-05, 0.00012695789337158203, 0.00019946694374084473, 0.0002719759941101074, 0.0003444850444793701, 0.0004169940948486328, 0.0004895031452178955, 0.0005620121955871582, 0.0006345212459564209, 0.0007070302963256836, 0.0007795393466949463, 0.000852048397064209, 0.0009245574474334717, 0.0009970664978027344, 0.001069575548171997, 0.0011420845985412598, 0.0012145936489105225, 0.0012871026992797852, 0.0013596117496490479, 0.0014321208000183105, 0.0015046298503875732, 0.001577138900756836, 0.0016496479511260986, 0.0017221570014953613, 0.001794666051864624, 0.0018671751022338867, 0.0019396841526031494, 0.002012193202972412, 0.002084702253341675, 0.0021572113037109375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 9.0, 18.0, 31.0, 71.0, 220.0, 359.0, 181.0, 72.0, 24.0, 10.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04073881357908249, -0.03827570006251335, -0.035812586545944214, -0.033349473029375076, -0.03088635765016079, -0.028423244133591652, -0.025960128754377365, -0.023497015237808228, -0.02103390172123909, -0.018570788204669952, -0.016107674688100815, -0.013644559308886528, -0.01118144579231739, -0.008718332275748253, -0.006255217827856541, -0.0037921033799648285, -0.001328989863395691, 0.001134124118834734, 0.003597238101065159, 0.006060352083295584, 0.008523466065526009, 0.010986579582095146, 0.013449694029986858, 0.01591280847787857, 0.018375921994447708, 0.020839035511016846, 0.023302149027585983, 0.02576526440680027, 0.028228377923369408, 0.030691491439938545, 0.03315460681915283, 0.03561772033572197, 0.03808082640171051, 0.04054393991827965, 0.043007053434848785, 0.04547016695141792, 0.04793328046798706, 0.0503963977098465, 0.052859511226415634, 0.05532262474298477, 0.05778573825955391, 0.06024885177612305, 0.06271196901798248, 0.06517507880926132, 0.06763819605112076, 0.0701013058423996, 0.07256442308425903, 0.07502754032611847, 0.07749065011739731, 0.07995376735925674, 0.08241687715053558, 0.08487999439239502, 0.08734310418367386, 0.0898062214255333, 0.09226933121681213, 0.09473244845867157, 0.097195565700531, 0.09965868294239044, 0.10212179273366928, 0.10458490997552872, 0.10704801976680756, 0.10951113700866699, 0.11197424679994583, 0.11443736404180527, 0.1169004738330841]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 1.0, 4.0, 7.0, 3.0, 6.0, 5.0, 10.0, 15.0, 10.0, 16.0, 13.0, 15.0, 22.0, 27.0, 29.0, 25.0, 20.0, 31.0, 41.0, 41.0, 58.0, 60.0, 69.0, 56.0, 61.0, 35.0, 38.0, 30.0, 33.0, 14.0, 23.0, 21.0, 17.0, 18.0, 24.0, 11.0, 13.0, 14.0, 8.0, 7.0, 7.0, 5.0, 7.0, 10.0, 3.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.03861534595489502, -0.03742838278412819, -0.03624141961336136, -0.03505445271730423, -0.0338674895465374, -0.03268052637577057, -0.03149355947971344, -0.03030659630894661, -0.02911963313817978, -0.02793266996741295, -0.02674570493400097, -0.02555873990058899, -0.02437177672982216, -0.02318481355905533, -0.02199784852564335, -0.02081088349223137, -0.01962392032146454, -0.018436957150697708, -0.01724999211728573, -0.01606302708387375, -0.014876063913106918, -0.013689099811017513, -0.012502135708928108, -0.011315171606838703, -0.010128207504749298, -0.008941243402659893, -0.007754279300570488, -0.006567315198481083, -0.005380351096391678, -0.004193386994302273, -0.0030064228922128677, -0.0018194587901234627, -0.0006324946880340576, 0.0005544694140553474, 0.0017414335161447525, 0.0029283976182341576, 0.004115361720323563, 0.005302325822412968, 0.006489289924502373, 0.007676254026591778, 0.008863218128681183, 0.010050182230770588, 0.011237146332859993, 0.012424110434949398, 0.013611074537038803, 0.014798038639128208, 0.015985002741217613, 0.017171967774629593, 0.018358930945396423, 0.019545894116163254, 0.020732859149575233, 0.021919824182987213, 0.023106787353754044, 0.024293750524520874, 0.025480715557932854, 0.026667680591344833, 0.027854643762111664, 0.029041606932878494, 0.030228571966290474, 0.031415536999702454, 0.032602500170469284, 0.033789463341236115, 0.03497643023729324, 0.036163393408060074, 0.037350356578826904]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 6.0, 11.0, 9.0, 17.0, 41.0, 97.0, 197.0, 310.0, 518.0, 972.0, 1897.0, 3573.0, 7771.0, 21326.0, 95203.0, 709223.0, 2688535.0, 556991.0, 79129.0, 17740.0, 5568.0, 2523.0, 1288.0, 658.0, 350.0, 143.0, 66.0, 42.0, 20.0, 16.0, 8.0, 11.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0032825469970703125, -0.0031899213790893555, -0.0030972957611083984, -0.0030046701431274414, -0.0029120445251464844, -0.0028194189071655273, -0.0027267932891845703, -0.0026341676712036133, -0.0025415420532226562, -0.0024489164352416992, -0.002356290817260742, -0.002263665199279785, -0.002171039581298828, -0.002078413963317871, -0.001985788345336914, -0.001893162727355957, -0.001800537109375, -0.001707911491394043, -0.001615285873413086, -0.001522660255432129, -0.0014300346374511719, -0.0013374090194702148, -0.0012447834014892578, -0.0011521577835083008, -0.0010595321655273438, -0.0009669065475463867, -0.0008742809295654297, -0.0007816553115844727, -0.0006890296936035156, -0.0005964040756225586, -0.0005037784576416016, -0.00041115283966064453, -0.0003185272216796875, -0.00022590160369873047, -0.00013327598571777344, -4.0650367736816406e-05, 5.1975250244140625e-05, 0.00014460086822509766, 0.0002372264862060547, 0.0003298521041870117, 0.00042247772216796875, 0.0005151033401489258, 0.0006077289581298828, 0.0007003545761108398, 0.0007929801940917969, 0.0008856058120727539, 0.000978231430053711, 0.001070857048034668, 0.001163482666015625, 0.001256108283996582, 0.001348733901977539, 0.001441359519958496, 0.0015339851379394531, 0.0016266107559204102, 0.0017192363739013672, 0.0018118619918823242, 0.0019044876098632812, 0.0019971132278442383, 0.0020897388458251953, 0.0021823644638061523, 0.0022749900817871094, 0.0023676156997680664, 0.0024602413177490234, 0.0025528669357299805, 0.0026454925537109375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 7.0, 5.0, 6.0, 13.0, 19.0, 28.0, 46.0, 78.0, 109.0, 109.0, 139.0, 137.0, 106.0, 82.0, 33.0, 35.0, 25.0, 11.0, 7.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007293701171875, -0.007038474082946777, -0.006783246994018555, -0.006528019905090332, -0.006272792816162109, -0.006017565727233887, -0.005762338638305664, -0.005507111549377441, -0.005251884460449219, -0.004996657371520996, -0.0047414302825927734, -0.004486203193664551, -0.004230976104736328, -0.0039757490158081055, -0.003720521926879883, -0.00346529483795166, -0.0032100677490234375, -0.002954840660095215, -0.002699613571166992, -0.0024443864822387695, -0.002189159393310547, -0.0019339323043823242, -0.0016787052154541016, -0.001423478126525879, -0.0011682510375976562, -0.0009130239486694336, -0.0006577968597412109, -0.0004025697708129883, -0.00014734268188476562, 0.00010788440704345703, 0.0003631114959716797, 0.0006183385848999023, 0.000873565673828125, 0.0011287927627563477, 0.0013840198516845703, 0.001639246940612793, 0.0018944740295410156, 0.0021497011184692383, 0.002404928207397461, 0.0026601552963256836, 0.0029153823852539062, 0.003170609474182129, 0.0034258365631103516, 0.0036810636520385742, 0.003936290740966797, 0.0041915178298950195, 0.004446744918823242, 0.004701972007751465, 0.0049571990966796875, 0.00521242618560791, 0.005467653274536133, 0.0057228803634643555, 0.005978107452392578, 0.006233334541320801, 0.0064885616302490234, 0.006743788719177246, 0.006999015808105469, 0.007254242897033691, 0.007509469985961914, 0.007764697074890137, 0.00801992416381836, 0.008275151252746582, 0.008530378341674805, 0.008785605430603027, 0.00904083251953125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 15.0, 25.0, 37.0, 87.0, 159.0, 312.0, 12087.0, 4179898.0, 1242.0, 205.0, 120.0, 57.0, 29.0, 12.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0291595458984375, -0.028197050094604492, -0.027234554290771484, -0.026272058486938477, -0.02530956268310547, -0.02434706687927246, -0.023384571075439453, -0.022422075271606445, -0.021459579467773438, -0.02049708366394043, -0.019534587860107422, -0.018572092056274414, -0.017609596252441406, -0.0166471004486084, -0.01568460464477539, -0.014722108840942383, -0.013759613037109375, -0.012797117233276367, -0.01183462142944336, -0.010872125625610352, -0.009909629821777344, -0.008947134017944336, -0.007984638214111328, -0.00702214241027832, -0.0060596466064453125, -0.005097150802612305, -0.004134654998779297, -0.003172159194946289, -0.0022096633911132812, -0.0012471675872802734, -0.0002846717834472656, 0.0006778240203857422, 0.00164031982421875, 0.002602815628051758, 0.0035653114318847656, 0.0045278072357177734, 0.005490303039550781, 0.006452798843383789, 0.007415294647216797, 0.008377790451049805, 0.009340286254882812, 0.01030278205871582, 0.011265277862548828, 0.012227773666381836, 0.013190269470214844, 0.014152765274047852, 0.01511526107788086, 0.016077756881713867, 0.017040252685546875, 0.018002748489379883, 0.01896524429321289, 0.0199277400970459, 0.020890235900878906, 0.021852731704711914, 0.022815227508544922, 0.02377772331237793, 0.024740219116210938, 0.025702714920043945, 0.026665210723876953, 0.02762770652770996, 0.02859020233154297, 0.029552698135375977, 0.030515193939208984, 0.03147768974304199, 0.032440185546875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 10.0, 19.0, 55.0, 239.0, 1018.0, 1830.0, 701.0, 142.0, 33.0, 11.0, 8.0, 7.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.018707275390625, -0.01834315061569214, -0.017979025840759277, -0.017614901065826416, -0.017250776290893555, -0.016886651515960693, -0.016522526741027832, -0.01615840196609497, -0.01579427719116211, -0.015430152416229248, -0.015066027641296387, -0.014701902866363525, -0.014337778091430664, -0.013973653316497803, -0.013609528541564941, -0.01324540376663208, -0.012881278991699219, -0.012517154216766357, -0.012153029441833496, -0.011788904666900635, -0.011424779891967773, -0.011060655117034912, -0.01069653034210205, -0.01033240556716919, -0.009968280792236328, -0.009604156017303467, -0.009240031242370605, -0.008875906467437744, -0.008511781692504883, -0.008147656917572021, -0.00778353214263916, -0.007419407367706299, -0.0070552825927734375, -0.006691157817840576, -0.006327033042907715, -0.0059629082679748535, -0.005598783493041992, -0.005234658718109131, -0.0048705339431762695, -0.004506409168243408, -0.004142284393310547, -0.0037781596183776855, -0.0034140348434448242, -0.003049910068511963, -0.0026857852935791016, -0.0023216605186462402, -0.001957535743713379, -0.0015934109687805176, -0.0012292861938476562, -0.0008651614189147949, -0.0005010366439819336, -0.00013691186904907227, 0.00022721290588378906, 0.0005913376808166504, 0.0009554624557495117, 0.001319587230682373, 0.0016837120056152344, 0.0020478367805480957, 0.002411961555480957, 0.0027760863304138184, 0.0031402111053466797, 0.003504335880279541, 0.0038684606552124023, 0.004232585430145264, 0.004596710205078125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 11.0, 8.0, 11.0, 19.0, 36.0, 68.0, 128.0, 164.0, 197.0, 157.0, 95.0, 61.0, 22.0, 10.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05580972880125046, -0.054664552211761475, -0.05351937562227249, -0.05237419903278351, -0.051229022443294525, -0.05008384585380554, -0.04893866926431656, -0.047793492674827576, -0.04664831608533859, -0.04550313949584961, -0.044357962906360626, -0.04321278631687164, -0.04206760972738266, -0.04092243313789368, -0.039777256548404694, -0.03863207995891571, -0.03748689964413643, -0.036341723054647446, -0.03519654646515846, -0.03405136987566948, -0.032906193286180496, -0.03176101669669151, -0.03061583824455738, -0.029470661655068398, -0.028325485065579414, -0.02718030847609043, -0.026035131886601448, -0.024889955297112465, -0.023744776844978333, -0.02259960025548935, -0.021454423666000366, -0.020309247076511383, -0.0191640704870224, -0.018018893897533417, -0.016873717308044434, -0.01572854071855545, -0.014583363197743893, -0.01343818660825491, -0.012293009087443352, -0.011147832497954369, -0.010002655908465385, -0.008857479318976402, -0.007712302263826132, -0.006567125208675861, -0.005421948619186878, -0.004276772029697895, -0.0031315949745476246, -0.001986417919397354, -0.000841241329908371, 0.00030393549241125584, 0.0014491123147308826, 0.0025942891370505095, 0.0037394659593701363, 0.004884642548859119, 0.00602981960400939, 0.00717499665915966, 0.008320173248648643, 0.009465349838137627, 0.01061052642762661, 0.011755703948438168, 0.01290088053792715, 0.014046057127416134, 0.015191234648227692, 0.016336411237716675, 0.017481587827205658]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 8.0, 8.0, 8.0, 7.0, 10.0, 8.0, 11.0, 17.0, 22.0, 25.0, 30.0, 26.0, 42.0, 27.0, 44.0, 31.0, 37.0, 51.0, 38.0, 36.0, 45.0, 43.0, 45.0, 50.0, 43.0, 45.0, 34.0, 28.0, 40.0, 21.0, 17.0, 19.0, 19.0, 14.0, 10.0, 13.0, 10.0, 12.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.02270883321762085, -0.022083088755607605, -0.02145734243094921, -0.020831596106290817, -0.020205851644277573, -0.019580107182264328, -0.018954360857605934, -0.01832861453294754, -0.017702870070934296, -0.01707712560892105, -0.016451379284262657, -0.015825632959604263, -0.015199888497591019, -0.0145741431042552, -0.01394839771091938, -0.013322652317583561, -0.012696906924247742, -0.012071161530911922, -0.011445416137576103, -0.010819670744240284, -0.010193925350904465, -0.009568179957568645, -0.008942434564232826, -0.008316689170897007, -0.007690943777561188, -0.0070651983842253685, -0.006439452990889549, -0.00581370759755373, -0.005187962204217911, -0.0045622168108820915, -0.003936471417546272, -0.003310726024210453, -0.002684980630874634, -0.0020592352375388145, -0.0014334898442029953, -0.0008077444508671761, -0.0001819990575313568, 0.00044374633580446243, 0.0010694917291402817, 0.001695237122476101, 0.00232098251581192, 0.0029467279091477394, 0.0035724733024835587, 0.004198218695819378, 0.004823964089155197, 0.005449709482491016, 0.006075454875826836, 0.006701200269162655, 0.007326945662498474, 0.007952691055834293, 0.008578436449170113, 0.009204181842505932, 0.009829927235841751, 0.01045567262917757, 0.01108141802251339, 0.011707163415849209, 0.012332908809185028, 0.012958654202520847, 0.013584399595856667, 0.014210144989192486, 0.014835890382528305, 0.015461635775864124, 0.016087381169199944, 0.016713127493858337, 0.017338871955871582]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 3.0, 13.0, 7.0, 18.0, 18.0, 34.0, 36.0, 57.0, 65.0, 91.0, 173.0, 249.0, 342.0, 497.0, 899.0, 1542.0, 3028.0, 6425.0, 15433.0, 44192.0, 142244.0, 395205.0, 295419.0, 91313.0, 29675.0, 10919.0, 4808.0, 2374.0, 1247.0, 782.0, 458.0, 339.0, 186.0, 117.0, 108.0, 64.0, 49.0, 29.0, 32.0, 23.0, 12.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.004314422607421875, -0.004178822040557861, -0.004043221473693848, -0.003907620906829834, -0.0037720203399658203, -0.0036364197731018066, -0.003500819206237793, -0.0033652186393737793, -0.0032296180725097656, -0.003094017505645752, -0.0029584169387817383, -0.0028228163719177246, -0.002687215805053711, -0.0025516152381896973, -0.0024160146713256836, -0.00228041410446167, -0.0021448135375976562, -0.0020092129707336426, -0.001873612403869629, -0.0017380118370056152, -0.0016024112701416016, -0.0014668107032775879, -0.0013312101364135742, -0.0011956095695495605, -0.0010600090026855469, -0.0009244084358215332, -0.0007888078689575195, -0.0006532073020935059, -0.0005176067352294922, -0.0003820061683654785, -0.00024640560150146484, -0.00011080503463745117, 2.47955322265625e-05, 0.00016039609909057617, 0.00029599666595458984, 0.0004315972328186035, 0.0005671977996826172, 0.0007027983665466309, 0.0008383989334106445, 0.0009739995002746582, 0.0011096000671386719, 0.0012452006340026855, 0.0013808012008666992, 0.0015164017677307129, 0.0016520023345947266, 0.0017876029014587402, 0.001923203468322754, 0.0020588040351867676, 0.0021944046020507812, 0.002330005168914795, 0.0024656057357788086, 0.0026012063026428223, 0.002736806869506836, 0.0028724074363708496, 0.0030080080032348633, 0.003143608570098877, 0.0032792091369628906, 0.0034148097038269043, 0.003550410270690918, 0.0036860108375549316, 0.0038216114044189453, 0.003957211971282959, 0.004092812538146973, 0.004228413105010986, 0.004364013671875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 13.0, 20.0, 27.0, 58.0, 80.0, 99.0, 120.0, 138.0, 139.0, 105.0, 59.0, 42.0, 35.0, 23.0, 12.0, 13.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007266998291015625, -0.007012307643890381, -0.006757616996765137, -0.006502926349639893, -0.0062482357025146484, -0.005993545055389404, -0.00573885440826416, -0.005484163761138916, -0.005229473114013672, -0.004974782466888428, -0.004720091819763184, -0.0044654011726379395, -0.004210710525512695, -0.003956019878387451, -0.003701329231262207, -0.003446638584136963, -0.0031919479370117188, -0.0029372572898864746, -0.0026825666427612305, -0.0024278759956359863, -0.002173185348510742, -0.001918494701385498, -0.001663804054260254, -0.0014091134071350098, -0.0011544227600097656, -0.0008997321128845215, -0.0006450414657592773, -0.0003903508186340332, -0.00013566017150878906, 0.00011903047561645508, 0.0003737211227416992, 0.0006284117698669434, 0.0008831024169921875, 0.0011377930641174316, 0.0013924837112426758, 0.00164717435836792, 0.001901865005493164, 0.002156555652618408, 0.0024112462997436523, 0.0026659369468688965, 0.0029206275939941406, 0.0031753182411193848, 0.003430008888244629, 0.003684699535369873, 0.003939390182495117, 0.004194080829620361, 0.0044487714767456055, 0.00470346212387085, 0.004958152770996094, 0.005212843418121338, 0.005467534065246582, 0.005722224712371826, 0.00597691535949707, 0.0062316060066223145, 0.006486296653747559, 0.006740987300872803, 0.006995677947998047, 0.007250368595123291, 0.007505059242248535, 0.007759749889373779, 0.008014440536499023, 0.008269131183624268, 0.008523821830749512, 0.008778512477874756, 0.009033203125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 9.0, 4.0, 9.0, 12.0, 14.0, 26.0, 35.0, 66.0, 76.0, 91.0, 144.0, 215.0, 297.0, 525.0, 1034.0, 2885.0, 14107.0, 100670.0, 700285.0, 195442.0, 25053.0, 4567.0, 1388.0, 597.0, 387.0, 210.0, 112.0, 83.0, 66.0, 53.0, 27.0, 24.0, 10.0, 11.0, 9.0, 2.0, 4.0, 2.0, 2.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007518768310546875, -0.007265269756317139, -0.007011771202087402, -0.006758272647857666, -0.00650477409362793, -0.006251275539398193, -0.005997776985168457, -0.005744278430938721, -0.005490779876708984, -0.005237281322479248, -0.004983782768249512, -0.004730284214019775, -0.004476785659790039, -0.004223287105560303, -0.003969788551330566, -0.00371628999710083, -0.0034627914428710938, -0.0032092928886413574, -0.002955794334411621, -0.0027022957801818848, -0.0024487972259521484, -0.002195298671722412, -0.0019418001174926758, -0.0016883015632629395, -0.0014348030090332031, -0.0011813044548034668, -0.0009278059005737305, -0.0006743073463439941, -0.0004208087921142578, -0.00016731023788452148, 8.618831634521484e-05, 0.00033968687057495117, 0.0005931854248046875, 0.0008466839790344238, 0.0011001825332641602, 0.0013536810874938965, 0.0016071796417236328, 0.0018606781959533691, 0.0021141767501831055, 0.002367675304412842, 0.002621173858642578, 0.0028746724128723145, 0.0031281709671020508, 0.003381669521331787, 0.0036351680755615234, 0.0038886666297912598, 0.004142165184020996, 0.004395663738250732, 0.004649162292480469, 0.004902660846710205, 0.005156159400939941, 0.005409657955169678, 0.005663156509399414, 0.00591665506362915, 0.006170153617858887, 0.006423652172088623, 0.006677150726318359, 0.006930649280548096, 0.007184147834777832, 0.007437646389007568, 0.007691144943237305, 0.007944643497467041, 0.008198142051696777, 0.008451640605926514, 0.00870513916015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 6.0, 4.0, 9.0, 8.0, 13.0, 15.0, 21.0, 16.0, 18.0, 33.0, 27.0, 34.0, 47.0, 61.0, 56.0, 40.0, 59.0, 55.0, 71.0, 53.0, 52.0, 53.0, 33.0, 40.0, 38.0, 37.0, 26.0, 23.0, 11.0, 12.0, 9.0, 9.0, 4.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01279449462890625, -0.01235342025756836, -0.011912345886230469, -0.011471271514892578, -0.011030197143554688, -0.010589122772216797, -0.010148048400878906, -0.009706974029541016, -0.009265899658203125, -0.008824825286865234, -0.008383750915527344, -0.007942676544189453, -0.0075016021728515625, -0.007060527801513672, -0.006619453430175781, -0.006178379058837891, -0.0057373046875, -0.005296230316162109, -0.004855155944824219, -0.004414081573486328, -0.0039730072021484375, -0.003531932830810547, -0.0030908584594726562, -0.0026497840881347656, -0.002208709716796875, -0.0017676353454589844, -0.0013265609741210938, -0.0008854866027832031, -0.0004444122314453125, -3.337860107421875e-06, 0.00043773651123046875, 0.0008788108825683594, 0.00131988525390625, 0.0017609596252441406, 0.0022020339965820312, 0.002643108367919922, 0.0030841827392578125, 0.003525257110595703, 0.003966331481933594, 0.004407405853271484, 0.004848480224609375, 0.005289554595947266, 0.005730628967285156, 0.006171703338623047, 0.0066127777099609375, 0.007053852081298828, 0.007494926452636719, 0.00793600082397461, 0.0083770751953125, 0.00881814956665039, 0.009259223937988281, 0.009700298309326172, 0.010141372680664062, 0.010582447052001953, 0.011023521423339844, 0.011464595794677734, 0.011905670166015625, 0.012346744537353516, 0.012787818908691406, 0.013228893280029297, 0.013669967651367188, 0.014111042022705078, 0.014552116394042969, 0.01499319076538086, 0.01543426513671875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 6.0, 10.0, 16.0, 12.0, 12.0, 27.0, 40.0, 65.0, 85.0, 119.0, 225.0, 319.0, 563.0, 975.0, 1988.0, 4015.0, 9436.0, 23828.0, 69410.0, 240658.0, 544790.0, 97648.0, 31869.0, 11990.0, 5115.0, 2319.0, 1245.0, 690.0, 382.0, 219.0, 141.0, 93.0, 62.0, 43.0, 38.0, 27.0, 14.0, 12.0, 14.0, 11.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010242462158203125, -0.0009913593530654907, -0.0009584724903106689, -0.0009255856275558472, -0.0008926987648010254, -0.0008598119020462036, -0.0008269250392913818, -0.0007940381765365601, -0.0007611513137817383, -0.0007282644510269165, -0.0006953775882720947, -0.000662490725517273, -0.0006296038627624512, -0.0005967170000076294, -0.0005638301372528076, -0.0005309432744979858, -0.0004980564117431641, -0.0004651695489883423, -0.0004322826862335205, -0.00039939582347869873, -0.00036650896072387695, -0.0003336220979690552, -0.0003007352352142334, -0.0002678483724594116, -0.00023496150970458984, -0.00020207464694976807, -0.0001691877841949463, -0.0001363009214401245, -0.00010341405868530273, -7.052719593048096e-05, -3.764033317565918e-05, -4.753470420837402e-06, 2.8133392333984375e-05, 6.102025508880615e-05, 9.390711784362793e-05, 0.0001267939805984497, 0.00015968084335327148, 0.00019256770610809326, 0.00022545456886291504, 0.0002583414316177368, 0.0002912282943725586, 0.00032411515712738037, 0.00035700201988220215, 0.0003898888826370239, 0.0004227757453918457, 0.0004556626081466675, 0.0004885494709014893, 0.000521436333656311, 0.0005543231964111328, 0.0005872100591659546, 0.0006200969219207764, 0.0006529837846755981, 0.0006858706474304199, 0.0007187575101852417, 0.0007516443729400635, 0.0007845312356948853, 0.000817418098449707, 0.0008503049612045288, 0.0008831918239593506, 0.0009160786867141724, 0.0009489655494689941, 0.000981852412223816, 0.0010147392749786377, 0.0010476261377334595, 0.0010805130004882812]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 5.0, 7.0, 2.0, 11.0, 12.0, 6.0, 13.0, 18.0, 18.0, 28.0, 27.0, 19.0, 17.0, 37.0, 40.0, 29.0, 51.0, 37.0, 53.0, 21.0, 51.0, 49.0, 34.0, 48.0, 53.0, 33.0, 30.0, 39.0, 46.0, 9.0, 33.0, 24.0, 10.0, 19.0, 19.0, 14.0, 11.0, 9.0, 8.0, 2.0, 6.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.2782554626464844e-06, -3.1767413020133972e-06, -3.07522714138031e-06, -2.973712980747223e-06, -2.8721988201141357e-06, -2.7706846594810486e-06, -2.6691704988479614e-06, -2.5676563382148743e-06, -2.466142177581787e-06, -2.3646280169487e-06, -2.263113856315613e-06, -2.1615996956825256e-06, -2.0600855350494385e-06, -1.9585713744163513e-06, -1.8570572137832642e-06, -1.755543053150177e-06, -1.6540288925170898e-06, -1.5525147318840027e-06, -1.4510005712509155e-06, -1.3494864106178284e-06, -1.2479722499847412e-06, -1.146458089351654e-06, -1.044943928718567e-06, -9.434297680854797e-07, -8.419156074523926e-07, -7.404014468193054e-07, -6.388872861862183e-07, -5.373731255531311e-07, -4.3585896492004395e-07, -3.343448042869568e-07, -2.3283064365386963e-07, -1.3131648302078247e-07, -2.9802322387695312e-08, 7.171183824539185e-08, 1.73225998878479e-07, 2.7474015951156616e-07, 3.762543201446533e-07, 4.777684807777405e-07, 5.792826414108276e-07, 6.807968020439148e-07, 7.82310962677002e-07, 8.838251233100891e-07, 9.853392839431763e-07, 1.0868534445762634e-06, 1.1883676052093506e-06, 1.2898817658424377e-06, 1.391395926475525e-06, 1.492910087108612e-06, 1.5944242477416992e-06, 1.6959384083747864e-06, 1.7974525690078735e-06, 1.8989667296409607e-06, 2.000480890274048e-06, 2.101995050907135e-06, 2.203509211540222e-06, 2.3050233721733093e-06, 2.4065375328063965e-06, 2.5080516934394836e-06, 2.609565854072571e-06, 2.711080014705658e-06, 2.812594175338745e-06, 2.9141083359718323e-06, 3.0156224966049194e-06, 3.1171366572380066e-06, 3.2186508178710938e-06]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 11.0, 10.0, 11.0, 14.0, 15.0, 23.0, 24.0, 41.0, 48.0, 74.0, 134.0, 160.0, 263.0, 422.0, 743.0, 1444.0, 3156.0, 7919.0, 21241.0, 65472.0, 242010.0, 556248.0, 99473.0, 30298.0, 10812.0, 4184.0, 1892.0, 950.0, 512.0, 307.0, 197.0, 121.0, 86.0, 60.0, 46.0, 33.0, 20.0, 16.0, 18.0, 8.0, 9.0, 9.0, 8.0, 6.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.0011358261108398438, -0.0011025816202163696, -0.0010693371295928955, -0.0010360926389694214, -0.0010028481483459473, -0.0009696036577224731, -0.000936359167098999, -0.0009031146764755249, -0.0008698701858520508, -0.0008366256952285767, -0.0008033812046051025, -0.0007701367139816284, -0.0007368922233581543, -0.0007036477327346802, -0.0006704032421112061, -0.0006371587514877319, -0.0006039142608642578, -0.0005706697702407837, -0.0005374252796173096, -0.0005041807889938354, -0.00047093629837036133, -0.0004376918077468872, -0.0004044473171234131, -0.00037120282649993896, -0.00033795833587646484, -0.0003047138452529907, -0.0002714693546295166, -0.00023822486400604248, -0.00020498037338256836, -0.00017173588275909424, -0.00013849139213562012, -0.000105246901512146, -7.200241088867188e-05, -3.8757920265197754e-05, -5.513429641723633e-06, 2.7731060981750488e-05, 6.097555160522461e-05, 9.422004222869873e-05, 0.00012746453285217285, 0.00016070902347564697, 0.0001939535140991211, 0.00022719800472259521, 0.00026044249534606934, 0.00029368698596954346, 0.0003269314765930176, 0.0003601759672164917, 0.0003934204578399658, 0.00042666494846343994, 0.00045990943908691406, 0.0004931539297103882, 0.0005263984203338623, 0.0005596429109573364, 0.0005928874015808105, 0.0006261318922042847, 0.0006593763828277588, 0.0006926208734512329, 0.000725865364074707, 0.0007591098546981812, 0.0007923543453216553, 0.0008255988359451294, 0.0008588433265686035, 0.0008920878171920776, 0.0009253323078155518, 0.0009585767984390259, 0.0009918212890625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 6.0, 7.0, 5.0, 10.0, 6.0, 10.0, 11.0, 20.0, 23.0, 31.0, 25.0, 43.0, 47.0, 50.0, 53.0, 76.0, 71.0, 64.0, 64.0, 52.0, 62.0, 49.0, 39.0, 41.0, 25.0, 18.0, 16.0, 8.0, 10.0, 9.0, 9.0, 5.0, 2.0, 7.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013856887817382812, -0.0013398975133895874, -0.0012941062450408936, -0.0012483149766921997, -0.0012025237083435059, -0.001156732439994812, -0.0011109411716461182, -0.0010651499032974243, -0.0010193586349487305, -0.0009735673666000366, -0.0009277760982513428, -0.0008819848299026489, -0.0008361935615539551, -0.0007904022932052612, -0.0007446110248565674, -0.0006988197565078735, -0.0006530284881591797, -0.0006072372198104858, -0.000561445951461792, -0.0005156546831130981, -0.0004698634147644043, -0.00042407214641571045, -0.0003782808780670166, -0.00033248960971832275, -0.0002866983413696289, -0.00024090707302093506, -0.0001951158046722412, -0.00014932453632354736, -0.00010353326797485352, -5.774199962615967e-05, -1.195073127746582e-05, 3.384053707122803e-05, 7.963180541992188e-05, 0.00012542307376861572, 0.00017121434211730957, 0.00021700561046600342, 0.00026279687881469727, 0.0003085881471633911, 0.00035437941551208496, 0.0004001706838607788, 0.00044596195220947266, 0.0004917532205581665, 0.0005375444889068604, 0.0005833357572555542, 0.000629127025604248, 0.0006749182939529419, 0.0007207095623016357, 0.0007665008306503296, 0.0008122920989990234, 0.0008580833673477173, 0.0009038746356964111, 0.000949665904045105, 0.0009954571723937988, 0.0010412484407424927, 0.0010870397090911865, 0.0011328309774398804, 0.0011786222457885742, 0.001224413514137268, 0.001270204782485962, 0.0013159960508346558, 0.0013617873191833496, 0.0014075785875320435, 0.0014533698558807373, 0.0014991611242294312, 0.001544952392578125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 14.0, 16.0, 31.0, 56.0, 79.0, 132.0, 238.0, 179.0, 91.0, 56.0, 39.0, 18.0, 13.0, 9.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05052497237920761, -0.04925081506371498, -0.04797666147351265, -0.04670250415802002, -0.04542835056781769, -0.04415419325232506, -0.04288003593683243, -0.041605882346630096, -0.040331725031137466, -0.039057567715644836, -0.037783414125442505, -0.036509256809949875, -0.03523510321974754, -0.03396094590425491, -0.03268679231405258, -0.03141263499855995, -0.03013847954571247, -0.02886432409286499, -0.02759016864001751, -0.02631601318717003, -0.0250418558716774, -0.023767700418829918, -0.022493544965982437, -0.021219387650489807, -0.019945234060287476, -0.018671078607439995, -0.017396923154592514, -0.016122765839099884, -0.014848610386252403, -0.013574454933404922, -0.012300299480557442, -0.011026143096387386, -0.00975198857486248, -0.008477833122015, -0.007203676737844944, -0.005929521284997463, -0.004655365366488695, -0.003381209447979927, -0.0021070539951324463, -0.0008328976109623909, 0.0004412578418850899, 0.0017154136439785361, 0.0029895694460719824, 0.004263725131750107, 0.005537881050258875, 0.006812036968767643, 0.008086192421615124, 0.00936034880578518, 0.01063450425863266, 0.01190865971148014, 0.013182816095650196, 0.014456971548497677, 0.015731127932667732, 0.017005283385515213, 0.018279438838362694, 0.019553594291210175, 0.020827751606702805, 0.022101907059550285, 0.023376062512397766, 0.024650219827890396, 0.025924375280737877, 0.027198530733585358, 0.02847268618643284, 0.02974684163928032, 0.0310209970921278]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 6.0, 5.0, 5.0, 9.0, 11.0, 13.0, 15.0, 15.0, 11.0, 22.0, 16.0, 29.0, 30.0, 34.0, 21.0, 32.0, 30.0, 34.0, 66.0, 93.0, 81.0, 57.0, 31.0, 39.0, 22.0, 32.0, 31.0, 21.0, 19.0, 19.0, 19.0, 16.0, 20.0, 12.0, 12.0, 4.0, 13.0, 7.0, 7.0, 6.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03422337770462036, -0.03304683044552803, -0.0318702831864357, -0.03069373220205307, -0.02951718494296074, -0.028340637683868408, -0.027164088562130928, -0.025987539440393448, -0.024810992181301117, -0.023634444922208786, -0.022457895800471306, -0.021281346678733826, -0.020104799419641495, -0.018928252160549164, -0.017751703038811684, -0.016575153917074203, -0.015398606657981873, -0.014222058467566967, -0.013045510277152061, -0.011868962086737156, -0.01069241389632225, -0.009515865705907345, -0.00833931751549244, -0.007162769325077534, -0.005986221134662628, -0.004809672944247723, -0.003633124753832817, -0.0024565765634179115, -0.001280028373003006, -0.00010348018258810043, 0.0010730680078268051, 0.0022496161982417107, 0.003426164388656616, 0.004602712579071522, 0.005779260769486427, 0.006955808959901333, 0.008132357150316238, 0.009308905340731144, 0.01048545353114605, 0.011662001721560955, 0.01283854991197586, 0.014015098102390766, 0.015191646292805672, 0.016368195414543152, 0.017544742673635483, 0.018721289932727814, 0.019897839054465294, 0.021074388176202774, 0.022250935435295105, 0.023427482694387436, 0.024604031816124916, 0.025780580937862396, 0.026957128196954727, 0.028133675456047058, 0.02931022457778454, 0.03048677369952202, 0.03166332095861435, 0.03283986821770668, 0.03401641547679901, 0.03519296646118164, 0.03636951372027397, 0.0375460609793663, 0.03872261196374893, 0.03989915922284126, 0.041075706481933594]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 12.0, 9.0, 15.0, 26.0, 44.0, 61.0, 79.0, 132.0, 212.0, 393.0, 1208.0, 3823.0, 18501.0, 398648.0, 3593385.0, 164107.0, 9893.0, 2313.0, 603.0, 288.0, 157.0, 123.0, 77.0, 58.0, 33.0, 20.0, 21.0, 12.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00762176513671875, -0.007393479347229004, -0.007165193557739258, -0.006936907768249512, -0.006708621978759766, -0.0064803361892700195, -0.0062520503997802734, -0.006023764610290527, -0.005795478820800781, -0.005567193031311035, -0.005338907241821289, -0.005110621452331543, -0.004882335662841797, -0.004654049873352051, -0.004425764083862305, -0.004197478294372559, -0.0039691925048828125, -0.0037409067153930664, -0.0035126209259033203, -0.0032843351364135742, -0.003056049346923828, -0.002827763557434082, -0.002599477767944336, -0.00237119197845459, -0.0021429061889648438, -0.0019146203994750977, -0.0016863346099853516, -0.0014580488204956055, -0.0012297630310058594, -0.0010014772415161133, -0.0007731914520263672, -0.0005449056625366211, -0.000316619873046875, -8.83340835571289e-05, 0.0001399517059326172, 0.0003682374954223633, 0.0005965232849121094, 0.0008248090744018555, 0.0010530948638916016, 0.0012813806533813477, 0.0015096664428710938, 0.0017379522323608398, 0.001966238021850586, 0.002194523811340332, 0.002422809600830078, 0.0026510953903198242, 0.0028793811798095703, 0.0031076669692993164, 0.0033359527587890625, 0.0035642385482788086, 0.0037925243377685547, 0.004020810127258301, 0.004249095916748047, 0.004477381706237793, 0.004705667495727539, 0.004933953285217285, 0.005162239074707031, 0.005390524864196777, 0.0056188106536865234, 0.0058470964431762695, 0.006075382232666016, 0.006303668022155762, 0.006531953811645508, 0.006760239601135254, 0.006988525390625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 10.0, 9.0, 9.0, 23.0, 27.0, 60.0, 67.0, 85.0, 126.0, 152.0, 116.0, 97.0, 90.0, 49.0, 26.0, 22.0, 16.0, 9.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007266998291015625, -0.007013142108917236, -0.006759285926818848, -0.006505429744720459, -0.00625157356262207, -0.005997717380523682, -0.005743861198425293, -0.005490005016326904, -0.005236148834228516, -0.004982292652130127, -0.004728436470031738, -0.00447458028793335, -0.004220724105834961, -0.003966867923736572, -0.0037130117416381836, -0.003459155559539795, -0.0032052993774414062, -0.0029514431953430176, -0.002697587013244629, -0.0024437308311462402, -0.0021898746490478516, -0.0019360184669494629, -0.0016821622848510742, -0.0014283061027526855, -0.0011744499206542969, -0.0009205937385559082, -0.0006667375564575195, -0.00041288137435913086, -0.0001590251922607422, 9.483098983764648e-05, 0.00034868717193603516, 0.0006025433540344238, 0.0008563995361328125, 0.0011102557182312012, 0.0013641119003295898, 0.0016179680824279785, 0.0018718242645263672, 0.002125680446624756, 0.0023795366287231445, 0.002633392810821533, 0.002887248992919922, 0.0031411051750183105, 0.0033949613571166992, 0.003648817539215088, 0.0039026737213134766, 0.004156529903411865, 0.004410386085510254, 0.004664242267608643, 0.004918098449707031, 0.00517195463180542, 0.005425810813903809, 0.005679666996002197, 0.005933523178100586, 0.006187379360198975, 0.006441235542297363, 0.006695091724395752, 0.006948947906494141, 0.007202804088592529, 0.007456660270690918, 0.007710516452789307, 0.007964372634887695, 0.008218228816986084, 0.008472084999084473, 0.008725941181182861, 0.00897979736328125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 5.0, 4.0, 3.0, 5.0, 16.0, 23.0, 44.0, 70.0, 164.0, 297.0, 724.0, 2481.0, 22229.0, 3891278.0, 268545.0, 6138.0, 1291.0, 457.0, 227.0, 134.0, 58.0, 33.0, 26.0, 11.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.01273345947265625, -0.01239621639251709, -0.01205897331237793, -0.01172173023223877, -0.01138448715209961, -0.01104724407196045, -0.010710000991821289, -0.010372757911682129, -0.010035514831542969, -0.009698271751403809, -0.009361028671264648, -0.009023785591125488, -0.008686542510986328, -0.008349299430847168, -0.008012056350708008, -0.007674813270568848, -0.0073375701904296875, -0.007000327110290527, -0.006663084030151367, -0.006325840950012207, -0.005988597869873047, -0.005651354789733887, -0.0053141117095947266, -0.004976868629455566, -0.004639625549316406, -0.004302382469177246, -0.003965139389038086, -0.0036278963088989258, -0.0032906532287597656, -0.0029534101486206055, -0.0026161670684814453, -0.002278923988342285, -0.001941680908203125, -0.0016044378280639648, -0.0012671947479248047, -0.0009299516677856445, -0.0005927085876464844, -0.0002554655075073242, 8.177757263183594e-05, 0.0004190206527709961, 0.0007562637329101562, 0.0010935068130493164, 0.0014307498931884766, 0.0017679929733276367, 0.002105236053466797, 0.002442479133605957, 0.002779722213745117, 0.0031169652938842773, 0.0034542083740234375, 0.0037914514541625977, 0.004128694534301758, 0.004465937614440918, 0.004803180694580078, 0.005140423774719238, 0.0054776668548583984, 0.005814909934997559, 0.006152153015136719, 0.006489396095275879, 0.006826639175415039, 0.007163882255554199, 0.007501125335693359, 0.00783836841583252, 0.00817561149597168, 0.00851285457611084, 0.00885009765625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 5.0, 10.0, 18.0, 26.0, 57.0, 144.0, 342.0, 728.0, 1090.0, 849.0, 464.0, 176.0, 73.0, 30.0, 29.0, 14.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005584716796875, -0.005314230918884277, -0.005043745040893555, -0.004773259162902832, -0.004502773284912109, -0.004232287406921387, -0.003961801528930664, -0.0036913156509399414, -0.0034208297729492188, -0.003150343894958496, -0.0028798580169677734, -0.0026093721389770508, -0.002338886260986328, -0.0020684003829956055, -0.0017979145050048828, -0.0015274286270141602, -0.0012569427490234375, -0.0009864568710327148, -0.0007159709930419922, -0.00044548511505126953, -0.00017499923706054688, 9.548664093017578e-05, 0.00036597251892089844, 0.0006364583969116211, 0.0009069442749023438, 0.0011774301528930664, 0.001447916030883789, 0.0017184019088745117, 0.0019888877868652344, 0.002259373664855957, 0.0025298595428466797, 0.0028003454208374023, 0.003070831298828125, 0.0033413171768188477, 0.0036118030548095703, 0.003882288932800293, 0.004152774810791016, 0.004423260688781738, 0.004693746566772461, 0.004964232444763184, 0.005234718322753906, 0.005505204200744629, 0.0057756900787353516, 0.006046175956726074, 0.006316661834716797, 0.0065871477127075195, 0.006857633590698242, 0.007128119468688965, 0.0073986053466796875, 0.00766909122467041, 0.007939577102661133, 0.008210062980651855, 0.008480548858642578, 0.0087510347366333, 0.009021520614624023, 0.009292006492614746, 0.009562492370605469, 0.009832978248596191, 0.010103464126586914, 0.010373950004577637, 0.01064443588256836, 0.010914921760559082, 0.011185407638549805, 0.011455893516540527, 0.01172637939453125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 5.0, 8.0, 21.0, 22.0, 41.0, 64.0, 93.0, 107.0, 163.0, 130.0, 92.0, 92.0, 42.0, 42.0, 18.0, 17.0, 4.0, 14.0, 5.0, 1.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.02202855423092842, -0.020994314923882484, -0.0199600737541914, -0.018925834447145462, -0.017891593277454376, -0.01685735397040844, -0.015823114663362503, -0.014788874424993992, -0.01375463418662548, -0.01272039394825697, -0.011686153709888458, -0.010651914402842522, -0.00961767416447401, -0.0085834339261055, -0.007549194153398275, -0.0065149543806910515, -0.00548071414232254, -0.004446473903954029, -0.003412234131246805, -0.0023779941257089376, -0.00134375412017107, -0.0003095138818025589, 0.000724725890904665, 0.0017589656636118889, 0.0027932059019804, 0.0038274459075182676, 0.004861685913056135, 0.005895925685763359, 0.00693016592413187, 0.007964406162500381, 0.008998645469546318, 0.01003288570791483, 0.011067129671573639, 0.01210136990994215, 0.013135610148310661, 0.014169849455356598, 0.015204089693725109, 0.01623832993209362, 0.017272569239139557, 0.018306810408830643, 0.01934104971587658, 0.020375289022922516, 0.0214095301926136, 0.02244376949965954, 0.023478008806705475, 0.02451224997639656, 0.025546489283442497, 0.026580728590488434, 0.02761496976017952, 0.028649209067225456, 0.029683450236916542, 0.03071768954396248, 0.031751930713653564, 0.03278616815805435, 0.03382040932774544, 0.03485465049743652, 0.03588888794183731, 0.0369231291115284, 0.037957366555929184, 0.03899160772562027, 0.040025848895311356, 0.04106009006500244, 0.04209432750940323, 0.043128568679094315, 0.0441628098487854]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 5.0, 10.0, 7.0, 12.0, 8.0, 12.0, 17.0, 17.0, 17.0, 20.0, 25.0, 34.0, 24.0, 41.0, 51.0, 57.0, 36.0, 45.0, 57.0, 60.0, 48.0, 45.0, 50.0, 40.0, 43.0, 34.0, 24.0, 26.0, 10.0, 16.0, 13.0, 14.0, 17.0, 10.0, 9.0, 10.0, 10.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.019015789031982422, -0.01829322800040245, -0.01757066510617733, -0.01684810221195221, -0.016125541180372238, -0.015402979217469692, -0.014680417254567146, -0.0139578552916646, -0.013235293328762054, -0.012512731365859509, -0.011790169402956963, -0.011067607440054417, -0.01034504547715187, -0.009622483514249325, -0.008899921551346779, -0.008177359588444233, -0.007454797625541687, -0.006732235662639141, -0.006009673699736595, -0.005287111736834049, -0.004564549773931503, -0.0038419878110289574, -0.0031194258481264114, -0.0023968638852238655, -0.0016743019223213196, -0.0009517399594187737, -0.00022917799651622772, 0.0004933839663863182, 0.0012159459292888641, 0.00193850789219141, 0.002661069855093956, 0.003383631817996502, 0.004106193780899048, 0.004828755743801594, 0.00555131770670414, 0.006273879669606686, 0.006996441632509232, 0.0077190035954117775, 0.008441565558314323, 0.00916412752121687, 0.009886689484119415, 0.010609251447021961, 0.011331813409924507, 0.012054375372827053, 0.012776937335729599, 0.013499499298632145, 0.01422206126153469, 0.014944623224437237, 0.015667185187339783, 0.016389746218919754, 0.017112309113144875, 0.017834872007369995, 0.018557433038949966, 0.019279994070529938, 0.02000255696475506, 0.02072511985898018, 0.02144768089056015, 0.02217024192214012, 0.022892804816365242, 0.023615367710590363, 0.024337928742170334, 0.025060489773750305, 0.025783052667975426, 0.026505615562200546, 0.027228176593780518]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 2.0, 7.0, 5.0, 8.0, 14.0, 18.0, 24.0, 18.0, 52.0, 57.0, 93.0, 137.0, 195.0, 366.0, 717.0, 1382.0, 3015.0, 7844.0, 24992.0, 107828.0, 497145.0, 316374.0, 61892.0, 16169.0, 5405.0, 2276.0, 1053.0, 585.0, 302.0, 194.0, 124.0, 74.0, 55.0, 36.0, 27.0, 13.0, 16.0, 14.0, 9.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.007717132568359375, -0.00748896598815918, -0.007260799407958984, -0.007032632827758789, -0.006804466247558594, -0.0065762996673583984, -0.006348133087158203, -0.006119966506958008, -0.0058917999267578125, -0.005663633346557617, -0.005435466766357422, -0.0052073001861572266, -0.004979133605957031, -0.004750967025756836, -0.004522800445556641, -0.004294633865356445, -0.00406646728515625, -0.0038383007049560547, -0.0036101341247558594, -0.003381967544555664, -0.0031538009643554688, -0.0029256343841552734, -0.002697467803955078, -0.002469301223754883, -0.0022411346435546875, -0.002012968063354492, -0.0017848014831542969, -0.0015566349029541016, -0.0013284683227539062, -0.001100301742553711, -0.0008721351623535156, -0.0006439685821533203, -0.000415802001953125, -0.0001876354217529297, 4.0531158447265625e-05, 0.00026869773864746094, 0.0004968643188476562, 0.0007250308990478516, 0.0009531974792480469, 0.0011813640594482422, 0.0014095306396484375, 0.0016376972198486328, 0.0018658638000488281, 0.0020940303802490234, 0.0023221969604492188, 0.002550363540649414, 0.0027785301208496094, 0.0030066967010498047, 0.00323486328125, 0.0034630298614501953, 0.0036911964416503906, 0.003919363021850586, 0.004147529602050781, 0.0043756961822509766, 0.004603862762451172, 0.004832029342651367, 0.0050601959228515625, 0.005288362503051758, 0.005516529083251953, 0.0057446956634521484, 0.005972862243652344, 0.006201028823852539, 0.006429195404052734, 0.00665736198425293, 0.006885528564453125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 5.0, 15.0, 20.0, 33.0, 64.0, 81.0, 116.0, 96.0, 143.0, 119.0, 101.0, 69.0, 63.0, 20.0, 17.0, 19.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007251739501953125, -0.006996810436248779, -0.006741881370544434, -0.006486952304840088, -0.006232023239135742, -0.0059770941734313965, -0.005722165107727051, -0.005467236042022705, -0.005212306976318359, -0.004957377910614014, -0.004702448844909668, -0.004447519779205322, -0.0041925907135009766, -0.003937661647796631, -0.003682732582092285, -0.0034278035163879395, -0.0031728744506835938, -0.002917945384979248, -0.0026630163192749023, -0.0024080872535705566, -0.002153158187866211, -0.0018982291221618652, -0.0016433000564575195, -0.0013883709907531738, -0.0011334419250488281, -0.0008785128593444824, -0.0006235837936401367, -0.000368654727935791, -0.00011372566223144531, 0.0001412034034729004, 0.0003961324691772461, 0.0006510615348815918, 0.0009059906005859375, 0.0011609196662902832, 0.001415848731994629, 0.0016707777976989746, 0.0019257068634033203, 0.002180635929107666, 0.0024355649948120117, 0.0026904940605163574, 0.002945423126220703, 0.003200352191925049, 0.0034552812576293945, 0.0037102103233337402, 0.003965139389038086, 0.004220068454742432, 0.004474997520446777, 0.004729926586151123, 0.004984855651855469, 0.0052397847175598145, 0.00549471378326416, 0.005749642848968506, 0.0060045719146728516, 0.006259500980377197, 0.006514430046081543, 0.006769359111785889, 0.007024288177490234, 0.00727921724319458, 0.007534146308898926, 0.0077890753746032715, 0.008044004440307617, 0.008298933506011963, 0.008553862571716309, 0.008808791637420654, 0.009063720703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 2.0, 9.0, 12.0, 9.0, 10.0, 16.0, 23.0, 27.0, 50.0, 50.0, 101.0, 120.0, 173.0, 314.0, 499.0, 798.0, 1657.0, 4854.0, 23852.0, 219051.0, 724908.0, 57892.0, 8941.0, 2410.0, 1124.0, 619.0, 342.0, 210.0, 139.0, 94.0, 64.0, 41.0, 38.0, 25.0, 21.0, 21.0, 12.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00908660888671875, -0.008795499801635742, -0.008504390716552734, -0.008213281631469727, -0.007922172546386719, -0.007631063461303711, -0.007339954376220703, -0.007048845291137695, -0.0067577362060546875, -0.00646662712097168, -0.006175518035888672, -0.005884408950805664, -0.005593299865722656, -0.0053021907806396484, -0.005011081695556641, -0.004719972610473633, -0.004428863525390625, -0.004137754440307617, -0.0038466453552246094, -0.0035555362701416016, -0.0032644271850585938, -0.002973318099975586, -0.002682209014892578, -0.0023910999298095703, -0.0020999908447265625, -0.0018088817596435547, -0.0015177726745605469, -0.001226663589477539, -0.0009355545043945312, -0.0006444454193115234, -0.0003533363342285156, -6.222724914550781e-05, 0.0002288818359375, 0.0005199909210205078, 0.0008111000061035156, 0.0011022090911865234, 0.0013933181762695312, 0.001684427261352539, 0.001975536346435547, 0.0022666454315185547, 0.0025577545166015625, 0.0028488636016845703, 0.003139972686767578, 0.003431081771850586, 0.0037221908569335938, 0.0040132999420166016, 0.004304409027099609, 0.004595518112182617, 0.004886627197265625, 0.005177736282348633, 0.005468845367431641, 0.0057599544525146484, 0.006051063537597656, 0.006342172622680664, 0.006633281707763672, 0.00692439079284668, 0.0072154998779296875, 0.007506608963012695, 0.007797718048095703, 0.008088827133178711, 0.008379936218261719, 0.008671045303344727, 0.008962154388427734, 0.009253263473510742, 0.00954437255859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 2.0, 6.0, 4.0, 7.0, 13.0, 9.0, 18.0, 30.0, 30.0, 44.0, 32.0, 44.0, 69.0, 70.0, 61.0, 61.0, 65.0, 62.0, 58.0, 50.0, 55.0, 45.0, 31.0, 29.0, 22.0, 21.0, 16.0, 10.0, 9.0, 4.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01593017578125, -0.0154496431350708, -0.014969110488891602, -0.014488577842712402, -0.014008045196533203, -0.013527512550354004, -0.013046979904174805, -0.012566447257995605, -0.012085914611816406, -0.011605381965637207, -0.011124849319458008, -0.010644316673278809, -0.01016378402709961, -0.00968325138092041, -0.009202718734741211, -0.008722186088562012, -0.008241653442382812, -0.007761120796203613, -0.007280588150024414, -0.006800055503845215, -0.006319522857666016, -0.005838990211486816, -0.005358457565307617, -0.004877924919128418, -0.004397392272949219, -0.0039168596267700195, -0.0034363269805908203, -0.002955794334411621, -0.002475261688232422, -0.0019947290420532227, -0.0015141963958740234, -0.0010336637496948242, -0.000553131103515625, -7.259845733642578e-05, 0.00040793418884277344, 0.0008884668350219727, 0.0013689994812011719, 0.001849532127380371, 0.0023300647735595703, 0.0028105974197387695, 0.0032911300659179688, 0.003771662712097168, 0.004252195358276367, 0.004732728004455566, 0.005213260650634766, 0.005693793296813965, 0.006174325942993164, 0.006654858589172363, 0.0071353912353515625, 0.007615923881530762, 0.008096456527709961, 0.00857698917388916, 0.00905752182006836, 0.009538054466247559, 0.010018587112426758, 0.010499119758605957, 0.010979652404785156, 0.011460185050964355, 0.011940717697143555, 0.012421250343322754, 0.012901782989501953, 0.013382315635681152, 0.013862848281860352, 0.01434338092803955, 0.01482391357421875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 5.0, 8.0, 5.0, 9.0, 16.0, 23.0, 42.0, 52.0, 70.0, 140.0, 235.0, 419.0, 814.0, 2102.0, 6603.0, 29399.0, 224223.0, 710576.0, 57515.0, 10814.0, 3096.0, 1150.0, 513.0, 258.0, 185.0, 86.0, 59.0, 35.0, 28.0, 12.0, 12.0, 16.0, 6.0, 6.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.001682281494140625, -0.0016330629587173462, -0.0015838444232940674, -0.0015346258878707886, -0.0014854073524475098, -0.001436188817024231, -0.0013869702816009521, -0.0013377517461776733, -0.0012885332107543945, -0.0012393146753311157, -0.001190096139907837, -0.001140877604484558, -0.0010916590690612793, -0.0010424405336380005, -0.0009932219982147217, -0.0009440034627914429, -0.0008947849273681641, -0.0008455663919448853, -0.0007963478565216064, -0.0007471293210983276, -0.0006979107856750488, -0.00064869225025177, -0.0005994737148284912, -0.0005502551794052124, -0.0005010366439819336, -0.0004518181085586548, -0.000402599573135376, -0.00035338103771209717, -0.00030416250228881836, -0.00025494396686553955, -0.00020572543144226074, -0.00015650689601898193, -0.00010728836059570312, -5.8069825172424316e-05, -8.851289749145508e-06, 4.03672456741333e-05, 8.958578109741211e-05, 0.00013880431652069092, 0.00018802285194396973, 0.00023724138736724854, 0.00028645992279052734, 0.00033567845821380615, 0.00038489699363708496, 0.00043411552906036377, 0.0004833340644836426, 0.0005325525999069214, 0.0005817711353302002, 0.000630989670753479, 0.0006802082061767578, 0.0007294267416000366, 0.0007786452770233154, 0.0008278638124465942, 0.000877082347869873, 0.0009263008832931519, 0.0009755194187164307, 0.0010247379541397095, 0.0010739564895629883, 0.001123175024986267, 0.001172393560409546, 0.0012216120958328247, 0.0012708306312561035, 0.0013200491666793823, 0.0013692677021026611, 0.00141848623752594, 0.0014677047729492188]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 2.0, 5.0, 2.0, 5.0, 8.0, 8.0, 8.0, 20.0, 11.0, 18.0, 15.0, 21.0, 16.0, 37.0, 33.0, 50.0, 30.0, 76.0, 43.0, 80.0, 55.0, 56.0, 69.0, 43.0, 53.0, 27.0, 32.0, 27.0, 42.0, 20.0, 13.0, 19.0, 9.0, 9.0, 9.0, 6.0, 9.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.708766937255859e-06, -4.560686647891998e-06, -4.412606358528137e-06, -4.264526069164276e-06, -4.116445779800415e-06, -3.968365490436554e-06, -3.820285201072693e-06, -3.6722049117088318e-06, -3.5241246223449707e-06, -3.3760443329811096e-06, -3.2279640436172485e-06, -3.0798837542533875e-06, -2.9318034648895264e-06, -2.7837231755256653e-06, -2.635642886161804e-06, -2.487562596797943e-06, -2.339482307434082e-06, -2.191402018070221e-06, -2.04332172870636e-06, -1.8952414393424988e-06, -1.7471611499786377e-06, -1.5990808606147766e-06, -1.4510005712509155e-06, -1.3029202818870544e-06, -1.1548399925231934e-06, -1.0067597031593323e-06, -8.586794137954712e-07, -7.105991244316101e-07, -5.62518835067749e-07, -4.1443854570388794e-07, -2.6635825634002686e-07, -1.1827796697616577e-07, 2.9802322387695312e-08, 1.778826117515564e-07, 3.259629011154175e-07, 4.7404319047927856e-07, 6.221234798431396e-07, 7.702037692070007e-07, 9.182840585708618e-07, 1.066364347934723e-06, 1.214444637298584e-06, 1.362524926662445e-06, 1.5106052160263062e-06, 1.6586855053901672e-06, 1.8067657947540283e-06, 1.9548460841178894e-06, 2.1029263734817505e-06, 2.2510066628456116e-06, 2.3990869522094727e-06, 2.5471672415733337e-06, 2.695247530937195e-06, 2.843327820301056e-06, 2.991408109664917e-06, 3.139488399028778e-06, 3.287568688392639e-06, 3.4356489777565002e-06, 3.5837292671203613e-06, 3.7318095564842224e-06, 3.8798898458480835e-06, 4.027970135211945e-06, 4.176050424575806e-06, 4.324130713939667e-06, 4.472211003303528e-06, 4.620291292667389e-06, 4.76837158203125e-06]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 4.0, 0.0, 7.0, 5.0, 24.0, 11.0, 27.0, 31.0, 44.0, 77.0, 85.0, 140.0, 253.0, 427.0, 916.0, 2108.0, 5885.0, 22629.0, 155876.0, 756513.0, 81469.0, 14421.0, 4229.0, 1631.0, 722.0, 398.0, 210.0, 131.0, 72.0, 61.0, 49.0, 27.0, 24.0, 14.0, 11.0, 4.0, 8.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001369476318359375, -0.0013243556022644043, -0.0012792348861694336, -0.0012341141700744629, -0.0011889934539794922, -0.0011438727378845215, -0.0010987520217895508, -0.00105363130569458, -0.0010085105895996094, -0.0009633898735046387, -0.000918269157409668, -0.0008731484413146973, -0.0008280277252197266, -0.0007829070091247559, -0.0007377862930297852, -0.0006926655769348145, -0.0006475448608398438, -0.000602424144744873, -0.0005573034286499023, -0.0005121827125549316, -0.00046706199645996094, -0.00042194128036499023, -0.00037682056427001953, -0.00033169984817504883, -0.0002865791320800781, -0.00024145841598510742, -0.00019633769989013672, -0.00015121698379516602, -0.00010609626770019531, -6.097555160522461e-05, -1.5854835510253906e-05, 2.9265880584716797e-05, 7.43865966796875e-05, 0.0001195073127746582, 0.0001646280288696289, 0.0002097487449645996, 0.0002548694610595703, 0.000299990177154541, 0.0003451108932495117, 0.0003902316093444824, 0.0004353523254394531, 0.00048047304153442383, 0.0005255937576293945, 0.0005707144737243652, 0.0006158351898193359, 0.0006609559059143066, 0.0007060766220092773, 0.000751197338104248, 0.0007963180541992188, 0.0008414387702941895, 0.0008865594863891602, 0.0009316802024841309, 0.0009768009185791016, 0.0010219216346740723, 0.001067042350769043, 0.0011121630668640137, 0.0011572837829589844, 0.001202404499053955, 0.0012475252151489258, 0.0012926459312438965, 0.0013377666473388672, 0.0013828873634338379, 0.0014280080795288086, 0.0014731287956237793, 0.00151824951171875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 8.0, 10.0, 16.0, 25.0, 23.0, 36.0, 57.0, 69.0, 75.0, 95.0, 108.0, 93.0, 76.0, 74.0, 56.0, 44.0, 36.0, 19.0, 11.0, 20.0, 11.0, 10.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0020904541015625, -0.0020330101251602173, -0.0019755661487579346, -0.0019181221723556519, -0.0018606781959533691, -0.0018032342195510864, -0.0017457902431488037, -0.001688346266746521, -0.0016309022903442383, -0.0015734583139419556, -0.0015160143375396729, -0.0014585703611373901, -0.0014011263847351074, -0.0013436824083328247, -0.001286238431930542, -0.0012287944555282593, -0.0011713504791259766, -0.0011139065027236938, -0.0010564625263214111, -0.0009990185499191284, -0.0009415745735168457, -0.000884130597114563, -0.0008266866207122803, -0.0007692426443099976, -0.0007117986679077148, -0.0006543546915054321, -0.0005969107151031494, -0.0005394667387008667, -0.000482022762298584, -0.00042457878589630127, -0.00036713480949401855, -0.00030969083309173584, -0.0002522468566894531, -0.0001948028802871704, -0.0001373589038848877, -7.991492748260498e-05, -2.2470951080322266e-05, 3.497302532196045e-05, 9.241700172424316e-05, 0.00014986097812652588, 0.0002073049545288086, 0.0002647489309310913, 0.000322192907333374, 0.00037963688373565674, 0.00043708086013793945, 0.0004945248365402222, 0.0005519688129425049, 0.0006094127893447876, 0.0006668567657470703, 0.000724300742149353, 0.0007817447185516357, 0.0008391886949539185, 0.0008966326713562012, 0.0009540766477584839, 0.0010115206241607666, 0.0010689646005630493, 0.001126408576965332, 0.0011838525533676147, 0.0012412965297698975, 0.0012987405061721802, 0.0013561844825744629, 0.0014136284589767456, 0.0014710724353790283, 0.001528516411781311, 0.0015859603881835938]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 9.0, 26.0, 86.0, 198.0, 421.0, 166.0, 56.0, 19.0, 15.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0683184489607811, -0.06560777872800827, -0.06289711594581604, -0.06018644571304321, -0.057475775480270386, -0.05476510524749756, -0.05205443874001503, -0.0493437722325325, -0.046633101999759674, -0.04392243176698685, -0.04121176525950432, -0.03850109875202179, -0.03579042851924896, -0.033079758286476135, -0.030369091778993607, -0.02765842340886593, -0.02494775503873825, -0.022237086668610573, -0.019526418298482895, -0.016815749928355217, -0.014105081558227539, -0.011394413188099861, -0.008683744817972183, -0.005973076447844505, -0.0032624080777168274, -0.0005517397075891495, 0.0021589286625385284, 0.004869597032666206, 0.007580265402793884, 0.010290933772921562, 0.01300160214304924, 0.015712270513176918, 0.018422946333885193, 0.02113361470401287, 0.02384428307414055, 0.026554951444268227, 0.029265619814395905, 0.03197629004716873, 0.03468695655465126, 0.03739762306213379, 0.040108293294906616, 0.04281896352767944, 0.04552963003516197, 0.0482402965426445, 0.05095096677541733, 0.053661637008190155, 0.056372303515672684, 0.05908297002315521, 0.06179364025592804, 0.06450431048870087, 0.0672149807214737, 0.06992564350366592, 0.07263631373643875, 0.07534698396921158, 0.07805764675140381, 0.08076831698417664, 0.08347898721694946, 0.08618965744972229, 0.08890032768249512, 0.09161099046468735, 0.09432166069746017, 0.097032330930233, 0.09974299371242523, 0.10245366394519806, 0.10516433417797089]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 3.0, 5.0, 6.0, 12.0, 13.0, 14.0, 18.0, 26.0, 26.0, 26.0, 31.0, 29.0, 42.0, 77.0, 135.0, 154.0, 87.0, 38.0, 41.0, 33.0, 28.0, 24.0, 18.0, 21.0, 19.0, 17.0, 6.0, 14.0, 8.0, 7.0, 8.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05504107475280762, -0.053425658494234085, -0.05181024223566055, -0.05019482597708702, -0.04857940971851349, -0.04696399345993996, -0.045348577201366425, -0.04373316094279289, -0.04211774468421936, -0.04050232842564583, -0.038886912167072296, -0.037271495908498764, -0.03565607964992523, -0.0340406633913517, -0.03242524713277817, -0.030809830874204636, -0.029194414615631104, -0.02757899835705757, -0.02596358209848404, -0.024348165839910507, -0.022732749581336975, -0.021117333322763443, -0.01950191706418991, -0.01788650080561638, -0.016271084547042847, -0.014655668288469315, -0.013040252029895782, -0.01142483577132225, -0.009809419512748718, -0.008194003254175186, -0.006578586995601654, -0.004963170737028122, -0.00334775447845459, -0.0017323382198810577, -0.00011692196130752563, 0.0014984942972660065, 0.0031139105558395386, 0.004729326814413071, 0.006344743072986603, 0.007960159331560135, 0.009575575590133667, 0.011190991848707199, 0.012806408107280731, 0.014421824365854263, 0.016037240624427795, 0.017652656883001328, 0.01926807314157486, 0.02088348940014839, 0.022498905658721924, 0.024114321917295456, 0.025729738175868988, 0.02734515443444252, 0.028960570693016052, 0.030575986951589584, 0.032191403210163116, 0.03380681946873665, 0.03542223572731018, 0.03703765198588371, 0.038653068244457245, 0.04026848450303078, 0.04188390076160431, 0.04349931702017784, 0.04511473327875137, 0.046730149537324905, 0.04834556579589844]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 4.0, 7.0, 7.0, 10.0, 24.0, 28.0, 42.0, 55.0, 118.0, 270.0, 865.0, 1957.0, 4809.0, 15930.0, 95622.0, 1290094.0, 2515807.0, 236186.0, 22266.0, 6579.0, 2199.0, 700.0, 307.0, 129.0, 93.0, 61.0, 31.0, 24.0, 18.0, 20.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005218505859375, -0.005026519298553467, -0.004834532737731934, -0.0046425461769104, -0.004450559616088867, -0.004258573055267334, -0.004066586494445801, -0.0038745999336242676, -0.0036826133728027344, -0.003490626811981201, -0.003298640251159668, -0.0031066536903381348, -0.0029146671295166016, -0.0027226805686950684, -0.002530694007873535, -0.002338707447052002, -0.0021467208862304688, -0.0019547343254089355, -0.0017627477645874023, -0.0015707612037658691, -0.001378774642944336, -0.0011867880821228027, -0.0009948015213012695, -0.0008028149604797363, -0.0006108283996582031, -0.0004188418388366699, -0.00022685527801513672, -3.4868717193603516e-05, 0.0001571178436279297, 0.0003491044044494629, 0.0005410909652709961, 0.0007330775260925293, 0.0009250640869140625, 0.0011170506477355957, 0.001309037208557129, 0.0015010237693786621, 0.0016930103302001953, 0.0018849968910217285, 0.0020769834518432617, 0.002268970012664795, 0.002460956573486328, 0.0026529431343078613, 0.0028449296951293945, 0.0030369162559509277, 0.003228902816772461, 0.003420889377593994, 0.0036128759384155273, 0.0038048624992370605, 0.003996849060058594, 0.004188835620880127, 0.00438082218170166, 0.004572808742523193, 0.0047647953033447266, 0.00495678186416626, 0.005148768424987793, 0.005340754985809326, 0.005532741546630859, 0.005724728107452393, 0.005916714668273926, 0.006108701229095459, 0.006300687789916992, 0.006492674350738525, 0.006684660911560059, 0.006876647472381592, 0.007068634033203125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 13.0, 4.0, 13.0, 17.0, 45.0, 63.0, 90.0, 116.0, 125.0, 125.0, 110.0, 95.0, 62.0, 42.0, 31.0, 23.0, 17.0, 7.0, 6.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007251739501953125, -0.00699537992477417, -0.006739020347595215, -0.00648266077041626, -0.006226301193237305, -0.00596994161605835, -0.0057135820388793945, -0.0054572224617004395, -0.005200862884521484, -0.004944503307342529, -0.004688143730163574, -0.004431784152984619, -0.004175424575805664, -0.003919064998626709, -0.003662705421447754, -0.003406345844268799, -0.0031499862670898438, -0.0028936266899108887, -0.0026372671127319336, -0.0023809075355529785, -0.0021245479583740234, -0.0018681883811950684, -0.0016118288040161133, -0.0013554692268371582, -0.0010991096496582031, -0.000842750072479248, -0.000586390495300293, -0.0003300309181213379, -7.367134094238281e-05, 0.00018268823623657227, 0.00043904781341552734, 0.0006954073905944824, 0.0009517669677734375, 0.0012081265449523926, 0.0014644861221313477, 0.0017208456993103027, 0.001977205276489258, 0.002233564853668213, 0.002489924430847168, 0.002746284008026123, 0.003002643585205078, 0.003259003162384033, 0.0035153627395629883, 0.0037717223167419434, 0.0040280818939208984, 0.0042844414710998535, 0.004540801048278809, 0.004797160625457764, 0.005053520202636719, 0.005309879779815674, 0.005566239356994629, 0.005822598934173584, 0.006078958511352539, 0.006335318088531494, 0.006591677665710449, 0.006848037242889404, 0.007104396820068359, 0.0073607563972473145, 0.0076171159744262695, 0.007873475551605225, 0.00812983512878418, 0.008386194705963135, 0.00864255428314209, 0.008898913860321045, 0.0091552734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 8.0, 17.0, 32.0, 72.0, 196.0, 613.0, 3480.0, 4065049.0, 122162.0, 1904.0, 456.0, 157.0, 62.0, 37.0, 12.0, 13.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038604736328125, -0.03726673126220703, -0.03592872619628906, -0.034590721130371094, -0.033252716064453125, -0.031914710998535156, -0.030576705932617188, -0.02923870086669922, -0.02790069580078125, -0.02656269073486328, -0.025224685668945312, -0.023886680603027344, -0.022548675537109375, -0.021210670471191406, -0.019872665405273438, -0.01853466033935547, -0.0171966552734375, -0.01585865020751953, -0.014520645141601562, -0.013182640075683594, -0.011844635009765625, -0.010506629943847656, -0.009168624877929688, -0.007830619812011719, -0.00649261474609375, -0.005154609680175781, -0.0038166046142578125, -0.0024785995483398438, -0.001140594482421875, 0.00019741058349609375, 0.0015354156494140625, 0.0028734207153320312, 0.00421142578125, 0.005549430847167969, 0.0068874359130859375, 0.008225440979003906, 0.009563446044921875, 0.010901451110839844, 0.012239456176757812, 0.013577461242675781, 0.01491546630859375, 0.01625347137451172, 0.017591476440429688, 0.018929481506347656, 0.020267486572265625, 0.021605491638183594, 0.022943496704101562, 0.02428150177001953, 0.0256195068359375, 0.02695751190185547, 0.028295516967773438, 0.029633522033691406, 0.030971527099609375, 0.032309532165527344, 0.03364753723144531, 0.03498554229736328, 0.03632354736328125, 0.03766155242919922, 0.03899955749511719, 0.040337562561035156, 0.041675567626953125, 0.043013572692871094, 0.04435157775878906, 0.04568958282470703, 0.047027587890625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 5.0, 9.0, 10.0, 12.0, 24.0, 36.0, 61.0, 114.0, 225.0, 490.0, 1115.0, 1069.0, 459.0, 216.0, 102.0, 62.0, 24.0, 17.0, 11.0, 5.0, 11.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0099945068359375, -0.009407281875610352, -0.008820056915283203, -0.008232831954956055, -0.007645606994628906, -0.007058382034301758, -0.006471157073974609, -0.005883932113647461, -0.0052967071533203125, -0.004709482192993164, -0.004122257232666016, -0.003535032272338867, -0.0029478073120117188, -0.0023605823516845703, -0.0017733573913574219, -0.0011861324310302734, -0.000598907470703125, -1.1682510375976562e-05, 0.0005755424499511719, 0.0011627674102783203, 0.0017499923706054688, 0.002337217330932617, 0.0029244422912597656, 0.003511667251586914, 0.0040988922119140625, 0.004686117172241211, 0.005273342132568359, 0.005860567092895508, 0.006447792053222656, 0.007035017013549805, 0.007622241973876953, 0.008209466934204102, 0.00879669189453125, 0.009383916854858398, 0.009971141815185547, 0.010558366775512695, 0.011145591735839844, 0.011732816696166992, 0.01232004165649414, 0.012907266616821289, 0.013494491577148438, 0.014081716537475586, 0.014668941497802734, 0.015256166458129883, 0.01584339141845703, 0.01643061637878418, 0.017017841339111328, 0.017605066299438477, 0.018192291259765625, 0.018779516220092773, 0.019366741180419922, 0.01995396614074707, 0.02054119110107422, 0.021128416061401367, 0.021715641021728516, 0.022302865982055664, 0.022890090942382812, 0.02347731590270996, 0.02406454086303711, 0.024651765823364258, 0.025238990783691406, 0.025826215744018555, 0.026413440704345703, 0.02700066566467285, 0.027587890625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 4.0, 4.0, 7.0, 15.0, 46.0, 83.0, 135.0, 236.0, 208.0, 111.0, 63.0, 29.0, 14.0, 5.0, 10.0, 8.0, 4.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0895826444029808, -0.08583042770624161, -0.08207820355892181, -0.07832598686218262, -0.07457377016544342, -0.07082155346870422, -0.06706933677196503, -0.06331711262464523, -0.059564895927906036, -0.05581267923116684, -0.052060458809137344, -0.04830823838710785, -0.04455602169036865, -0.040803804993629456, -0.03705158457159996, -0.033299364149570465, -0.02954714745283127, -0.025794928893446922, -0.022042710334062576, -0.01829049177467823, -0.014538273215293884, -0.010786054655909538, -0.007033836096525192, -0.0032816175371408463, 0.00047060102224349976, 0.004222819581627846, 0.007975038141012192, 0.011727256700396538, 0.015479475259780884, 0.01923169381916523, 0.022983912378549576, 0.026736130937933922, 0.03048834204673767, 0.03424055874347687, 0.03799277916550636, 0.04174499958753586, 0.045497216284275055, 0.04924943298101425, 0.05300165340304375, 0.05675387382507324, 0.06050609052181244, 0.06425830721855164, 0.06801052391529083, 0.07176274806261063, 0.07551496475934982, 0.07926718145608902, 0.08301940560340881, 0.08677162230014801, 0.09052383899688721, 0.0942760556936264, 0.0980282723903656, 0.1017804965376854, 0.10553271323442459, 0.10928492993116379, 0.11303715407848358, 0.11678937077522278, 0.12054158747196198, 0.12429380416870117, 0.12804602086544037, 0.13179823756217957, 0.13555046916007996, 0.13930268585681915, 0.14305490255355835, 0.14680711925029755, 0.15055933594703674]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 9.0, 10.0, 21.0, 25.0, 21.0, 44.0, 46.0, 82.0, 83.0, 118.0, 125.0, 106.0, 79.0, 79.0, 50.0, 45.0, 17.0, 14.0, 12.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09496647119522095, -0.09070610255002975, -0.08644573390483856, -0.08218536525964737, -0.07792499661445618, -0.07366463541984558, -0.06940426677465439, -0.0651438981294632, -0.060883529484272, -0.05662316083908081, -0.05236279219388962, -0.048102427273988724, -0.04384205862879753, -0.03958168998360634, -0.035321325063705444, -0.03106095641851425, -0.02680058777332306, -0.022540219128131866, -0.018279852345585823, -0.014019484631717205, -0.009759116917848587, -0.005498748272657394, -0.001238381490111351, 0.0030219852924346924, 0.007282353937625885, 0.011542721651494503, 0.01580308936536312, 0.020063456147909164, 0.024323824793100357, 0.02858419343829155, 0.032844558358192444, 0.037104927003383636, 0.04136529564857483, 0.04562566429376602, 0.049886032938957214, 0.05414639785885811, 0.0584067665040493, 0.0626671314239502, 0.06692750006914139, 0.07118786871433258, 0.07544823735952377, 0.07970860600471497, 0.08396897464990616, 0.08822934329509735, 0.09248970448970795, 0.09675008058547974, 0.10101044178009033, 0.10527081042528152, 0.10953117907047272, 0.11379154771566391, 0.1180519163608551, 0.1223122850060463, 0.1265726536512375, 0.13083301484584808, 0.13509339094161987, 0.13935375213623047, 0.14361411333084106, 0.14787447452545166, 0.15213485062122345, 0.15639521181583405, 0.16065558791160583, 0.16491594910621643, 0.16917632520198822, 0.17343668639659882, 0.1776970624923706]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 3.0, 4.0, 3.0, 7.0, 7.0, 11.0, 12.0, 15.0, 20.0, 32.0, 36.0, 68.0, 103.0, 131.0, 219.0, 364.0, 719.0, 1394.0, 3265.0, 8669.0, 28501.0, 147383.0, 687477.0, 129846.0, 26105.0, 7989.0, 3097.0, 1374.0, 690.0, 358.0, 212.0, 141.0, 80.0, 47.0, 38.0, 33.0, 20.0, 13.0, 19.0, 13.0, 10.0, 2.0, 5.0, 2.0, 8.0, 1.0, 1.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00792694091796875, -0.00761568546295166, -0.00730443000793457, -0.0069931745529174805, -0.006681919097900391, -0.006370663642883301, -0.006059408187866211, -0.005748152732849121, -0.005436897277832031, -0.005125641822814941, -0.0048143863677978516, -0.004503130912780762, -0.004191875457763672, -0.003880620002746582, -0.003569364547729492, -0.0032581090927124023, -0.0029468536376953125, -0.0026355981826782227, -0.002324342727661133, -0.002013087272644043, -0.0017018318176269531, -0.0013905763626098633, -0.0010793209075927734, -0.0007680654525756836, -0.00045680999755859375, -0.0001455545425415039, 0.00016570091247558594, 0.0004769563674926758, 0.0007882118225097656, 0.0010994672775268555, 0.0014107227325439453, 0.0017219781875610352, 0.002033233642578125, 0.002344489097595215, 0.0026557445526123047, 0.0029670000076293945, 0.0032782554626464844, 0.0035895109176635742, 0.003900766372680664, 0.004212021827697754, 0.004523277282714844, 0.004834532737731934, 0.0051457881927490234, 0.005457043647766113, 0.005768299102783203, 0.006079554557800293, 0.006390810012817383, 0.006702065467834473, 0.0070133209228515625, 0.007324576377868652, 0.007635831832885742, 0.007947087287902832, 0.008258342742919922, 0.008569598197937012, 0.008880853652954102, 0.009192109107971191, 0.009503364562988281, 0.009814620018005371, 0.010125875473022461, 0.01043713092803955, 0.01074838638305664, 0.01105964183807373, 0.01137089729309082, 0.01168215274810791, 0.011993408203125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 9.0, 12.0, 21.0, 29.0, 42.0, 86.0, 135.0, 137.0, 142.0, 125.0, 87.0, 63.0, 38.0, 37.0, 27.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006771087646484375, -0.006403505802154541, -0.006035923957824707, -0.005668342113494873, -0.005300760269165039, -0.004933178424835205, -0.004565596580505371, -0.004198014736175537, -0.003830432891845703, -0.003462851047515869, -0.003095269203186035, -0.002727687358856201, -0.002360105514526367, -0.001992523670196533, -0.0016249418258666992, -0.0012573599815368652, -0.0008897781372070312, -0.0005221962928771973, -0.00015461444854736328, 0.0002129673957824707, 0.0005805492401123047, 0.0009481310844421387, 0.0013157129287719727, 0.0016832947731018066, 0.0020508766174316406, 0.0024184584617614746, 0.0027860403060913086, 0.0031536221504211426, 0.0035212039947509766, 0.0038887858390808105, 0.0042563676834106445, 0.0046239495277404785, 0.0049915313720703125, 0.0053591132164001465, 0.0057266950607299805, 0.0060942769050598145, 0.0064618587493896484, 0.006829440593719482, 0.007197022438049316, 0.00756460428237915, 0.007932186126708984, 0.008299767971038818, 0.008667349815368652, 0.009034931659698486, 0.00940251350402832, 0.009770095348358154, 0.010137677192687988, 0.010505259037017822, 0.010872840881347656, 0.01124042272567749, 0.011608004570007324, 0.011975586414337158, 0.012343168258666992, 0.012710750102996826, 0.01307833194732666, 0.013445913791656494, 0.013813495635986328, 0.014181077480316162, 0.014548659324645996, 0.01491624116897583, 0.015283823013305664, 0.015651404857635498, 0.016018986701965332, 0.016386568546295166, 0.016754150390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 6.0, 4.0, 5.0, 7.0, 12.0, 10.0, 16.0, 10.0, 18.0, 28.0, 36.0, 55.0, 72.0, 114.0, 174.0, 303.0, 557.0, 1200.0, 2994.0, 11970.0, 90059.0, 872751.0, 54890.0, 8494.0, 2533.0, 955.0, 509.0, 269.0, 153.0, 108.0, 66.0, 39.0, 25.0, 27.0, 21.0, 13.0, 11.0, 10.0, 8.0, 9.0, 0.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01068878173828125, -0.010348320007324219, -0.010007858276367188, -0.009667396545410156, -0.009326934814453125, -0.008986473083496094, -0.008646011352539062, -0.008305549621582031, -0.007965087890625, -0.007624626159667969, -0.0072841644287109375, -0.006943702697753906, -0.006603240966796875, -0.006262779235839844, -0.0059223175048828125, -0.005581855773925781, -0.00524139404296875, -0.004900932312011719, -0.0045604705810546875, -0.004220008850097656, -0.003879547119140625, -0.0035390853881835938, -0.0031986236572265625, -0.0028581619262695312, -0.0025177001953125, -0.0021772384643554688, -0.0018367767333984375, -0.0014963150024414062, -0.001155853271484375, -0.0008153915405273438, -0.0004749298095703125, -0.00013446807861328125, 0.00020599365234375, 0.0005464553833007812, 0.0008869171142578125, 0.0012273788452148438, 0.001567840576171875, 0.0019083023071289062, 0.0022487640380859375, 0.0025892257690429688, 0.0029296875, 0.0032701492309570312, 0.0036106109619140625, 0.003951072692871094, 0.004291534423828125, 0.004631996154785156, 0.0049724578857421875, 0.005312919616699219, 0.00565338134765625, 0.005993843078613281, 0.0063343048095703125, 0.006674766540527344, 0.007015228271484375, 0.007355690002441406, 0.0076961517333984375, 0.008036613464355469, 0.0083770751953125, 0.008717536926269531, 0.009057998657226562, 0.009398460388183594, 0.009738922119140625, 0.010079383850097656, 0.010419845581054688, 0.010760307312011719, 0.01110076904296875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 5.0, 1.0, 2.0, 7.0, 7.0, 6.0, 5.0, 6.0, 16.0, 11.0, 21.0, 19.0, 24.0, 28.0, 35.0, 55.0, 56.0, 69.0, 76.0, 86.0, 79.0, 62.0, 58.0, 40.0, 39.0, 40.0, 27.0, 24.0, 22.0, 13.0, 10.0, 13.0, 8.0, 5.0, 4.0, 6.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0196380615234375, -0.018996000289916992, -0.018353939056396484, -0.017711877822875977, -0.01706981658935547, -0.01642775535583496, -0.015785694122314453, -0.015143632888793945, -0.014501571655273438, -0.01385951042175293, -0.013217449188232422, -0.012575387954711914, -0.011933326721191406, -0.011291265487670898, -0.01064920425415039, -0.010007143020629883, -0.009365081787109375, -0.008723020553588867, -0.00808095932006836, -0.0074388980865478516, -0.006796836853027344, -0.006154775619506836, -0.005512714385986328, -0.00487065315246582, -0.0042285919189453125, -0.0035865306854248047, -0.002944469451904297, -0.002302408218383789, -0.0016603469848632812, -0.0010182857513427734, -0.0003762245178222656, 0.0002658367156982422, 0.00090789794921875, 0.0015499591827392578, 0.0021920204162597656, 0.0028340816497802734, 0.0034761428833007812, 0.004118204116821289, 0.004760265350341797, 0.005402326583862305, 0.0060443878173828125, 0.00668644905090332, 0.007328510284423828, 0.007970571517944336, 0.008612632751464844, 0.009254693984985352, 0.00989675521850586, 0.010538816452026367, 0.011180877685546875, 0.011822938919067383, 0.01246500015258789, 0.013107061386108398, 0.013749122619628906, 0.014391183853149414, 0.015033245086669922, 0.01567530632019043, 0.016317367553710938, 0.016959428787231445, 0.017601490020751953, 0.01824355125427246, 0.01888561248779297, 0.019527673721313477, 0.020169734954833984, 0.020811796188354492, 0.021453857421875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 9.0, 10.0, 7.0, 17.0, 25.0, 30.0, 62.0, 91.0, 191.0, 418.0, 1355.0, 6181.0, 137906.0, 889755.0, 9698.0, 1797.0, 500.0, 200.0, 96.0, 72.0, 40.0, 28.0, 24.0, 9.0, 6.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0046844482421875, -0.004538536071777344, -0.0043926239013671875, -0.004246711730957031, -0.004100799560546875, -0.003954887390136719, -0.0038089752197265625, -0.0036630630493164062, -0.00351715087890625, -0.0033712387084960938, -0.0032253265380859375, -0.0030794143676757812, -0.002933502197265625, -0.0027875900268554688, -0.0026416778564453125, -0.0024957656860351562, -0.002349853515625, -0.0022039413452148438, -0.0020580291748046875, -0.0019121170043945312, -0.001766204833984375, -0.0016202926635742188, -0.0014743804931640625, -0.0013284683227539062, -0.00118255615234375, -0.0010366439819335938, -0.0008907318115234375, -0.0007448196411132812, -0.000598907470703125, -0.00045299530029296875, -0.0003070831298828125, -0.00016117095947265625, -1.52587890625e-05, 0.00013065338134765625, 0.0002765655517578125, 0.00042247772216796875, 0.000568389892578125, 0.0007143020629882812, 0.0008602142333984375, 0.0010061264038085938, 0.00115203857421875, 0.0012979507446289062, 0.0014438629150390625, 0.0015897750854492188, 0.001735687255859375, 0.0018815994262695312, 0.0020275115966796875, 0.0021734237670898438, 0.0023193359375, 0.0024652481079101562, 0.0026111602783203125, 0.0027570724487304688, 0.002902984619140625, 0.0030488967895507812, 0.0031948089599609375, 0.0033407211303710938, 0.00348663330078125, 0.0036325454711914062, 0.0037784576416015625, 0.003924369812011719, 0.004070281982421875, 0.004216194152832031, 0.0043621063232421875, 0.004508018493652344, 0.0046539306640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 0.0, 4.0, 0.0, 7.0, 6.0, 7.0, 5.0, 7.0, 10.0, 13.0, 13.0, 11.0, 8.0, 24.0, 34.0, 37.0, 23.0, 47.0, 63.0, 41.0, 48.0, 33.0, 54.0, 94.0, 49.0, 33.0, 43.0, 31.0, 57.0, 34.0, 26.0, 17.0, 22.0, 22.0, 13.0, 13.0, 8.0, 9.0, 4.0, 6.0, 8.0, 5.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.410743713378906e-06, -4.279427230358124e-06, -4.148110747337341e-06, -4.016794264316559e-06, -3.885477781295776e-06, -3.754161298274994e-06, -3.6228448152542114e-06, -3.491528332233429e-06, -3.3602118492126465e-06, -3.228895366191864e-06, -3.0975788831710815e-06, -2.966262400150299e-06, -2.8349459171295166e-06, -2.703629434108734e-06, -2.5723129510879517e-06, -2.440996468067169e-06, -2.3096799850463867e-06, -2.1783635020256042e-06, -2.0470470190048218e-06, -1.9157305359840393e-06, -1.7844140529632568e-06, -1.6530975699424744e-06, -1.521781086921692e-06, -1.3904646039009094e-06, -1.259148120880127e-06, -1.1278316378593445e-06, -9.96515154838562e-07, -8.651986718177795e-07, -7.338821887969971e-07, -6.025657057762146e-07, -4.7124922275543213e-07, -3.3993273973464966e-07, -2.086162567138672e-07, -7.729977369308472e-08, 5.4016709327697754e-08, 1.8533319234848022e-07, 3.166496753692627e-07, 4.4796615839004517e-07, 5.792826414108276e-07, 7.105991244316101e-07, 8.419156074523926e-07, 9.73232090473175e-07, 1.1045485734939575e-06, 1.23586505651474e-06, 1.3671815395355225e-06, 1.498498022556305e-06, 1.6298145055770874e-06, 1.7611309885978699e-06, 1.8924474716186523e-06, 2.023763954639435e-06, 2.1550804376602173e-06, 2.2863969206809998e-06, 2.4177134037017822e-06, 2.5490298867225647e-06, 2.680346369743347e-06, 2.8116628527641296e-06, 2.942979335784912e-06, 3.0742958188056946e-06, 3.205612301826477e-06, 3.3369287848472595e-06, 3.468245267868042e-06, 3.5995617508888245e-06, 3.730878233909607e-06, 3.862194716930389e-06, 3.993511199951172e-06]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 7.0, 5.0, 13.0, 28.0, 47.0, 77.0, 89.0, 229.0, 357.0, 766.0, 1780.0, 5255.0, 22479.0, 733054.0, 256106.0, 20073.0, 4969.0, 1694.0, 728.0, 338.0, 173.0, 93.0, 58.0, 43.0, 21.0, 17.0, 16.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014171600341796875, -0.0013682395219802856, -0.0013193190097808838, -0.001270398497581482, -0.00122147798538208, -0.0011725574731826782, -0.0011236369609832764, -0.0010747164487838745, -0.0010257959365844727, -0.0009768754243850708, -0.0009279549121856689, -0.0008790343999862671, -0.0008301138877868652, -0.0007811933755874634, -0.0007322728633880615, -0.0006833523511886597, -0.0006344318389892578, -0.000585511326789856, -0.0005365908145904541, -0.00048767030239105225, -0.0004387497901916504, -0.00038982927799224854, -0.0003409087657928467, -0.0002919882535934448, -0.00024306774139404297, -0.0001941472291946411, -0.00014522671699523926, -9.63062047958374e-05, -4.738569259643555e-05, 1.5348196029663086e-06, 5.0455331802368164e-05, 9.937584400177002e-05, 0.00014829635620117188, 0.00019721686840057373, 0.0002461373805999756, 0.00029505789279937744, 0.0003439784049987793, 0.00039289891719818115, 0.000441819429397583, 0.0004907399415969849, 0.0005396604537963867, 0.0005885809659957886, 0.0006375014781951904, 0.0006864219903945923, 0.0007353425025939941, 0.000784263014793396, 0.0008331835269927979, 0.0008821040391921997, 0.0009310245513916016, 0.0009799450635910034, 0.0010288655757904053, 0.0010777860879898071, 0.001126706600189209, 0.0011756271123886108, 0.0012245476245880127, 0.0012734681367874146, 0.0013223886489868164, 0.0013713091611862183, 0.0014202296733856201, 0.001469150185585022, 0.0015180706977844238, 0.0015669912099838257, 0.0016159117221832275, 0.0016648322343826294, 0.0017137527465820312]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 9.0, 21.0, 14.0, 19.0, 45.0, 50.0, 118.0, 151.0, 175.0, 130.0, 101.0, 54.0, 36.0, 21.0, 10.0, 10.0, 17.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002475738525390625, -0.002370178699493408, -0.0022646188735961914, -0.0021590590476989746, -0.002053499221801758, -0.001947939395904541, -0.0018423795700073242, -0.0017368197441101074, -0.0016312599182128906, -0.0015257000923156738, -0.001420140266418457, -0.0013145804405212402, -0.0012090206146240234, -0.0011034607887268066, -0.0009979009628295898, -0.000892341136932373, -0.0007867813110351562, -0.0006812214851379395, -0.0005756616592407227, -0.00047010183334350586, -0.00036454200744628906, -0.00025898218154907227, -0.00015342235565185547, -4.786252975463867e-05, 5.7697296142578125e-05, 0.00016325712203979492, 0.0002688169479370117, 0.0003743767738342285, 0.0004799365997314453, 0.0005854964256286621, 0.0006910562515258789, 0.0007966160774230957, 0.0009021759033203125, 0.0010077357292175293, 0.001113295555114746, 0.0012188553810119629, 0.0013244152069091797, 0.0014299750328063965, 0.0015355348587036133, 0.00164109468460083, 0.0017466545104980469, 0.0018522143363952637, 0.0019577741622924805, 0.0020633339881896973, 0.002168893814086914, 0.002274453639984131, 0.0023800134658813477, 0.0024855732917785645, 0.0025911331176757812, 0.002696692943572998, 0.002802252769470215, 0.0029078125953674316, 0.0030133724212646484, 0.0031189322471618652, 0.003224492073059082, 0.003330051898956299, 0.0034356117248535156, 0.0035411715507507324, 0.0036467313766479492, 0.003752291202545166, 0.003857851028442383, 0.0039634108543396, 0.004068970680236816, 0.004174530506134033, 0.00428009033203125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 11.0, 10.0, 20.0, 50.0, 130.0, 588.0, 127.0, 47.0, 10.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.17189592123031616, -0.16756770014762878, -0.1632394641637802, -0.15891124308109283, -0.15458300709724426, -0.15025478601455688, -0.1459265649318695, -0.14159832894802094, -0.13727010786533356, -0.13294188678264618, -0.1286136507987976, -0.12428542971611023, -0.11995720118284225, -0.11562897264957428, -0.1113007515668869, -0.10697252303361893, -0.10264429450035095, -0.09831606596708298, -0.093987837433815, -0.08965961635112762, -0.08533138781785965, -0.08100315928459167, -0.0766749382019043, -0.07234670966863632, -0.06801848113536835, -0.06369025260210037, -0.059362027794122696, -0.05503380298614502, -0.050705574452877045, -0.04637734591960907, -0.04204912111163139, -0.03772089630365372, -0.033392660319805145, -0.02906443364918232, -0.024736206978559494, -0.02040798030793667, -0.016079753637313843, -0.011751526966691017, -0.0074233002960681915, -0.003095073625445366, 0.0012331530451774597, 0.005561379715800285, 0.009889606386423111, 0.014217833057045937, 0.018546059727668762, 0.022874286398291588, 0.027202513068914413, 0.03153073787689209, 0.035858966410160065, 0.04018719494342804, 0.044515419751405716, 0.04884364455938339, 0.05317187309265137, 0.05750010162591934, 0.06182832643389702, 0.0661565512418747, 0.07048477977514267, 0.07481300830841064, 0.07914122939109802, 0.083469457924366, 0.08779768645763397, 0.09212591499090195, 0.09645414352416992, 0.1007823646068573, 0.10511059314012527]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 9.0, 4.0, 6.0, 12.0, 17.0, 24.0, 26.0, 27.0, 26.0, 29.0, 44.0, 123.0, 300.0, 112.0, 38.0, 32.0, 25.0, 23.0, 22.0, 23.0, 14.0, 12.0, 9.0, 10.0, 4.0, 5.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07029181718826294, -0.06805931776762009, -0.06582681089639664, -0.06359431147575378, -0.06136180832982063, -0.05912930518388748, -0.05689680576324463, -0.05466430261731148, -0.052431799471378326, -0.050199296325445175, -0.047966793179512024, -0.04573429375886917, -0.04350179061293602, -0.04126928746700287, -0.039036788046360016, -0.036804284900426865, -0.03457178175449371, -0.03233927860856056, -0.03010677732527256, -0.027874276041984558, -0.025641772896051407, -0.023409269750118256, -0.021176768466830254, -0.01894426718354225, -0.0167117640376091, -0.014479261822998524, -0.012246759608387947, -0.01001425739377737, -0.007781755179166794, -0.005549252964556217, -0.0033167507499456406, -0.0010842494666576385, 0.0011482536792755127, 0.0033807558938860893, 0.005613258108496666, 0.007845760323107243, 0.01007826253771782, 0.012310764752328396, 0.014543266966938972, 0.016775768250226974, 0.019008271396160126, 0.021240774542093277, 0.02347327582538128, 0.02570577710866928, 0.027938280254602432, 0.030170783400535583, 0.032403282821178436, 0.03463578596711159, 0.03686828911304474, 0.03910079225897789, 0.04133329540491104, 0.043565794825553894, 0.045798297971487045, 0.0480308011174202, 0.05026330053806305, 0.0524958036839962, 0.05472830682992935, 0.0569608099758625, 0.059193313121795654, 0.06142581254243851, 0.06365831196308136, 0.06589081883430481, 0.06812331825494766, 0.07035581767559052, 0.07258832454681396]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 2.0, 3.0, 4.0, 7.0, 5.0, 10.0, 2.0, 6.0, 11.0, 20.0, 11.0, 16.0, 16.0, 23.0, 24.0, 44.0, 56.0, 117.0, 280.0, 92.0, 41.0, 47.0, 31.0, 29.0, 29.0, 16.0, 14.0, 7.0, 7.0, 9.0, 8.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00418853759765625, -0.004035472869873047, -0.0038824081420898438, -0.0037293434143066406, -0.0035762786865234375, -0.0034232139587402344, -0.0032701492309570312, -0.003117084503173828, -0.002964019775390625, -0.002810955047607422, -0.0026578903198242188, -0.0025048255920410156, -0.0023517608642578125, -0.0021986961364746094, -0.0020456314086914062, -0.0018925666809082031, -0.001739501953125, -0.0015864372253417969, -0.0014333724975585938, -0.0012803077697753906, -0.0011272430419921875, -0.0009741783142089844, -0.0008211135864257812, -0.0006680488586425781, -0.000514984130859375, -0.0003619194030761719, -0.00020885467529296875, -5.5789947509765625e-05, 9.72747802734375e-05, 0.0002503395080566406, 0.00040340423583984375, 0.0005564689636230469, 0.00070953369140625, 0.0008625984191894531, 0.0010156631469726562, 0.0011687278747558594, 0.0013217926025390625, 0.0014748573303222656, 0.0016279220581054688, 0.0017809867858886719, 0.001934051513671875, 0.002087116241455078, 0.0022401809692382812, 0.0023932456970214844, 0.0025463104248046875, 0.0026993751525878906, 0.0028524398803710938, 0.003005504608154297, 0.0031585693359375, 0.003311634063720703, 0.0034646987915039062, 0.0036177635192871094, 0.0037708282470703125, 0.003923892974853516, 0.004076957702636719, 0.004230022430419922, 0.004383087158203125, 0.004536151885986328, 0.004689216613769531, 0.004842281341552734, 0.0049953460693359375, 0.005148410797119141, 0.005301475524902344, 0.005454540252685547, 0.00560760498046875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 4.0, 20.0, 11.0, 5.0, 15.0, 36.0, 31.0, 44.0, 100.0, 252.0, 844.0, 7848.0, 8369648.0, 8293.0, 921.0, 238.0, 92.0, 76.0, 31.0, 13.0, 13.0, 14.0, 2.0, 6.0, 2.0, 3.0, 2.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.05763475224375725, -0.05601182579994202, -0.05438889563083649, -0.052765969187021255, -0.051143042743206024, -0.049520112574100494, -0.04789718613028526, -0.04627425968647003, -0.0446513332426548, -0.04302840679883957, -0.04140547662973404, -0.03978255018591881, -0.03815962374210358, -0.03653669357299805, -0.034913767129182816, -0.033290840685367584, -0.031667910516262054, -0.030044982209801674, -0.028422055765986443, -0.026799127459526062, -0.02517620101571083, -0.02355327270925045, -0.02193034440279007, -0.020307417958974838, -0.018684491515159607, -0.017061563208699226, -0.015438636764883995, -0.013815708458423615, -0.012192782014608383, -0.010569853708148003, -0.008946926333010197, -0.007323998957872391, -0.005701072514057159, -0.0040781451389193535, -0.002455217530950904, -0.0008322899229824543, 0.0007906374521553516, 0.002413565292954445, 0.004036492668092251, 0.005659420043230057, 0.007282347418367863, 0.008905274793505669, 0.010528202168643475, 0.01215112954378128, 0.013774057850241661, 0.015396985225379467, 0.017019912600517273, 0.018642839044332504, 0.020265767350792885, 0.021888695657253265, 0.023511622101068497, 0.025134550407528877, 0.02675747685134411, 0.02838040515780449, 0.03000333160161972, 0.03162626177072525, 0.03324918821454048, 0.03487211465835571, 0.03649504482746124, 0.038117971271276474, 0.039740897715091705, 0.041363827884197235, 0.042986754328012466, 0.0446096807718277, 0.04623260721564293]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 7.0, 2.0, 2.0, 4.0, 2.0, 9.0, 4.0, 7.0, 5.0, 8.0, 1.0, 5.0, 2.0, 4.0, 8.0, 2.0, 4.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023277707397937775, -0.022740105167031288, -0.0222025029361248, -0.021664900705218315, -0.02112729847431183, -0.020589694380760193, -0.020052092149853706, -0.01951448991894722, -0.018976887688040733, -0.018439285457134247, -0.01790168322622776, -0.017364080995321274, -0.016826476901769638, -0.01628887467086315, -0.015751272439956665, -0.015213670209050179, -0.014676067978143692, -0.014138465747237206, -0.013600863516330719, -0.013063260354101658, -0.012525658123195171, -0.011988055892288685, -0.011450452730059624, -0.010912850499153137, -0.01037524826824665, -0.009837646037340164, -0.009300043806433678, -0.008762440644204617, -0.00822483841329813, -0.0076872361823916435, -0.00714963348582387, -0.006612030789256096, -0.00607442669570446, -0.005536824464797974, -0.0049992217682302, -0.004461619071662426, -0.0039240168407559395, -0.0033864143770188093, -0.002848811913281679, -0.002311209449544549, -0.0017736069858074188, -0.0012360045220702887, -0.0006984020583331585, -0.00016079959459602833, 0.00037680286914110184, 0.000914405332878232, 0.0014520077966153622, 0.0019896102603524923, 0.0025272127240896225, 0.0030648151878267527, 0.003602417651563883, 0.004140020348131657, 0.004677622579038143, 0.00521522480994463, 0.0057528275065124035, 0.006290430203080177, 0.006828032433986664, 0.00736563466489315, 0.007903236895799637, 0.008440840058028698, 0.008978442288935184, 0.009516044519841671, 0.010053647682070732, 0.010591249912977219, 0.011128852143883705]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 2.0, 5.0, 9.0, 6.0, 21.0, 14.0, 36.0, 52.0, 96.0, 170.0, 224.0, 389.0, 819.0, 1722.0, 4031.0, 10191.0, 30030.0, 100196.0, 221675.0, 105560.0, 31341.0, 10403.0, 3885.0, 1545.0, 754.0, 375.0, 204.0, 162.0, 90.0, 60.0, 46.0, 38.0, 22.0, 17.0, 17.0, 14.0, 6.0, 9.0, 6.0, 4.0, 2.0, 7.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.0206298828125, -0.01995372772216797, -0.019277572631835938, -0.018601417541503906, -0.017925262451171875, -0.017249107360839844, -0.016572952270507812, -0.01589679718017578, -0.01522064208984375, -0.014544486999511719, -0.013868331909179688, -0.013192176818847656, -0.012516021728515625, -0.011839866638183594, -0.011163711547851562, -0.010487556457519531, -0.0098114013671875, -0.009135246276855469, -0.008459091186523438, -0.007782936096191406, -0.007106781005859375, -0.006430625915527344, -0.0057544708251953125, -0.005078315734863281, -0.00440216064453125, -0.0037260055541992188, -0.0030498504638671875, -0.0023736953735351562, -0.001697540283203125, -0.0010213851928710938, -0.0003452301025390625, 0.00033092498779296875, 0.001007080078125, 0.0016832351684570312, 0.0023593902587890625, 0.0030355453491210938, 0.003711700439453125, 0.004387855529785156, 0.0050640106201171875, 0.005740165710449219, 0.00641632080078125, 0.007092475891113281, 0.0077686309814453125, 0.008444786071777344, 0.009120941162109375, 0.009797096252441406, 0.010473251342773438, 0.011149406433105469, 0.0118255615234375, 0.012501716613769531, 0.013177871704101562, 0.013854026794433594, 0.014530181884765625, 0.015206336975097656, 0.015882492065429688, 0.01655864715576172, 0.01723480224609375, 0.01791095733642578, 0.018587112426757812, 0.019263267517089844, 0.019939422607421875, 0.020615577697753906, 0.021291732788085938, 0.02196788787841797, 0.02264404296875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 7.0, 7.0, 10.0, 38.0, 50.0, 87.0, 101.0, 161.0, 162.0, 159.0, 83.0, 61.0, 33.0, 23.0, 13.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006114959716796875, -0.005738317966461182, -0.005361676216125488, -0.004985034465789795, -0.0046083927154541016, -0.004231750965118408, -0.003855109214782715, -0.0034784674644470215, -0.003101825714111328, -0.0027251839637756348, -0.0023485422134399414, -0.001971900463104248, -0.0015952587127685547, -0.0012186169624328613, -0.000841975212097168, -0.0004653334617614746, -8.869171142578125e-05, 0.0002879500389099121, 0.0006645917892456055, 0.0010412335395812988, 0.0014178752899169922, 0.0017945170402526855, 0.002171158790588379, 0.0025478005409240723, 0.0029244422912597656, 0.003301084041595459, 0.0036777257919311523, 0.004054367542266846, 0.004431009292602539, 0.004807651042938232, 0.005184292793273926, 0.005560934543609619, 0.0059375762939453125, 0.006314218044281006, 0.006690859794616699, 0.007067501544952393, 0.007444143295288086, 0.00782078504562378, 0.008197426795959473, 0.008574068546295166, 0.00895071029663086, 0.009327352046966553, 0.009703993797302246, 0.01008063554763794, 0.010457277297973633, 0.010833919048309326, 0.01121056079864502, 0.011587202548980713, 0.011963844299316406, 0.0123404860496521, 0.012717127799987793, 0.013093769550323486, 0.01347041130065918, 0.013847053050994873, 0.014223694801330566, 0.01460033655166626, 0.014976978302001953, 0.015353620052337646, 0.01573026180267334, 0.016106903553009033, 0.016483545303344727, 0.01686018705368042, 0.017236828804016113, 0.017613470554351807, 0.0179901123046875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 5.0, 9.0, 6.0, 3.0, 15.0, 29.0, 126.0, 151.0, 75.0, 28.0, 9.0, 8.0, 8.0, 3.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03378673642873764, -0.03251172974705696, -0.031236721202731133, -0.029961712658405304, -0.028686705976724625, -0.027411699295043945, -0.026136690750718117, -0.024861682206392288, -0.02358667552471161, -0.02231166884303093, -0.0210366602987051, -0.019761651754379272, -0.018486645072698593, -0.017211638391017914, -0.015936629846692085, -0.014661622233688831, -0.013386614620685577, -0.012111607007682323, -0.01083659939467907, -0.009561591781675816, -0.008286584168672562, -0.007011576555669308, -0.005736568942666054, -0.0044615613296628, -0.003186553716659546, -0.001911546103656292, -0.000636538490653038, 0.0006384691223502159, 0.0019134767353534698, 0.003188484348356724, 0.004463491961359978, 0.005738499574363232, 0.007013507187366486, 0.00828851480036974, 0.009563522413372993, 0.010838530026376247, 0.012113537639379501, 0.013388545252382755, 0.01466355286538601, 0.015938561409711838, 0.017213568091392517, 0.018488574773073196, 0.019763583317399025, 0.021038591861724854, 0.022313598543405533, 0.023588605225086212, 0.02486361376941204, 0.02613862231373787, 0.02741362899541855, 0.028688635677099228, 0.029963644221425056, 0.031238652765750885, 0.032513659447431564, 0.033788666129112244, 0.03506367653608322, 0.0363386832177639, 0.03761368989944458, 0.03888869658112526, 0.04016370326280594, 0.041438713669776917, 0.042713720351457596, 0.043988727033138275, 0.04526373744010925, 0.04653874412178993, 0.04781375080347061]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 1.0, 2.0, 6.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 8.0, 12.0, 45.0, 106.0, 98.0, 80.0, 35.0, 14.0, 10.0, 4.0, 10.0, 7.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.031161367893218994, -0.030129114165902138, -0.02909686043858528, -0.028064606711268425, -0.02703235298395157, -0.026000099256634712, -0.024967845529317856, -0.023935591802001, -0.022903338074684143, -0.021871084347367287, -0.02083883062005043, -0.019806576892733574, -0.018774323165416718, -0.01774206943809986, -0.016709815710783005, -0.01567756198346615, -0.014645308256149292, -0.013613054528832436, -0.01258080080151558, -0.011548547074198723, -0.010516293346881866, -0.00948403961956501, -0.008451785892248154, -0.007419532164931297, -0.006387278437614441, -0.0053550247102975845, -0.004322770982980728, -0.0032905172556638718, -0.0022582635283470154, -0.001226009801030159, -0.0001937560737133026, 0.0008384976536035538, 0.0018707513809204102, 0.0029030051082372665, 0.003935258835554123, 0.004967512562870979, 0.005999766290187836, 0.007032020017504692, 0.008064273744821548, 0.009096527472138405, 0.010128781199455261, 0.011161034926772118, 0.012193288654088974, 0.01322554238140583, 0.014257796108722687, 0.015290049836039543, 0.0163223035633564, 0.017354557290673256, 0.018386811017990112, 0.01941906474530697, 0.020451318472623825, 0.02148357219994068, 0.022515825927257538, 0.023548079654574394, 0.02458033338189125, 0.025612587109208107, 0.026644840836524963, 0.02767709456384182, 0.028709348291158676, 0.029741602018475533, 0.03077385574579239, 0.031806111335754395, 0.0328383632004261, 0.03387061506509781, 0.034902870655059814]}, "eval/loss": 4.547459125518799, "eval/wer": 2.4429393097976995, "eval/runtime": 930.4687, "eval/samples_per_second": 2.839, "eval/steps_per_second": 0.238, "train/train_runtime": 6725.1387, "train/train_samples_per_second": 4.243, "train/train_steps_per_second": 0.177, "train/total_flos": 0.0, "train/train_loss": 4.647471772210753, "_wandb": {"runtime": 8138}} \ No newline at end of file