diff --git "a/wandb/run-20220302_114207-c11kvzxa/files/wandb-summary.json" "b/wandb/run-20220302_114207-c11kvzxa/files/wandb-summary.json" --- "a/wandb/run-20220302_114207-c11kvzxa/files/wandb-summary.json" +++ "b/wandb/run-20220302_114207-c11kvzxa/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 3.9886, "train/learning_rate": 1.5306122448979589e-06, "train/epoch": 1.0, "train/global_step": 892, "_runtime": 6254, "_timestamp": 1646227581, "_step": 893, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 4.0, 15.0, 91.0, 568.0, 276.0, 52.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.2979507446289, -57.26783752441406, -42.23772430419922, -27.20760726928711, -12.177494049072266, 2.8526229858398438, 17.882736206054688, 32.91284942626953, 47.942962646484375, 62.97307586669922, 78.00318908691406, 93.03330993652344, 108.06341552734375, 123.09353637695312, 138.1236572265625, 153.1537628173828, 168.18386840820312, 183.2139892578125, 198.2440948486328, 213.2742156982422, 228.3043212890625, 243.33444213867188, 258.36456298828125, 273.3946533203125, 288.4248046875, 303.4549255371094, 318.48504638671875, 333.51513671875, 348.5452575683594, 363.57537841796875, 378.6054992675781, 393.6356201171875, 408.6656799316406, 423.69580078125, 438.7259216308594, 453.7560119628906, 468.7861328125, 483.8162536621094, 498.84637451171875, 513.87646484375, 528.9066162109375, 543.9367065429688, 558.9668579101562, 573.9969482421875, 589.027099609375, 604.0571899414062, 619.0872802734375, 634.117431640625, 649.1475219726562, 664.1776123046875, 679.207763671875, 694.2378540039062, 709.2680053710938, 724.298095703125, 739.3281860351562, 754.3583374023438, 769.388427734375, 784.4185180664062, 799.4486694335938, 814.478759765625, 829.5089111328125, 844.5390014648438, 859.569091796875, 874.5992431640625, 889.6293334960938]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 6.0, 7.0, 11.0, 9.0, 13.0, 8.0, 12.0, 14.0, 11.0, 21.0, 29.0, 24.0, 17.0, 27.0, 32.0, 42.0, 41.0, 35.0, 69.0, 50.0, 54.0, 33.0, 43.0, 40.0, 34.0, 33.0, 37.0, 44.0, 17.0, 16.0, 17.0, 22.0, 23.0, 20.0, 12.0, 13.0, 9.0, 12.0, 11.0, 7.0, 7.0, 3.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0], "bins": [-187.4065704345703, -181.70559692382812, -176.00462341308594, -170.3036346435547, -164.6026611328125, -158.9016876220703, -153.20071411132812, -147.49972534179688, -141.7987518310547, -136.0977783203125, -130.3968048095703, -124.6958236694336, -118.99484252929688, -113.29386901855469, -107.5928955078125, -101.89191436767578, -96.1909408569336, -90.4899673461914, -84.78898620605469, -79.0880126953125, -73.38703155517578, -67.6860580444336, -61.98508071899414, -56.28410339355469, -50.583126068115234, -44.88214874267578, -39.18117141723633, -33.480194091796875, -27.779218673706055, -22.0782413482666, -16.37726593017578, -10.676288604736328, -4.975311279296875, 0.7256655693054199, 6.426642417907715, 12.127618789672852, 17.828596115112305, 23.529573440551758, 29.230548858642578, 34.93152618408203, 40.632503509521484, 46.33348083496094, 52.03445816040039, 57.735435485839844, 63.43640899658203, 69.13739013671875, 74.83836364746094, 80.53933715820312, 86.24031829833984, 91.94129180908203, 97.64227294921875, 103.34324645996094, 109.04422760009766, 114.74520111083984, 120.44618225097656, 126.14715576171875, 131.84812927246094, 137.54910278320312, 143.2500762939453, 148.95106506347656, 154.65203857421875, 160.35301208496094, 166.05398559570312, 171.75497436523438, 177.45594787597656]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 10.0, 4.0, 6.0, 9.0, 17.0, 11.0, 17.0, 11.0, 8.0, 17.0, 17.0, 17.0, 22.0, 21.0, 39.0, 37.0, 37.0, 35.0, 45.0, 41.0, 44.0, 35.0, 36.0, 53.0, 30.0, 37.0, 40.0, 27.0, 28.0, 31.0, 37.0, 21.0, 20.0, 20.0, 12.0, 14.0, 16.0, 14.0, 13.0, 6.0, 9.0, 4.0, 2.0, 11.0, 3.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.8203125, -2.726715087890625, -2.63311767578125, -2.539520263671875, -2.4459228515625, -2.352325439453125, -2.25872802734375, -2.165130615234375, -2.071533203125, -1.977935791015625, -1.88433837890625, -1.790740966796875, -1.6971435546875, -1.603546142578125, -1.50994873046875, -1.416351318359375, -1.32275390625, -1.229156494140625, -1.13555908203125, -1.041961669921875, -0.9483642578125, -0.854766845703125, -0.76116943359375, -0.667572021484375, -0.573974609375, -0.480377197265625, -0.38677978515625, -0.293182373046875, -0.1995849609375, -0.105987548828125, -0.01239013671875, 0.081207275390625, 0.1748046875, 0.268402099609375, 0.36199951171875, 0.455596923828125, 0.5491943359375, 0.642791748046875, 0.73638916015625, 0.829986572265625, 0.923583984375, 1.017181396484375, 1.11077880859375, 1.204376220703125, 1.2979736328125, 1.391571044921875, 1.48516845703125, 1.578765869140625, 1.67236328125, 1.765960693359375, 1.85955810546875, 1.953155517578125, 2.0467529296875, 2.140350341796875, 2.23394775390625, 2.327545166015625, 2.421142578125, 2.514739990234375, 2.60833740234375, 2.701934814453125, 2.7955322265625, 2.889129638671875, 2.98272705078125, 3.076324462890625, 3.169921875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 6.0, 8.0, 8.0, 12.0, 9.0, 14.0, 17.0, 22.0, 32.0, 43.0, 66.0, 68.0, 99.0, 132.0, 171.0, 248.0, 312.0, 466.0, 683.0, 1046.0, 1649.0, 2886.0, 5272.0, 10830.0, 25433.0, 75018.0, 590166.0, 3261944.0, 143562.0, 40160.0, 15802.0, 7394.0, 3940.0, 2196.0, 1401.0, 849.0, 662.0, 447.0, 294.0, 227.0, 149.0, 118.0, 105.0, 77.0, 48.0, 37.0, 36.0, 31.0, 16.0, 24.0, 14.0, 16.0, 8.0, 8.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 5.0], "bins": [-30.125, -29.12841796875, -28.1318359375, -27.13525390625, -26.138671875, -25.14208984375, -24.1455078125, -23.14892578125, -22.15234375, -21.15576171875, -20.1591796875, -19.16259765625, -18.166015625, -17.16943359375, -16.1728515625, -15.17626953125, -14.1796875, -13.18310546875, -12.1865234375, -11.18994140625, -10.193359375, -9.19677734375, -8.2001953125, -7.20361328125, -6.20703125, -5.21044921875, -4.2138671875, -3.21728515625, -2.220703125, -1.22412109375, -0.2275390625, 0.76904296875, 1.765625, 2.76220703125, 3.7587890625, 4.75537109375, 5.751953125, 6.74853515625, 7.7451171875, 8.74169921875, 9.73828125, 10.73486328125, 11.7314453125, 12.72802734375, 13.724609375, 14.72119140625, 15.7177734375, 16.71435546875, 17.7109375, 18.70751953125, 19.7041015625, 20.70068359375, 21.697265625, 22.69384765625, 23.6904296875, 24.68701171875, 25.68359375, 26.68017578125, 27.6767578125, 28.67333984375, 29.669921875, 30.66650390625, 31.6630859375, 32.65966796875, 33.65625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 9.0, 6.0, 16.0, 15.0, 16.0, 28.0, 48.0, 48.0, 78.0, 105.0, 139.0, 186.0, 281.0, 453.0, 722.0, 656.0, 386.0, 244.0, 162.0, 107.0, 98.0, 65.0, 65.0, 48.0, 25.0, 14.0, 17.0, 10.0, 13.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.25, -19.572021484375, -18.89404296875, -18.216064453125, -17.5380859375, -16.860107421875, -16.18212890625, -15.504150390625, -14.826171875, -14.148193359375, -13.47021484375, -12.792236328125, -12.1142578125, -11.436279296875, -10.75830078125, -10.080322265625, -9.40234375, -8.724365234375, -8.04638671875, -7.368408203125, -6.6904296875, -6.012451171875, -5.33447265625, -4.656494140625, -3.978515625, -3.300537109375, -2.62255859375, -1.944580078125, -1.2666015625, -0.588623046875, 0.08935546875, 0.767333984375, 1.4453125, 2.123291015625, 2.80126953125, 3.479248046875, 4.1572265625, 4.835205078125, 5.51318359375, 6.191162109375, 6.869140625, 7.547119140625, 8.22509765625, 8.903076171875, 9.5810546875, 10.259033203125, 10.93701171875, 11.614990234375, 12.29296875, 12.970947265625, 13.64892578125, 14.326904296875, 15.0048828125, 15.682861328125, 16.36083984375, 17.038818359375, 17.716796875, 18.394775390625, 19.07275390625, 19.750732421875, 20.4287109375, 21.106689453125, 21.78466796875, 22.462646484375, 23.140625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 7.0, 11.0, 13.0, 23.0, 30.0, 35.0, 48.0, 64.0, 93.0, 157.0, 237.0, 358.0, 670.0, 1683.0, 5761.0, 30858.0, 307033.0, 3546984.0, 263835.0, 27888.0, 5292.0, 1521.0, 598.0, 341.0, 235.0, 168.0, 96.0, 63.0, 52.0, 38.0, 32.0, 14.0, 12.0, 10.0, 8.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-55.03125, -53.28271484375, -51.5341796875, -49.78564453125, -48.037109375, -46.28857421875, -44.5400390625, -42.79150390625, -41.04296875, -39.29443359375, -37.5458984375, -35.79736328125, -34.048828125, -32.30029296875, -30.5517578125, -28.80322265625, -27.0546875, -25.30615234375, -23.5576171875, -21.80908203125, -20.060546875, -18.31201171875, -16.5634765625, -14.81494140625, -13.06640625, -11.31787109375, -9.5693359375, -7.82080078125, -6.072265625, -4.32373046875, -2.5751953125, -0.82666015625, 0.921875, 2.67041015625, 4.4189453125, 6.16748046875, 7.916015625, 9.66455078125, 11.4130859375, 13.16162109375, 14.91015625, 16.65869140625, 18.4072265625, 20.15576171875, 21.904296875, 23.65283203125, 25.4013671875, 27.14990234375, 28.8984375, 30.64697265625, 32.3955078125, 34.14404296875, 35.892578125, 37.64111328125, 39.3896484375, 41.13818359375, 42.88671875, 44.63525390625, 46.3837890625, 48.13232421875, 49.880859375, 51.62939453125, 53.3779296875, 55.12646484375, 56.875]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 14.0, 105.0, 385.0, 399.0, 89.0, 13.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-215.84393310546875, -206.4600830078125, -197.07623291015625, -187.69239807128906, -178.3085479736328, -168.92469787597656, -159.54086303710938, -150.15701293945312, -140.77316284179688, -131.38931274414062, -122.0054702758789, -112.62162780761719, -103.23777770996094, -93.85392761230469, -84.47008514404297, -75.08624267578125, -65.702392578125, -56.318546295166016, -46.93470001220703, -37.55085372924805, -28.167007446289062, -18.783161163330078, -9.399314880371094, -0.015472412109375, 9.368377685546875, 18.75222396850586, 28.136070251464844, 37.51991653442383, 46.90376281738281, 56.2876091003418, 65.67145538330078, 75.0552978515625, 84.43914794921875, 93.822998046875, 103.20684051513672, 112.59068298339844, 121.97453308105469, 131.35838317871094, 140.74221801757812, 150.12606811523438, 159.50991821289062, 168.89376831054688, 178.27761840820312, 187.6614532470703, 197.04530334472656, 206.4291534423828, 215.81298828125, 225.19683837890625, 234.5806884765625, 243.96453857421875, 253.348388671875, 262.73223876953125, 272.1160888671875, 281.4999084472656, 290.8837585449219, 300.2676086425781, 309.6514587402344, 319.0353088378906, 328.4191589355469, 337.8030090332031, 347.18682861328125, 356.5706787109375, 365.95452880859375, 375.33837890625, 384.72222900390625]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 2.0, 7.0, 5.0, 8.0, 12.0, 14.0, 10.0, 20.0, 23.0, 21.0, 22.0, 18.0, 32.0, 22.0, 22.0, 30.0, 43.0, 42.0, 39.0, 37.0, 31.0, 35.0, 31.0, 38.0, 38.0, 33.0, 32.0, 28.0, 32.0, 26.0, 19.0, 37.0, 20.0, 25.0, 10.0, 15.0, 17.0, 16.0, 17.0, 9.0, 10.0, 13.0, 8.0, 7.0, 2.0, 5.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-61.95584487915039, -60.02712631225586, -58.098411560058594, -56.16969299316406, -54.24097442626953, -52.312255859375, -50.38353729248047, -48.4548225402832, -46.52610397338867, -44.59738540649414, -42.668670654296875, -40.739952087402344, -38.81123352050781, -36.88251495361328, -34.95379638671875, -33.025081634521484, -31.096363067626953, -29.167644500732422, -27.238927841186523, -25.310211181640625, -23.381492614746094, -21.452774047851562, -19.524057388305664, -17.595340728759766, -15.666622161865234, -13.73790454864502, -11.809186935424805, -9.88046932220459, -7.951751708984375, -6.02303409576416, -4.094316482543945, -2.1655988693237305, -0.23688507080078125, 1.6918325424194336, 3.6205501556396484, 5.549267768859863, 7.477985382080078, 9.406702995300293, 11.335420608520508, 13.264138221740723, 15.192855834960938, 17.12157440185547, 19.050291061401367, 20.979007720947266, 22.907726287841797, 24.836444854736328, 26.765161514282227, 28.693878173828125, 30.622596740722656, 32.55131530761719, 34.48003387451172, 36.408748626708984, 38.337467193603516, 40.26618576049805, 42.19490051269531, 44.123619079589844, 46.052337646484375, 47.981056213378906, 49.90977478027344, 51.8384895324707, 53.767208099365234, 55.695926666259766, 57.62464141845703, 59.55335998535156, 61.482078552246094]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 3.0, 5.0, 7.0, 7.0, 17.0, 10.0, 21.0, 22.0, 19.0, 16.0, 28.0, 29.0, 38.0, 39.0, 35.0, 37.0, 35.0, 40.0, 35.0, 49.0, 40.0, 39.0, 53.0, 35.0, 34.0, 28.0, 38.0, 29.0, 24.0, 31.0, 24.0, 20.0, 18.0, 24.0, 13.0, 5.0, 7.0, 14.0, 8.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.40625, -3.29998779296875, -3.1937255859375, -3.08746337890625, -2.981201171875, -2.87493896484375, -2.7686767578125, -2.66241455078125, -2.55615234375, -2.44989013671875, -2.3436279296875, -2.23736572265625, -2.131103515625, -2.02484130859375, -1.9185791015625, -1.81231689453125, -1.7060546875, -1.59979248046875, -1.4935302734375, -1.38726806640625, -1.281005859375, -1.17474365234375, -1.0684814453125, -0.96221923828125, -0.85595703125, -0.74969482421875, -0.6434326171875, -0.53717041015625, -0.430908203125, -0.32464599609375, -0.2183837890625, -0.11212158203125, -0.005859375, 0.10040283203125, 0.2066650390625, 0.31292724609375, 0.419189453125, 0.52545166015625, 0.6317138671875, 0.73797607421875, 0.84423828125, 0.95050048828125, 1.0567626953125, 1.16302490234375, 1.269287109375, 1.37554931640625, 1.4818115234375, 1.58807373046875, 1.6943359375, 1.80059814453125, 1.9068603515625, 2.01312255859375, 2.119384765625, 2.22564697265625, 2.3319091796875, 2.43817138671875, 2.54443359375, 2.65069580078125, 2.7569580078125, 2.86322021484375, 2.969482421875, 3.07574462890625, 3.1820068359375, 3.28826904296875, 3.39453125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 8.0, 8.0, 13.0, 16.0, 19.0, 18.0, 37.0, 46.0, 81.0, 109.0, 140.0, 212.0, 287.0, 386.0, 585.0, 879.0, 1182.0, 1779.0, 2635.0, 4106.0, 6326.0, 10356.0, 18347.0, 35125.0, 74670.0, 167542.0, 303342.0, 218033.0, 99117.0, 45615.0, 22942.0, 12542.0, 7568.0, 4718.0, 3067.0, 2073.0, 1438.0, 912.0, 677.0, 463.0, 324.0, 246.0, 158.0, 121.0, 82.0, 59.0, 45.0, 35.0, 33.0, 20.0, 5.0, 7.0, 7.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56103515625, -0.5427474975585938, -0.5244598388671875, -0.5061721801757812, -0.487884521484375, -0.46959686279296875, -0.4513092041015625, -0.43302154541015625, -0.41473388671875, -0.39644622802734375, -0.3781585693359375, -0.35987091064453125, -0.341583251953125, -0.32329559326171875, -0.3050079345703125, -0.28672027587890625, -0.2684326171875, -0.25014495849609375, -0.2318572998046875, -0.21356964111328125, -0.195281982421875, -0.17699432373046875, -0.1587066650390625, -0.14041900634765625, -0.12213134765625, -0.10384368896484375, -0.0855560302734375, -0.06726837158203125, -0.048980712890625, -0.03069305419921875, -0.0124053955078125, 0.00588226318359375, 0.024169921875, 0.04245758056640625, 0.0607452392578125, 0.07903289794921875, 0.097320556640625, 0.11560821533203125, 0.1338958740234375, 0.15218353271484375, 0.17047119140625, 0.18875885009765625, 0.2070465087890625, 0.22533416748046875, 0.243621826171875, 0.26190948486328125, 0.2801971435546875, 0.29848480224609375, 0.3167724609375, 0.33506011962890625, 0.3533477783203125, 0.37163543701171875, 0.389923095703125, 0.40821075439453125, 0.4264984130859375, 0.44478607177734375, 0.46307373046875, 0.48136138916015625, 0.4996490478515625, 0.5179367065429688, 0.536224365234375, 0.5545120239257812, 0.5727996826171875, 0.5910873413085938, 0.609375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 7.0, 6.0, 7.0, 7.0, 13.0, 13.0, 19.0, 12.0, 14.0, 21.0, 22.0, 36.0, 31.0, 43.0, 37.0, 39.0, 41.0, 30.0, 35.0, 44.0, 1074.0, 35.0, 36.0, 38.0, 33.0, 46.0, 31.0, 29.0, 25.0, 34.0, 25.0, 27.0, 13.0, 19.0, 18.0, 11.0, 5.0, 13.0, 6.0, 5.0, 6.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-2.453125, -2.38079833984375, -2.3084716796875, -2.23614501953125, -2.163818359375, -2.09149169921875, -2.0191650390625, -1.94683837890625, -1.87451171875, -1.80218505859375, -1.7298583984375, -1.65753173828125, -1.585205078125, -1.51287841796875, -1.4405517578125, -1.36822509765625, -1.2958984375, -1.22357177734375, -1.1512451171875, -1.07891845703125, -1.006591796875, -0.93426513671875, -0.8619384765625, -0.78961181640625, -0.71728515625, -0.64495849609375, -0.5726318359375, -0.50030517578125, -0.427978515625, -0.35565185546875, -0.2833251953125, -0.21099853515625, -0.138671875, -0.06634521484375, 0.0059814453125, 0.07830810546875, 0.150634765625, 0.22296142578125, 0.2952880859375, 0.36761474609375, 0.43994140625, 0.51226806640625, 0.5845947265625, 0.65692138671875, 0.729248046875, 0.80157470703125, 0.8739013671875, 0.94622802734375, 1.0185546875, 1.09088134765625, 1.1632080078125, 1.23553466796875, 1.307861328125, 1.38018798828125, 1.4525146484375, 1.52484130859375, 1.59716796875, 1.66949462890625, 1.7418212890625, 1.81414794921875, 1.886474609375, 1.95880126953125, 2.0311279296875, 2.10345458984375, 2.17578125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 10.0, 7.0, 22.0, 28.0, 42.0, 71.0, 83.0, 142.0, 184.0, 326.0, 467.0, 802.0, 1226.0, 1775.0, 2914.0, 4930.0, 7982.0, 13186.0, 22162.0, 38312.0, 67263.0, 124524.0, 346759.0, 1153099.0, 135616.0, 73224.0, 41065.0, 24111.0, 14278.0, 8553.0, 5093.0, 3245.0, 2003.0, 1289.0, 800.0, 532.0, 306.0, 226.0, 154.0, 113.0, 83.0, 40.0, 19.0, 23.0, 14.0, 9.0, 5.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0], "bins": [-0.318115234375, -0.30849456787109375, -0.2988739013671875, -0.28925323486328125, -0.279632568359375, -0.27001190185546875, -0.2603912353515625, -0.25077056884765625, -0.24114990234375, -0.23152923583984375, -0.2219085693359375, -0.21228790283203125, -0.202667236328125, -0.19304656982421875, -0.1834259033203125, -0.17380523681640625, -0.1641845703125, -0.15456390380859375, -0.1449432373046875, -0.13532257080078125, -0.125701904296875, -0.11608123779296875, -0.1064605712890625, -0.09683990478515625, -0.08721923828125, -0.07759857177734375, -0.0679779052734375, -0.05835723876953125, -0.048736572265625, -0.03911590576171875, -0.0294952392578125, -0.01987457275390625, -0.01025390625, -0.00063323974609375, 0.0089874267578125, 0.01860809326171875, 0.028228759765625, 0.03784942626953125, 0.0474700927734375, 0.05709075927734375, 0.06671142578125, 0.07633209228515625, 0.0859527587890625, 0.09557342529296875, 0.105194091796875, 0.11481475830078125, 0.1244354248046875, 0.13405609130859375, 0.1436767578125, 0.15329742431640625, 0.1629180908203125, 0.17253875732421875, 0.182159423828125, 0.19178009033203125, 0.2014007568359375, 0.21102142333984375, 0.22064208984375, 0.23026275634765625, 0.2398834228515625, 0.24950408935546875, 0.259124755859375, 0.26874542236328125, 0.2783660888671875, 0.28798675537109375, 0.297607421875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 5.0, 3.0, 4.0, 11.0, 8.0, 9.0, 17.0, 12.0, 24.0, 30.0, 34.0, 39.0, 40.0, 68.0, 108.0, 178.0, 100.0, 71.0, 35.0, 40.0, 26.0, 26.0, 20.0, 15.0, 7.0, 10.0, 10.0, 6.0, 6.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.017913818359375, -0.01740741729736328, -0.016901016235351562, -0.016394615173339844, -0.015888214111328125, -0.015381813049316406, -0.014875411987304688, -0.014369010925292969, -0.01386260986328125, -0.013356208801269531, -0.012849807739257812, -0.012343406677246094, -0.011837005615234375, -0.011330604553222656, -0.010824203491210938, -0.010317802429199219, -0.0098114013671875, -0.009305000305175781, -0.008798599243164062, -0.008292198181152344, -0.007785797119140625, -0.007279396057128906, -0.0067729949951171875, -0.006266593933105469, -0.00576019287109375, -0.005253791809082031, -0.0047473907470703125, -0.004240989685058594, -0.003734588623046875, -0.0032281875610351562, -0.0027217864990234375, -0.0022153854370117188, -0.001708984375, -0.0012025833129882812, -0.0006961822509765625, -0.00018978118896484375, 0.000316619873046875, 0.0008230209350585938, 0.0013294219970703125, 0.0018358230590820312, 0.00234222412109375, 0.0028486251831054688, 0.0033550262451171875, 0.0038614273071289062, 0.004367828369140625, 0.004874229431152344, 0.0053806304931640625, 0.005887031555175781, 0.0063934326171875, 0.006899833679199219, 0.0074062347412109375, 0.007912635803222656, 0.008419036865234375, 0.008925437927246094, 0.009431838989257812, 0.009938240051269531, 0.01044464111328125, 0.010951042175292969, 0.011457443237304688, 0.011963844299316406, 0.012470245361328125, 0.012976646423339844, 0.013483047485351562, 0.013989448547363281, 0.014495849609375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 6.0, 12.0, 9.0, 15.0, 20.0, 16.0, 13.0, 21.0, 33.0, 36.0, 54.0, 54.0, 83.0, 126.0, 126.0, 183.0, 315.0, 2369.0, 959639.0, 83637.0, 814.0, 230.0, 172.0, 118.0, 101.0, 63.0, 57.0, 37.0, 42.0, 20.0, 22.0, 13.0, 17.0, 12.0, 9.0, 8.0, 12.0, 10.0, 7.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.29931640625, -0.29046630859375, -0.2816162109375, -0.27276611328125, -0.263916015625, -0.25506591796875, -0.2462158203125, -0.23736572265625, -0.228515625, -0.21966552734375, -0.2108154296875, -0.20196533203125, -0.193115234375, -0.18426513671875, -0.1754150390625, -0.16656494140625, -0.15771484375, -0.14886474609375, -0.1400146484375, -0.13116455078125, -0.122314453125, -0.11346435546875, -0.1046142578125, -0.09576416015625, -0.0869140625, -0.07806396484375, -0.0692138671875, -0.06036376953125, -0.051513671875, -0.04266357421875, -0.0338134765625, -0.02496337890625, -0.01611328125, -0.00726318359375, 0.0015869140625, 0.01043701171875, 0.019287109375, 0.02813720703125, 0.0369873046875, 0.04583740234375, 0.0546875, 0.06353759765625, 0.0723876953125, 0.08123779296875, 0.090087890625, 0.09893798828125, 0.1077880859375, 0.11663818359375, 0.12548828125, 0.13433837890625, 0.1431884765625, 0.15203857421875, 0.160888671875, 0.16973876953125, 0.1785888671875, 0.18743896484375, 0.1962890625, 0.20513916015625, 0.2139892578125, 0.22283935546875, 0.231689453125, 0.24053955078125, 0.2493896484375, 0.25823974609375, 0.26708984375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 51.0, 864.0, 85.0, 12.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08904317021369934, -0.08130837976932526, -0.07357358187437057, -0.0658387839794159, -0.05810399353504181, -0.050369199365377426, -0.04263440519571304, -0.03489961102604866, -0.027164816856384277, -0.019430022686719894, -0.011695228517055511, -0.0039604343473911285, 0.0037743598222732544, 0.011509153991937637, 0.01924394816160202, 0.026978742331266403, 0.034713536500930786, 0.04244833067059517, 0.05018312484025955, 0.057917919009923935, 0.06565271317958832, 0.0733875036239624, 0.08112230151891708, 0.08885709941387177, 0.09659188985824585, 0.10432668030261993, 0.11206147819757462, 0.1197962760925293, 0.12753106653690338, 0.13526585698127747, 0.14300066232681274, 0.15073545277118683, 0.1584702432155609, 0.166205033659935, 0.17393982410430908, 0.18167462944984436, 0.18940941989421844, 0.19714421033859253, 0.2048790156841278, 0.2126138061285019, 0.22034859657287598, 0.22808338701725006, 0.23581817746162415, 0.24355298280715942, 0.2512877583503723, 0.2590225636959076, 0.26675736904144287, 0.27449214458465576, 0.28222694993019104, 0.2899617552757263, 0.2976965308189392, 0.3054313361644745, 0.31316614151000977, 0.32090091705322266, 0.32863572239875793, 0.3363704979419708, 0.3441053032875061, 0.3518401086330414, 0.3595748841762543, 0.36730968952178955, 0.37504446506500244, 0.3827792704105377, 0.390514075756073, 0.3982488512992859, 0.40598365664482117]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 11.0, 10.0, 18.0, 17.0, 20.0, 23.0, 30.0, 36.0, 31.0, 27.0, 42.0, 52.0, 48.0, 49.0, 37.0, 50.0, 49.0, 58.0, 47.0, 44.0, 49.0, 44.0, 37.0, 24.0, 31.0, 21.0, 12.0, 12.0, 15.0, 16.0, 17.0, 2.0, 7.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027567923069000244, -0.026634935289621353, -0.02570194937288761, -0.02476896345615387, -0.02383597567677498, -0.022902987897396088, -0.021970001980662346, -0.021037016063928604, -0.020104028284549713, -0.019171040505170822, -0.01823805458843708, -0.01730506867170334, -0.016372080892324448, -0.015439094044268131, -0.014506107196211815, -0.013573120348155499, -0.012640133500099182, -0.011707146652042866, -0.01077415980398655, -0.009841172955930233, -0.008908186107873917, -0.0079751992598176, -0.007042212411761284, -0.0061092255637049675, -0.005176238715648651, -0.004243251867592335, -0.0033102650195360184, -0.002377278171479702, -0.0014442913234233856, -0.0005113044753670692, 0.00042168237268924713, 0.0013546692207455635, 0.00228765606880188, 0.0032206429168581963, 0.004153629764914513, 0.005086616612970829, 0.006019603461027145, 0.006952590309083462, 0.007885577157139778, 0.008818564005196095, 0.009751550853252411, 0.010684537701308727, 0.011617524549365044, 0.01255051139742136, 0.013483498245477676, 0.014416485093533993, 0.01534947194159031, 0.01628245785832405, 0.017215445637702942, 0.018148433417081833, 0.019081419333815575, 0.020014405250549316, 0.020947393029928207, 0.0218803808093071, 0.02281336672604084, 0.023746352642774582, 0.024679340422153473, 0.025612328201532364, 0.026545314118266106, 0.027478300034999847, 0.02841128781437874, 0.02934427559375763, 0.03027726151049137, 0.031210247427225113, 0.032143235206604004]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 3.0, 5.0, 7.0, 7.0, 17.0, 10.0, 21.0, 22.0, 19.0, 16.0, 28.0, 29.0, 38.0, 40.0, 34.0, 37.0, 36.0, 39.0, 35.0, 49.0, 40.0, 39.0, 53.0, 35.0, 34.0, 28.0, 38.0, 28.0, 25.0, 31.0, 24.0, 20.0, 18.0, 24.0, 13.0, 5.0, 7.0, 14.0, 8.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.40625, -3.29998779296875, -3.1937255859375, -3.08746337890625, -2.981201171875, -2.87493896484375, -2.7686767578125, -2.66241455078125, -2.55615234375, -2.44989013671875, -2.3436279296875, -2.23736572265625, -2.131103515625, -2.02484130859375, -1.9185791015625, -1.81231689453125, -1.7060546875, -1.59979248046875, -1.4935302734375, -1.38726806640625, -1.281005859375, -1.17474365234375, -1.0684814453125, -0.96221923828125, -0.85595703125, -0.74969482421875, -0.6434326171875, -0.53717041015625, -0.430908203125, -0.32464599609375, -0.2183837890625, -0.11212158203125, -0.005859375, 0.10040283203125, 0.2066650390625, 0.31292724609375, 0.419189453125, 0.52545166015625, 0.6317138671875, 0.73797607421875, 0.84423828125, 0.95050048828125, 1.0567626953125, 1.16302490234375, 1.269287109375, 1.37554931640625, 1.4818115234375, 1.58807373046875, 1.6943359375, 1.80059814453125, 1.9068603515625, 2.01312255859375, 2.119384765625, 2.22564697265625, 2.3319091796875, 2.43817138671875, 2.54443359375, 2.65069580078125, 2.7569580078125, 2.86322021484375, 2.969482421875, 3.07574462890625, 3.1820068359375, 3.28826904296875, 3.39453125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 9.0, 18.0, 21.0, 14.0, 41.0, 55.0, 58.0, 94.0, 134.0, 187.0, 228.0, 374.0, 481.0, 682.0, 1021.0, 1544.0, 2413.0, 3721.0, 6144.0, 10769.0, 21208.0, 50146.0, 175080.0, 507438.0, 169333.0, 48739.0, 20760.0, 10801.0, 6135.0, 3617.0, 2309.0, 1575.0, 1020.0, 705.0, 465.0, 336.0, 226.0, 176.0, 136.0, 94.0, 68.0, 40.0, 28.0, 35.0, 20.0, 16.0, 6.0, 9.0, 7.0, 3.0, 4.0, 5.0, 2.0, 0.0, 4.0], "bins": [-11.6875, -11.3277587890625, -10.968017578125, -10.6082763671875, -10.24853515625, -9.8887939453125, -9.529052734375, -9.1693115234375, -8.8095703125, -8.4498291015625, -8.090087890625, -7.7303466796875, -7.37060546875, -7.0108642578125, -6.651123046875, -6.2913818359375, -5.931640625, -5.5718994140625, -5.212158203125, -4.8524169921875, -4.49267578125, -4.1329345703125, -3.773193359375, -3.4134521484375, -3.0537109375, -2.6939697265625, -2.334228515625, -1.9744873046875, -1.61474609375, -1.2550048828125, -0.895263671875, -0.5355224609375, -0.17578125, 0.1839599609375, 0.543701171875, 0.9034423828125, 1.26318359375, 1.6229248046875, 1.982666015625, 2.3424072265625, 2.7021484375, 3.0618896484375, 3.421630859375, 3.7813720703125, 4.14111328125, 4.5008544921875, 4.860595703125, 5.2203369140625, 5.580078125, 5.9398193359375, 6.299560546875, 6.6593017578125, 7.01904296875, 7.3787841796875, 7.738525390625, 8.0982666015625, 8.4580078125, 8.8177490234375, 9.177490234375, 9.5372314453125, 9.89697265625, 10.2567138671875, 10.616455078125, 10.9761962890625, 11.3359375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 5.0, 6.0, 4.0, 6.0, 5.0, 9.0, 11.0, 15.0, 7.0, 14.0, 17.0, 21.0, 27.0, 22.0, 31.0, 25.0, 37.0, 40.0, 65.0, 76.0, 102.0, 169.0, 1449.0, 280.0, 127.0, 70.0, 65.0, 38.0, 33.0, 44.0, 32.0, 43.0, 31.0, 23.0, 17.0, 21.0, 13.0, 9.0, 7.0, 6.0, 7.0, 7.0, 7.0, 0.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0390625, -13.6234130859375, -13.207763671875, -12.7921142578125, -12.37646484375, -11.9608154296875, -11.545166015625, -11.1295166015625, -10.7138671875, -10.2982177734375, -9.882568359375, -9.4669189453125, -9.05126953125, -8.6356201171875, -8.219970703125, -7.8043212890625, -7.388671875, -6.9730224609375, -6.557373046875, -6.1417236328125, -5.72607421875, -5.3104248046875, -4.894775390625, -4.4791259765625, -4.0634765625, -3.6478271484375, -3.232177734375, -2.8165283203125, -2.40087890625, -1.9852294921875, -1.569580078125, -1.1539306640625, -0.73828125, -0.3226318359375, 0.093017578125, 0.5086669921875, 0.92431640625, 1.3399658203125, 1.755615234375, 2.1712646484375, 2.5869140625, 3.0025634765625, 3.418212890625, 3.8338623046875, 4.24951171875, 4.6651611328125, 5.080810546875, 5.4964599609375, 5.912109375, 6.3277587890625, 6.743408203125, 7.1590576171875, 7.57470703125, 7.9903564453125, 8.406005859375, 8.8216552734375, 9.2373046875, 9.6529541015625, 10.068603515625, 10.4842529296875, 10.89990234375, 11.3155517578125, 11.731201171875, 12.1468505859375, 12.5625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 8.0, 8.0, 8.0, 7.0, 8.0, 11.0, 15.0, 14.0, 27.0, 22.0, 26.0, 35.0, 43.0, 46.0, 92.0, 192.0, 511.0, 2076.0, 32795.0, 3012639.0, 92088.0, 3691.0, 697.0, 240.0, 109.0, 65.0, 40.0, 22.0, 27.0, 20.0, 15.0, 17.0, 10.0, 8.0, 11.0, 9.0, 10.0, 9.0, 9.0, 2.0, 10.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-56.90625, -55.04833984375, -53.1904296875, -51.33251953125, -49.474609375, -47.61669921875, -45.7587890625, -43.90087890625, -42.04296875, -40.18505859375, -38.3271484375, -36.46923828125, -34.611328125, -32.75341796875, -30.8955078125, -29.03759765625, -27.1796875, -25.32177734375, -23.4638671875, -21.60595703125, -19.748046875, -17.89013671875, -16.0322265625, -14.17431640625, -12.31640625, -10.45849609375, -8.6005859375, -6.74267578125, -4.884765625, -3.02685546875, -1.1689453125, 0.68896484375, 2.546875, 4.40478515625, 6.2626953125, 8.12060546875, 9.978515625, 11.83642578125, 13.6943359375, 15.55224609375, 17.41015625, 19.26806640625, 21.1259765625, 22.98388671875, 24.841796875, 26.69970703125, 28.5576171875, 30.41552734375, 32.2734375, 34.13134765625, 35.9892578125, 37.84716796875, 39.705078125, 41.56298828125, 43.4208984375, 45.27880859375, 47.13671875, 48.99462890625, 50.8525390625, 52.71044921875, 54.568359375, 56.42626953125, 58.2841796875, 60.14208984375, 62.0]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 981.0, 33.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1167.9273681640625, -1144.395751953125, -1120.8641357421875, -1097.33251953125, -1073.8009033203125, -1050.269287109375, -1026.737548828125, -1003.2059936523438, -979.67431640625, -956.1427001953125, -932.611083984375, -909.0794677734375, -885.5477905273438, -862.0161743164062, -838.4845581054688, -814.9529418945312, -791.4213256835938, -767.8897094726562, -744.3580932617188, -720.826416015625, -697.2947998046875, -673.76318359375, -650.2315673828125, -626.699951171875, -603.1683349609375, -579.63671875, -556.1051025390625, -532.573486328125, -509.04180908203125, -485.51019287109375, -461.97857666015625, -438.44696044921875, -414.9153137207031, -391.3836975097656, -367.85205078125, -344.3204345703125, -320.788818359375, -297.2571716308594, -273.7255554199219, -250.1939239501953, -226.66229248046875, -203.1306610107422, -179.59902954101562, -156.06741333007812, -132.53578186035156, -109.004150390625, -85.4725341796875, -61.94090270996094, -38.409271240234375, -14.877643585205078, 8.653984069824219, 32.18560791015625, 55.71723937988281, 79.24887084960938, 102.78048706054688, 126.31211853027344, 149.84375, 173.37538146972656, 196.90701293945312, 220.43862915039062, 243.9702606201172, 267.50189208984375, 291.03350830078125, 314.56512451171875, 338.0967712402344]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 8.0, 5.0, 9.0, 22.0, 21.0, 27.0, 27.0, 30.0, 36.0, 53.0, 50.0, 41.0, 49.0, 63.0, 64.0, 50.0, 66.0, 49.0, 57.0, 59.0, 29.0, 36.0, 31.0, 27.0, 20.0, 21.0, 10.0, 12.0, 9.0, 9.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-68.7646484375, -66.6091079711914, -64.45357513427734, -62.298038482666016, -60.14250183105469, -57.986961364746094, -55.831424713134766, -53.67588806152344, -51.52035140991211, -49.36481475830078, -47.20927810668945, -45.053741455078125, -42.89820098876953, -40.74266815185547, -38.587127685546875, -36.43159103393555, -34.27605438232422, -32.12051773071289, -29.964981079101562, -27.8094425201416, -25.653905868530273, -23.498369216918945, -21.342830657958984, -19.187294006347656, -17.031757354736328, -14.876220703125, -12.720683097839355, -10.565145492553711, -8.409608840942383, -6.254072189331055, -4.09853458404541, -1.9429969787597656, 0.21253204345703125, 2.3680691719055176, 4.523606300354004, 6.67914342880249, 8.834680557250977, 10.990217208862305, 13.14575481414795, 15.301292419433594, 17.456829071044922, 19.61236572265625, 21.767902374267578, 23.92344093322754, 26.078977584838867, 28.234514236450195, 30.390052795410156, 32.545589447021484, 34.70112609863281, 36.85666275024414, 39.01219940185547, 41.1677360534668, 43.323272705078125, 45.47881317138672, 47.63434982299805, 49.789886474609375, 51.9454231262207, 54.10095977783203, 56.25649642944336, 58.41203308105469, 60.56757354736328, 62.723106384277344, 64.87864685058594, 67.0341796875, 69.1897201538086]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 1.0, 3.0, 6.0, 7.0, 8.0, 17.0, 14.0, 12.0, 20.0, 14.0, 17.0, 29.0, 34.0, 41.0, 29.0, 32.0, 33.0, 48.0, 32.0, 38.0, 47.0, 35.0, 44.0, 42.0, 34.0, 45.0, 33.0, 39.0, 29.0, 31.0, 20.0, 30.0, 24.0, 18.0, 13.0, 16.0, 17.0, 6.0, 4.0, 10.0, 8.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.216796875, -3.107757568359375, -2.99871826171875, -2.889678955078125, -2.7806396484375, -2.671600341796875, -2.56256103515625, -2.453521728515625, -2.344482421875, -2.235443115234375, -2.12640380859375, -2.017364501953125, -1.9083251953125, -1.799285888671875, -1.69024658203125, -1.581207275390625, -1.47216796875, -1.363128662109375, -1.25408935546875, -1.145050048828125, -1.0360107421875, -0.926971435546875, -0.81793212890625, -0.708892822265625, -0.599853515625, -0.490814208984375, -0.38177490234375, -0.272735595703125, -0.1636962890625, -0.054656982421875, 0.05438232421875, 0.163421630859375, 0.2724609375, 0.381500244140625, 0.49053955078125, 0.599578857421875, 0.7086181640625, 0.817657470703125, 0.92669677734375, 1.035736083984375, 1.144775390625, 1.253814697265625, 1.36285400390625, 1.471893310546875, 1.5809326171875, 1.689971923828125, 1.79901123046875, 1.908050537109375, 2.01708984375, 2.126129150390625, 2.23516845703125, 2.344207763671875, 2.4532470703125, 2.562286376953125, 2.67132568359375, 2.780364990234375, 2.889404296875, 2.998443603515625, 3.10748291015625, 3.216522216796875, 3.3255615234375, 3.434600830078125, 3.54364013671875, 3.652679443359375, 3.76171875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 6.0, 11.0, 9.0, 17.0, 20.0, 40.0, 60.0, 93.0, 123.0, 251.0, 366.0, 720.0, 1286.0, 2245.0, 4614.0, 9925.0, 23941.0, 75934.0, 940691.0, 2957046.0, 118879.0, 33522.0, 12841.0, 5538.0, 2682.0, 1391.0, 785.0, 467.0, 284.0, 163.0, 118.0, 52.0, 48.0, 31.0, 30.0, 13.0, 13.0, 12.0, 5.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.03125, -25.1064453125, -24.181640625, -23.2568359375, -22.33203125, -21.4072265625, -20.482421875, -19.5576171875, -18.6328125, -17.7080078125, -16.783203125, -15.8583984375, -14.93359375, -14.0087890625, -13.083984375, -12.1591796875, -11.234375, -10.3095703125, -9.384765625, -8.4599609375, -7.53515625, -6.6103515625, -5.685546875, -4.7607421875, -3.8359375, -2.9111328125, -1.986328125, -1.0615234375, -0.13671875, 0.7880859375, 1.712890625, 2.6376953125, 3.5625, 4.4873046875, 5.412109375, 6.3369140625, 7.26171875, 8.1865234375, 9.111328125, 10.0361328125, 10.9609375, 11.8857421875, 12.810546875, 13.7353515625, 14.66015625, 15.5849609375, 16.509765625, 17.4345703125, 18.359375, 19.2841796875, 20.208984375, 21.1337890625, 22.05859375, 22.9833984375, 23.908203125, 24.8330078125, 25.7578125, 26.6826171875, 27.607421875, 28.5322265625, 29.45703125, 30.3818359375, 31.306640625, 32.2314453125, 33.15625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 3.0, 7.0, 5.0, 6.0, 14.0, 19.0, 12.0, 16.0, 20.0, 31.0, 55.0, 37.0, 72.0, 84.0, 130.0, 146.0, 222.0, 328.0, 495.0, 648.0, 521.0, 358.0, 230.0, 149.0, 106.0, 95.0, 48.0, 46.0, 38.0, 31.0, 24.0, 23.0, 15.0, 7.0, 12.0, 4.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.203125, -14.68896484375, -14.1748046875, -13.66064453125, -13.146484375, -12.63232421875, -12.1181640625, -11.60400390625, -11.08984375, -10.57568359375, -10.0615234375, -9.54736328125, -9.033203125, -8.51904296875, -8.0048828125, -7.49072265625, -6.9765625, -6.46240234375, -5.9482421875, -5.43408203125, -4.919921875, -4.40576171875, -3.8916015625, -3.37744140625, -2.86328125, -2.34912109375, -1.8349609375, -1.32080078125, -0.806640625, -0.29248046875, 0.2216796875, 0.73583984375, 1.25, 1.76416015625, 2.2783203125, 2.79248046875, 3.306640625, 3.82080078125, 4.3349609375, 4.84912109375, 5.36328125, 5.87744140625, 6.3916015625, 6.90576171875, 7.419921875, 7.93408203125, 8.4482421875, 8.96240234375, 9.4765625, 9.99072265625, 10.5048828125, 11.01904296875, 11.533203125, 12.04736328125, 12.5615234375, 13.07568359375, 13.58984375, 14.10400390625, 14.6181640625, 15.13232421875, 15.646484375, 16.16064453125, 16.6748046875, 17.18896484375, 17.703125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 8.0, 12.0, 13.0, 13.0, 42.0, 59.0, 103.0, 174.0, 272.0, 398.0, 687.0, 1099.0, 1831.0, 3011.0, 5147.0, 8631.0, 15425.0, 29657.0, 62882.0, 157555.0, 658881.0, 2515382.0, 484784.0, 132264.0, 55288.0, 26700.0, 14053.0, 7995.0, 4736.0, 2764.0, 1755.0, 1046.0, 675.0, 367.0, 247.0, 132.0, 81.0, 61.0, 30.0, 14.0, 8.0, 6.0, 1.0, 4.0, 2.0, 1.0], "bins": [-30.09375, -29.330322265625, -28.56689453125, -27.803466796875, -27.0400390625, -26.276611328125, -25.51318359375, -24.749755859375, -23.986328125, -23.222900390625, -22.45947265625, -21.696044921875, -20.9326171875, -20.169189453125, -19.40576171875, -18.642333984375, -17.87890625, -17.115478515625, -16.35205078125, -15.588623046875, -14.8251953125, -14.061767578125, -13.29833984375, -12.534912109375, -11.771484375, -11.008056640625, -10.24462890625, -9.481201171875, -8.7177734375, -7.954345703125, -7.19091796875, -6.427490234375, -5.6640625, -4.900634765625, -4.13720703125, -3.373779296875, -2.6103515625, -1.846923828125, -1.08349609375, -0.320068359375, 0.443359375, 1.206787109375, 1.97021484375, 2.733642578125, 3.4970703125, 4.260498046875, 5.02392578125, 5.787353515625, 6.55078125, 7.314208984375, 8.07763671875, 8.841064453125, 9.6044921875, 10.367919921875, 11.13134765625, 11.894775390625, 12.658203125, 13.421630859375, 14.18505859375, 14.948486328125, 15.7119140625, 16.475341796875, 17.23876953125, 18.002197265625, 18.765625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 9.0, 13.0, 21.0, 17.0, 34.0, 63.0, 80.0, 103.0, 136.0, 133.0, 114.0, 99.0, 71.0, 41.0, 31.0, 14.0, 9.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-148.42059326171875, -145.14511108398438, -141.86962890625, -138.59414672851562, -135.3186798095703, -132.04319763183594, -128.76771545410156, -125.49223327636719, -122.21675109863281, -118.94126892089844, -115.6657943725586, -112.39031219482422, -109.11483001708984, -105.83935546875, -102.56387329101562, -99.28839111328125, -96.01290893554688, -92.7374267578125, -89.46195220947266, -86.18647003173828, -82.9109878540039, -79.63551330566406, -76.36003112792969, -73.08454895019531, -69.80907440185547, -66.5335922241211, -63.258113861083984, -59.982635498046875, -56.7071533203125, -53.43167495727539, -50.15619659423828, -46.880714416503906, -43.6052360534668, -40.32975769042969, -37.05427551269531, -33.7787971496582, -30.503314971923828, -27.22783660888672, -23.952356338500977, -20.676876068115234, -17.401395797729492, -14.12591552734375, -10.850435256958008, -7.574955940246582, -4.29947566986084, -1.023996353149414, 2.251483917236328, 5.52696418762207, 8.802444458007812, 12.077924728393555, 15.353404998779297, 18.628883361816406, 21.90436553955078, 25.17984390258789, 28.455324172973633, 31.730804443359375, 35.00628662109375, 38.28176498413086, 41.557247161865234, 44.832725524902344, 48.10820770263672, 51.38368606567383, 54.65916442871094, 57.93464660644531, 61.21012496948242]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 10.0, 13.0, 7.0, 14.0, 14.0, 16.0, 20.0, 21.0, 31.0, 41.0, 26.0, 34.0, 34.0, 48.0, 42.0, 47.0, 39.0, 57.0, 42.0, 44.0, 46.0, 40.0, 44.0, 37.0, 36.0, 26.0, 27.0, 25.0, 25.0, 15.0, 15.0, 11.0, 8.0, 10.0, 8.0, 6.0, 6.0, 3.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.133914947509766, -55.247379302978516, -53.360843658447266, -51.474308013916016, -49.587772369384766, -47.701236724853516, -45.814697265625, -43.92816162109375, -42.0416259765625, -40.15509033203125, -38.2685546875, -36.38201904296875, -34.4954833984375, -32.60894775390625, -30.722410202026367, -28.835874557495117, -26.9493408203125, -25.06280517578125, -23.17626953125, -21.28973388671875, -19.4031982421875, -17.51666259765625, -15.630125045776367, -13.743589401245117, -11.857053756713867, -9.970518112182617, -8.083982467651367, -6.197445869445801, -4.310910224914551, -2.424374580383301, -0.5378379821777344, 1.3486976623535156, 3.2352294921875, 5.12176513671875, 7.008301258087158, 8.894837379455566, 10.781373023986816, 12.667908668518066, 14.554445266723633, 16.440980911254883, 18.327516555786133, 20.214052200317383, 22.100587844848633, 23.987125396728516, 25.873661041259766, 27.760196685791016, 29.646732330322266, 31.533267974853516, 33.419803619384766, 35.306339263916016, 37.192874908447266, 39.079410552978516, 40.965946197509766, 42.852481842041016, 44.73902130126953, 46.62555694580078, 48.51209259033203, 50.39862823486328, 52.28516387939453, 54.17169952392578, 56.05823516845703, 57.94477081298828, 59.83130645751953, 61.71784210205078, 63.60437774658203]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 9.0, 6.0, 10.0, 8.0, 7.0, 9.0, 20.0, 18.0, 22.0, 28.0, 23.0, 33.0, 33.0, 34.0, 39.0, 38.0, 45.0, 46.0, 57.0, 49.0, 48.0, 57.0, 44.0, 33.0, 28.0, 34.0, 27.0, 31.0, 29.0, 20.0, 25.0, 11.0, 13.0, 13.0, 10.0, 11.0, 7.0, 8.0, 4.0, 2.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.896484375, -3.768280029296875, -3.64007568359375, -3.511871337890625, -3.3836669921875, -3.255462646484375, -3.12725830078125, -2.999053955078125, -2.870849609375, -2.742645263671875, -2.61444091796875, -2.486236572265625, -2.3580322265625, -2.229827880859375, -2.10162353515625, -1.973419189453125, -1.84521484375, -1.717010498046875, -1.58880615234375, -1.460601806640625, -1.3323974609375, -1.204193115234375, -1.07598876953125, -0.947784423828125, -0.819580078125, -0.691375732421875, -0.56317138671875, -0.434967041015625, -0.3067626953125, -0.178558349609375, -0.05035400390625, 0.077850341796875, 0.2060546875, 0.334259033203125, 0.46246337890625, 0.590667724609375, 0.7188720703125, 0.847076416015625, 0.97528076171875, 1.103485107421875, 1.231689453125, 1.359893798828125, 1.48809814453125, 1.616302490234375, 1.7445068359375, 1.872711181640625, 2.00091552734375, 2.129119873046875, 2.25732421875, 2.385528564453125, 2.51373291015625, 2.641937255859375, 2.7701416015625, 2.898345947265625, 3.02655029296875, 3.154754638671875, 3.282958984375, 3.411163330078125, 3.53936767578125, 3.667572021484375, 3.7957763671875, 3.923980712890625, 4.05218505859375, 4.180389404296875, 4.30859375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 0.0, 12.0, 15.0, 25.0, 28.0, 43.0, 56.0, 93.0, 119.0, 151.0, 212.0, 347.0, 434.0, 629.0, 895.0, 1201.0, 1830.0, 2794.0, 4239.0, 6700.0, 11037.0, 19025.0, 35404.0, 67529.0, 133831.0, 245926.0, 239278.0, 129626.0, 64652.0, 34002.0, 18206.0, 10755.0, 6538.0, 4061.0, 2680.0, 1788.0, 1297.0, 905.0, 652.0, 402.0, 310.0, 244.0, 156.0, 126.0, 93.0, 53.0, 37.0, 45.0, 25.0, 15.0, 8.0, 10.0, 9.0, 2.0, 4.0, 0.0, 2.0], "bins": [-0.587890625, -0.5700607299804688, -0.5522308349609375, -0.5344009399414062, -0.516571044921875, -0.49874114990234375, -0.4809112548828125, -0.46308135986328125, -0.44525146484375, -0.42742156982421875, -0.4095916748046875, -0.39176177978515625, -0.373931884765625, -0.35610198974609375, -0.3382720947265625, -0.32044219970703125, -0.3026123046875, -0.28478240966796875, -0.2669525146484375, -0.24912261962890625, -0.231292724609375, -0.21346282958984375, -0.1956329345703125, -0.17780303955078125, -0.15997314453125, -0.14214324951171875, -0.1243133544921875, -0.10648345947265625, -0.088653564453125, -0.07082366943359375, -0.0529937744140625, -0.03516387939453125, -0.017333984375, 0.00049591064453125, 0.0183258056640625, 0.03615570068359375, 0.053985595703125, 0.07181549072265625, 0.0896453857421875, 0.10747528076171875, 0.12530517578125, 0.14313507080078125, 0.1609649658203125, 0.17879486083984375, 0.196624755859375, 0.21445465087890625, 0.2322845458984375, 0.25011444091796875, 0.2679443359375, 0.28577423095703125, 0.3036041259765625, 0.32143402099609375, 0.339263916015625, 0.35709381103515625, 0.3749237060546875, 0.39275360107421875, 0.41058349609375, 0.42841339111328125, 0.4462432861328125, 0.46407318115234375, 0.481903076171875, 0.49973297119140625, 0.5175628662109375, 0.5353927612304688, 0.55322265625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 6.0, 8.0, 5.0, 16.0, 18.0, 17.0, 17.0, 24.0, 20.0, 32.0, 29.0, 41.0, 32.0, 40.0, 39.0, 51.0, 45.0, 40.0, 1075.0, 54.0, 37.0, 51.0, 49.0, 34.0, 31.0, 26.0, 25.0, 29.0, 26.0, 18.0, 21.0, 13.0, 12.0, 12.0, 9.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.396484375, -2.308258056640625, -2.22003173828125, -2.131805419921875, -2.0435791015625, -1.955352783203125, -1.86712646484375, -1.778900146484375, -1.690673828125, -1.602447509765625, -1.51422119140625, -1.425994873046875, -1.3377685546875, -1.249542236328125, -1.16131591796875, -1.073089599609375, -0.98486328125, -0.896636962890625, -0.80841064453125, -0.720184326171875, -0.6319580078125, -0.543731689453125, -0.45550537109375, -0.367279052734375, -0.279052734375, -0.190826416015625, -0.10260009765625, -0.014373779296875, 0.0738525390625, 0.162078857421875, 0.25030517578125, 0.338531494140625, 0.4267578125, 0.514984130859375, 0.60321044921875, 0.691436767578125, 0.7796630859375, 0.867889404296875, 0.95611572265625, 1.044342041015625, 1.132568359375, 1.220794677734375, 1.30902099609375, 1.397247314453125, 1.4854736328125, 1.573699951171875, 1.66192626953125, 1.750152587890625, 1.83837890625, 1.926605224609375, 2.01483154296875, 2.103057861328125, 2.1912841796875, 2.279510498046875, 2.36773681640625, 2.455963134765625, 2.544189453125, 2.632415771484375, 2.72064208984375, 2.808868408203125, 2.8970947265625, 2.985321044921875, 3.07354736328125, 3.161773681640625, 3.25]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 2.0, 5.0, 7.0, 7.0, 20.0, 30.0, 60.0, 81.0, 112.0, 179.0, 327.0, 551.0, 842.0, 1349.0, 2204.0, 3655.0, 5900.0, 10170.0, 16764.0, 28867.0, 49793.0, 91480.0, 170362.0, 1294631.0, 187207.0, 100478.0, 54734.0, 31362.0, 18310.0, 11026.0, 6517.0, 3889.0, 2364.0, 1483.0, 899.0, 551.0, 359.0, 212.0, 129.0, 76.0, 57.0, 35.0, 25.0, 8.0, 9.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.315185546875, -0.30487823486328125, -0.2945709228515625, -0.28426361083984375, -0.273956298828125, -0.26364898681640625, -0.2533416748046875, -0.24303436279296875, -0.23272705078125, -0.22241973876953125, -0.2121124267578125, -0.20180511474609375, -0.191497802734375, -0.18119049072265625, -0.1708831787109375, -0.16057586669921875, -0.1502685546875, -0.13996124267578125, -0.1296539306640625, -0.11934661865234375, -0.109039306640625, -0.09873199462890625, -0.0884246826171875, -0.07811737060546875, -0.06781005859375, -0.05750274658203125, -0.0471954345703125, -0.03688812255859375, -0.026580810546875, -0.01627349853515625, -0.0059661865234375, 0.00434112548828125, 0.0146484375, 0.02495574951171875, 0.0352630615234375, 0.04557037353515625, 0.055877685546875, 0.06618499755859375, 0.0764923095703125, 0.08679962158203125, 0.09710693359375, 0.10741424560546875, 0.1177215576171875, 0.12802886962890625, 0.138336181640625, 0.14864349365234375, 0.1589508056640625, 0.16925811767578125, 0.1795654296875, 0.18987274169921875, 0.2001800537109375, 0.21048736572265625, 0.220794677734375, 0.23110198974609375, 0.2414093017578125, 0.25171661376953125, 0.26202392578125, 0.27233123779296875, 0.2826385498046875, 0.29294586181640625, 0.303253173828125, 0.31356048583984375, 0.3238677978515625, 0.33417510986328125, 0.344482421875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 5.0, 3.0, 4.0, 4.0, 4.0, 4.0, 6.0, 7.0, 13.0, 7.0, 23.0, 36.0, 39.0, 51.0, 55.0, 127.0, 194.0, 134.0, 66.0, 58.0, 46.0, 31.0, 14.0, 15.0, 4.0, 5.0, 7.0, 9.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0108795166015625, -0.010485172271728516, -0.010090827941894531, -0.009696483612060547, -0.009302139282226562, -0.008907794952392578, -0.008513450622558594, -0.00811910629272461, -0.007724761962890625, -0.007330417633056641, -0.006936073303222656, -0.006541728973388672, -0.0061473846435546875, -0.005753040313720703, -0.005358695983886719, -0.004964351654052734, -0.00457000732421875, -0.004175662994384766, -0.0037813186645507812, -0.003386974334716797, -0.0029926300048828125, -0.002598285675048828, -0.0022039413452148438, -0.0018095970153808594, -0.001415252685546875, -0.0010209083557128906, -0.0006265640258789062, -0.00023221969604492188, 0.0001621246337890625, 0.0005564689636230469, 0.0009508132934570312, 0.0013451576232910156, 0.001739501953125, 0.0021338462829589844, 0.0025281906127929688, 0.002922534942626953, 0.0033168792724609375, 0.003711223602294922, 0.004105567932128906, 0.004499912261962891, 0.004894256591796875, 0.005288600921630859, 0.005682945251464844, 0.006077289581298828, 0.0064716339111328125, 0.006865978240966797, 0.007260322570800781, 0.007654666900634766, 0.00804901123046875, 0.008443355560302734, 0.008837699890136719, 0.009232044219970703, 0.009626388549804688, 0.010020732879638672, 0.010415077209472656, 0.01080942153930664, 0.011203765869140625, 0.01159811019897461, 0.011992454528808594, 0.012386798858642578, 0.012781143188476562, 0.013175487518310547, 0.013569831848144531, 0.013964176177978516, 0.0143585205078125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 3.0, 1.0, 10.0, 11.0, 13.0, 19.0, 22.0, 46.0, 54.0, 102.0, 154.0, 350.0, 7394.0, 1007657.0, 31598.0, 570.0, 197.0, 94.0, 74.0, 39.0, 25.0, 23.0, 12.0, 8.0, 8.0, 12.0, 8.0, 7.0, 4.0, 2.0, 5.0, 1.0, 3.0, 6.0, 0.0, 2.0, 2.0, 2.0, 4.0], "bins": [-0.357666015625, -0.3484077453613281, -0.33914947509765625, -0.3298912048339844, -0.3206329345703125, -0.3113746643066406, -0.30211639404296875, -0.2928581237792969, -0.283599853515625, -0.2743415832519531, -0.26508331298828125, -0.2558250427246094, -0.2465667724609375, -0.23730850219726562, -0.22805023193359375, -0.21879196166992188, -0.20953369140625, -0.20027542114257812, -0.19101715087890625, -0.18175888061523438, -0.1725006103515625, -0.16324234008789062, -0.15398406982421875, -0.14472579956054688, -0.135467529296875, -0.12620925903320312, -0.11695098876953125, -0.10769271850585938, -0.0984344482421875, -0.08917617797851562, -0.07991790771484375, -0.07065963745117188, -0.0614013671875, -0.052143096923828125, -0.04288482666015625, -0.033626556396484375, -0.0243682861328125, -0.015110015869140625, -0.00585174560546875, 0.003406524658203125, 0.012664794921875, 0.021923065185546875, 0.03118133544921875, 0.040439605712890625, 0.0496978759765625, 0.058956146240234375, 0.06821441650390625, 0.07747268676757812, 0.08673095703125, 0.09598922729492188, 0.10524749755859375, 0.11450576782226562, 0.1237640380859375, 0.13302230834960938, 0.14228057861328125, 0.15153884887695312, 0.160797119140625, 0.17005538940429688, 0.17931365966796875, 0.18857192993164062, 0.1978302001953125, 0.20708847045898438, 0.21634674072265625, 0.22560501098632812, 0.23486328125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 10.0, 30.0, 310.0, 578.0, 71.0, 19.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1947118639945984, -0.18916688859462738, -0.18362189829349518, -0.17807692289352417, -0.17253194749355316, -0.16698697209358215, -0.16144198179244995, -0.15589700639247894, -0.15035203099250793, -0.14480705559253693, -0.13926206529140472, -0.13371708989143372, -0.1281721144914627, -0.1226271316409111, -0.1170821487903595, -0.11153717339038849, -0.10599218308925629, -0.10044720023870468, -0.09490222483873367, -0.08935724198818207, -0.08381226658821106, -0.07826728373765945, -0.07272230088710785, -0.06717732548713684, -0.061632342636585236, -0.05608736351132393, -0.05054238438606262, -0.04499740153551102, -0.03945242241024971, -0.0339074432849884, -0.028362460434436798, -0.02281748130917549, -0.01727248728275299, -0.01172750722616911, -0.006182527169585228, -0.000637546181678772, 0.004907432943582535, 0.010452412068843842, 0.015997394919395447, 0.021542374044656754, 0.02708735316991806, 0.03263233229517937, 0.038177311420440674, 0.04372229427099228, 0.049267273396253586, 0.05481225252151489, 0.0603572353720665, 0.0659022182226181, 0.07144719362258911, 0.07699217647314072, 0.08253715187311172, 0.08808213472366333, 0.09362711012363434, 0.09917209297418594, 0.10471707582473755, 0.11026205122470856, 0.11580703407526016, 0.12135201692581177, 0.12689699232578278, 0.13244196772575378, 0.137986958026886, 0.143531933426857, 0.149076908826828, 0.1546218991279602, 0.1601668745279312]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 3.0, 8.0, 11.0, 15.0, 12.0, 13.0, 12.0, 21.0, 31.0, 35.0, 29.0, 32.0, 37.0, 34.0, 43.0, 35.0, 42.0, 39.0, 51.0, 44.0, 42.0, 53.0, 44.0, 47.0, 30.0, 36.0, 41.0, 26.0, 21.0, 27.0, 22.0, 20.0, 14.0, 9.0, 7.0, 8.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016757488250732422, -0.016219746321439743, -0.015682004392147064, -0.015144262462854385, -0.014606520533561707, -0.014068778604269028, -0.013531036674976349, -0.01299329474568367, -0.012455552816390991, -0.011917810887098312, -0.011380068957805634, -0.010842327028512955, -0.010304585099220276, -0.009766843169927597, -0.009229101240634918, -0.00869135931134224, -0.00815361738204956, -0.007615875452756882, -0.007078133523464203, -0.006540391594171524, -0.006002649664878845, -0.005464907735586166, -0.0049271658062934875, -0.004389423877000809, -0.00385168194770813, -0.003313940018415451, -0.002776198089122772, -0.0022384561598300934, -0.0017007142305374146, -0.0011629723012447357, -0.0006252303719520569, -8.748844265937805e-05, 0.0004502534866333008, 0.0009879954159259796, 0.0015257373452186584, 0.0020634792745113373, 0.002601221203804016, 0.003138963133096695, 0.0036767050623893738, 0.004214446991682053, 0.0047521889209747314, 0.00528993085026741, 0.005827672779560089, 0.006365414708852768, 0.006903156638145447, 0.007440898567438126, 0.007978640496730804, 0.008516382426023483, 0.009054124355316162, 0.009591866284608841, 0.01012960821390152, 0.010667350143194199, 0.011205092072486877, 0.011742834001779556, 0.012280575931072235, 0.012818317860364914, 0.013356059789657593, 0.013893801718950272, 0.01443154364824295, 0.01496928557753563, 0.015507027506828308, 0.016044769436120987, 0.016582511365413666, 0.017120253294706345, 0.017657995223999023]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 9.0, 6.0, 10.0, 8.0, 7.0, 9.0, 20.0, 18.0, 22.0, 28.0, 23.0, 33.0, 33.0, 34.0, 39.0, 39.0, 44.0, 45.0, 58.0, 49.0, 48.0, 57.0, 44.0, 33.0, 28.0, 34.0, 27.0, 31.0, 29.0, 20.0, 25.0, 11.0, 13.0, 13.0, 10.0, 11.0, 7.0, 8.0, 4.0, 2.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.896484375, -3.768280029296875, -3.64007568359375, -3.511871337890625, -3.3836669921875, -3.255462646484375, -3.12725830078125, -2.999053955078125, -2.870849609375, -2.742645263671875, -2.61444091796875, -2.486236572265625, -2.3580322265625, -2.229827880859375, -2.10162353515625, -1.973419189453125, -1.84521484375, -1.717010498046875, -1.58880615234375, -1.460601806640625, -1.3323974609375, -1.204193115234375, -1.07598876953125, -0.947784423828125, -0.819580078125, -0.691375732421875, -0.56317138671875, -0.434967041015625, -0.3067626953125, -0.178558349609375, -0.05035400390625, 0.077850341796875, 0.2060546875, 0.334259033203125, 0.46246337890625, 0.590667724609375, 0.7188720703125, 0.847076416015625, 0.97528076171875, 1.103485107421875, 1.231689453125, 1.359893798828125, 1.48809814453125, 1.616302490234375, 1.7445068359375, 1.872711181640625, 2.00091552734375, 2.129119873046875, 2.25732421875, 2.385528564453125, 2.51373291015625, 2.641937255859375, 2.7701416015625, 2.898345947265625, 3.02655029296875, 3.154754638671875, 3.282958984375, 3.411163330078125, 3.53936767578125, 3.667572021484375, 3.7957763671875, 3.923980712890625, 4.05218505859375, 4.180389404296875, 4.30859375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 1.0, 2.0, 6.0, 14.0, 18.0, 27.0, 30.0, 32.0, 53.0, 57.0, 96.0, 137.0, 205.0, 300.0, 417.0, 777.0, 1419.0, 2962.0, 9700.0, 410442.0, 603140.0, 11409.0, 3380.0, 1578.0, 883.0, 491.0, 327.0, 204.0, 125.0, 94.0, 65.0, 37.0, 29.0, 20.0, 19.0, 17.0, 13.0, 8.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.828125, -19.189453125, -18.55078125, -17.912109375, -17.2734375, -16.634765625, -15.99609375, -15.357421875, -14.71875, -14.080078125, -13.44140625, -12.802734375, -12.1640625, -11.525390625, -10.88671875, -10.248046875, -9.609375, -8.970703125, -8.33203125, -7.693359375, -7.0546875, -6.416015625, -5.77734375, -5.138671875, -4.5, -3.861328125, -3.22265625, -2.583984375, -1.9453125, -1.306640625, -0.66796875, -0.029296875, 0.609375, 1.248046875, 1.88671875, 2.525390625, 3.1640625, 3.802734375, 4.44140625, 5.080078125, 5.71875, 6.357421875, 6.99609375, 7.634765625, 8.2734375, 8.912109375, 9.55078125, 10.189453125, 10.828125, 11.466796875, 12.10546875, 12.744140625, 13.3828125, 14.021484375, 14.66015625, 15.298828125, 15.9375, 16.576171875, 17.21484375, 17.853515625, 18.4921875, 19.130859375, 19.76953125, 20.408203125, 21.046875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 10.0, 6.0, 12.0, 11.0, 9.0, 6.0, 13.0, 19.0, 22.0, 26.0, 27.0, 37.0, 31.0, 31.0, 31.0, 42.0, 60.0, 125.0, 364.0, 1499.0, 133.0, 73.0, 59.0, 48.0, 45.0, 26.0, 25.0, 40.0, 23.0, 26.0, 30.0, 19.0, 20.0, 13.0, 10.0, 15.0, 12.0, 6.0, 12.0, 8.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0], "bins": [-14.75, -14.3304443359375, -13.910888671875, -13.4913330078125, -13.07177734375, -12.6522216796875, -12.232666015625, -11.8131103515625, -11.3935546875, -10.9739990234375, -10.554443359375, -10.1348876953125, -9.71533203125, -9.2957763671875, -8.876220703125, -8.4566650390625, -8.037109375, -7.6175537109375, -7.197998046875, -6.7784423828125, -6.35888671875, -5.9393310546875, -5.519775390625, -5.1002197265625, -4.6806640625, -4.2611083984375, -3.841552734375, -3.4219970703125, -3.00244140625, -2.5828857421875, -2.163330078125, -1.7437744140625, -1.32421875, -0.9046630859375, -0.485107421875, -0.0655517578125, 0.35400390625, 0.7735595703125, 1.193115234375, 1.6126708984375, 2.0322265625, 2.4517822265625, 2.871337890625, 3.2908935546875, 3.71044921875, 4.1300048828125, 4.549560546875, 4.9691162109375, 5.388671875, 5.8082275390625, 6.227783203125, 6.6473388671875, 7.06689453125, 7.4864501953125, 7.906005859375, 8.3255615234375, 8.7451171875, 9.1646728515625, 9.584228515625, 10.0037841796875, 10.42333984375, 10.8428955078125, 11.262451171875, 11.6820068359375, 12.1015625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 5.0, 2.0, 6.0, 8.0, 9.0, 13.0, 17.0, 13.0, 15.0, 27.0, 23.0, 41.0, 43.0, 70.0, 106.0, 156.0, 399.0, 1081.0, 2973.0, 9197.0, 614319.0, 2499552.0, 11925.0, 3452.0, 1253.0, 463.0, 184.0, 107.0, 65.0, 39.0, 32.0, 22.0, 14.0, 13.0, 15.0, 13.0, 9.0, 9.0, 8.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-33.84375, -32.82080078125, -31.7978515625, -30.77490234375, -29.751953125, -28.72900390625, -27.7060546875, -26.68310546875, -25.66015625, -24.63720703125, -23.6142578125, -22.59130859375, -21.568359375, -20.54541015625, -19.5224609375, -18.49951171875, -17.4765625, -16.45361328125, -15.4306640625, -14.40771484375, -13.384765625, -12.36181640625, -11.3388671875, -10.31591796875, -9.29296875, -8.27001953125, -7.2470703125, -6.22412109375, -5.201171875, -4.17822265625, -3.1552734375, -2.13232421875, -1.109375, -0.08642578125, 0.9365234375, 1.95947265625, 2.982421875, 4.00537109375, 5.0283203125, 6.05126953125, 7.07421875, 8.09716796875, 9.1201171875, 10.14306640625, 11.166015625, 12.18896484375, 13.2119140625, 14.23486328125, 15.2578125, 16.28076171875, 17.3037109375, 18.32666015625, 19.349609375, 20.37255859375, 21.3955078125, 22.41845703125, 23.44140625, 24.46435546875, 25.4873046875, 26.51025390625, 27.533203125, 28.55615234375, 29.5791015625, 30.60205078125, 31.625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 114.0, 743.0, 150.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-216.32150268554688, -211.6716766357422, -207.0218505859375, -202.3720245361328, -197.72219848632812, -193.07237243652344, -188.42254638671875, -183.772705078125, -179.12289428710938, -174.4730682373047, -169.8232421875, -165.1734161376953, -160.52359008789062, -155.87376403808594, -151.22393798828125, -146.5740966796875, -141.9242706298828, -137.27444458007812, -132.62461853027344, -127.97479248046875, -123.32496643066406, -118.67514038085938, -114.02530670166016, -109.37548065185547, -104.72565460205078, -100.0758285522461, -95.4260025024414, -90.77617645263672, -86.1263427734375, -81.47651672363281, -76.82669067382812, -72.17686462402344, -67.52702331542969, -62.877197265625, -58.22737121582031, -53.57754135131836, -48.92771530151367, -44.277889251708984, -39.62805938720703, -34.978233337402344, -30.328407287597656, -25.67858123779297, -21.02875328063965, -16.378925323486328, -11.72909927368164, -7.079273223876953, -2.429445266723633, 2.2203826904296875, 6.870208740234375, 11.520035743713379, 16.169862747192383, 20.819690704345703, 25.46951675415039, 30.119342803955078, 34.76917266845703, 39.41899871826172, 44.068824768066406, 48.718650817871094, 53.36847686767578, 58.018306732177734, 62.66813278198242, 67.31796264648438, 71.96778869628906, 76.61761474609375, 81.26744079589844]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 3.0, 6.0, 4.0, 10.0, 11.0, 8.0, 8.0, 10.0, 16.0, 17.0, 22.0, 17.0, 29.0, 37.0, 38.0, 39.0, 42.0, 38.0, 36.0, 42.0, 33.0, 52.0, 39.0, 40.0, 45.0, 39.0, 34.0, 28.0, 36.0, 33.0, 33.0, 31.0, 24.0, 17.0, 14.0, 15.0, 8.0, 10.0, 12.0, 4.0, 2.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.88842010498047, -45.42708206176758, -43.96574401855469, -42.5044059753418, -41.043067932128906, -39.581729888916016, -38.120391845703125, -36.6590576171875, -35.197715759277344, -33.73637771606445, -32.27503967285156, -30.813701629638672, -29.35236358642578, -27.89102554321289, -26.429689407348633, -24.968351364135742, -23.507015228271484, -22.045677185058594, -20.584339141845703, -19.123001098632812, -17.661663055419922, -16.20032501220703, -14.738988876342773, -13.277650833129883, -11.816312789916992, -10.354974746704102, -8.893636703491211, -7.432299613952637, -5.970961570739746, -4.5096235275268555, -3.0482864379882812, -1.5869483947753906, -0.12561416625976562, 1.335723638534546, 2.7970614433288574, 4.25839900970459, 5.7197370529174805, 7.181075096130371, 8.642412185668945, 10.103750228881836, 11.565088272094727, 13.026426315307617, 14.487764358520508, 15.949101448059082, 17.410438537597656, 18.871776580810547, 20.333114624023438, 21.794452667236328, 23.25579071044922, 24.71712875366211, 26.178466796875, 27.63980484008789, 29.10114288330078, 30.562480926513672, 32.02381896972656, 33.48515319824219, 34.946495056152344, 36.407833099365234, 37.869171142578125, 39.330509185791016, 40.791847229003906, 42.2531852722168, 43.71452331542969, 45.17585754394531, 46.6371955871582]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 10.0, 10.0, 5.0, 9.0, 11.0, 20.0, 21.0, 21.0, 28.0, 31.0, 31.0, 35.0, 36.0, 36.0, 40.0, 49.0, 42.0, 45.0, 66.0, 42.0, 46.0, 45.0, 38.0, 34.0, 29.0, 28.0, 32.0, 23.0, 23.0, 23.0, 7.0, 12.0, 15.0, 9.0, 8.0, 12.0, 5.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.09765625, -3.9661865234375, -3.834716796875, -3.7032470703125, -3.57177734375, -3.4403076171875, -3.308837890625, -3.1773681640625, -3.0458984375, -2.9144287109375, -2.782958984375, -2.6514892578125, -2.52001953125, -2.3885498046875, -2.257080078125, -2.1256103515625, -1.994140625, -1.8626708984375, -1.731201171875, -1.5997314453125, -1.46826171875, -1.3367919921875, -1.205322265625, -1.0738525390625, -0.9423828125, -0.8109130859375, -0.679443359375, -0.5479736328125, -0.41650390625, -0.2850341796875, -0.153564453125, -0.0220947265625, 0.109375, 0.2408447265625, 0.372314453125, 0.5037841796875, 0.63525390625, 0.7667236328125, 0.898193359375, 1.0296630859375, 1.1611328125, 1.2926025390625, 1.424072265625, 1.5555419921875, 1.68701171875, 1.8184814453125, 1.949951171875, 2.0814208984375, 2.212890625, 2.3443603515625, 2.475830078125, 2.6072998046875, 2.73876953125, 2.8702392578125, 3.001708984375, 3.1331787109375, 3.2646484375, 3.3961181640625, 3.527587890625, 3.6590576171875, 3.79052734375, 3.9219970703125, 4.053466796875, 4.1849365234375, 4.31640625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 7.0, 13.0, 20.0, 19.0, 35.0, 44.0, 83.0, 140.0, 259.0, 396.0, 646.0, 1294.0, 2435.0, 5017.0, 11924.0, 32546.0, 144737.0, 3452370.0, 459640.0, 52791.0, 16562.0, 6684.0, 3057.0, 1535.0, 797.0, 439.0, 288.0, 184.0, 103.0, 62.0, 44.0, 27.0, 20.0, 17.0, 11.0, 10.0, 5.0, 5.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.65625, -26.724853515625, -25.79345703125, -24.862060546875, -23.9306640625, -22.999267578125, -22.06787109375, -21.136474609375, -20.205078125, -19.273681640625, -18.34228515625, -17.410888671875, -16.4794921875, -15.548095703125, -14.61669921875, -13.685302734375, -12.75390625, -11.822509765625, -10.89111328125, -9.959716796875, -9.0283203125, -8.096923828125, -7.16552734375, -6.234130859375, -5.302734375, -4.371337890625, -3.43994140625, -2.508544921875, -1.5771484375, -0.645751953125, 0.28564453125, 1.217041015625, 2.1484375, 3.079833984375, 4.01123046875, 4.942626953125, 5.8740234375, 6.805419921875, 7.73681640625, 8.668212890625, 9.599609375, 10.531005859375, 11.46240234375, 12.393798828125, 13.3251953125, 14.256591796875, 15.18798828125, 16.119384765625, 17.05078125, 17.982177734375, 18.91357421875, 19.844970703125, 20.7763671875, 21.707763671875, 22.63916015625, 23.570556640625, 24.501953125, 25.433349609375, 26.36474609375, 27.296142578125, 28.2275390625, 29.158935546875, 30.09033203125, 31.021728515625, 31.953125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 1.0, 7.0, 6.0, 5.0, 14.0, 11.0, 22.0, 20.0, 33.0, 37.0, 44.0, 49.0, 68.0, 80.0, 132.0, 180.0, 254.0, 424.0, 607.0, 607.0, 475.0, 272.0, 176.0, 129.0, 89.0, 77.0, 58.0, 44.0, 33.0, 21.0, 20.0, 26.0, 14.0, 10.0, 10.0, 3.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.8359375, -15.3272705078125, -14.818603515625, -14.3099365234375, -13.80126953125, -13.2926025390625, -12.783935546875, -12.2752685546875, -11.7666015625, -11.2579345703125, -10.749267578125, -10.2406005859375, -9.73193359375, -9.2232666015625, -8.714599609375, -8.2059326171875, -7.697265625, -7.1885986328125, -6.679931640625, -6.1712646484375, -5.66259765625, -5.1539306640625, -4.645263671875, -4.1365966796875, -3.6279296875, -3.1192626953125, -2.610595703125, -2.1019287109375, -1.59326171875, -1.0845947265625, -0.575927734375, -0.0672607421875, 0.44140625, 0.9500732421875, 1.458740234375, 1.9674072265625, 2.47607421875, 2.9847412109375, 3.493408203125, 4.0020751953125, 4.5107421875, 5.0194091796875, 5.528076171875, 6.0367431640625, 6.54541015625, 7.0540771484375, 7.562744140625, 8.0714111328125, 8.580078125, 9.0887451171875, 9.597412109375, 10.1060791015625, 10.61474609375, 11.1234130859375, 11.632080078125, 12.1407470703125, 12.6494140625, 13.1580810546875, 13.666748046875, 14.1754150390625, 14.68408203125, 15.1927490234375, 15.701416015625, 16.2100830078125, 16.71875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 3.0, 4.0, 9.0, 16.0, 18.0, 39.0, 59.0, 83.0, 127.0, 193.0, 255.0, 454.0, 588.0, 949.0, 1514.0, 2411.0, 3890.0, 6290.0, 10617.0, 18325.0, 33722.0, 67519.0, 160691.0, 654445.0, 2364761.0, 577080.0, 149472.0, 63937.0, 32465.0, 17785.0, 10225.0, 6070.0, 3661.0, 2372.0, 1470.0, 949.0, 637.0, 374.0, 252.0, 187.0, 118.0, 89.0, 44.0, 40.0, 28.0, 13.0, 9.0, 10.0, 4.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-21.234375, -20.580322265625, -19.92626953125, -19.272216796875, -18.6181640625, -17.964111328125, -17.31005859375, -16.656005859375, -16.001953125, -15.347900390625, -14.69384765625, -14.039794921875, -13.3857421875, -12.731689453125, -12.07763671875, -11.423583984375, -10.76953125, -10.115478515625, -9.46142578125, -8.807373046875, -8.1533203125, -7.499267578125, -6.84521484375, -6.191162109375, -5.537109375, -4.883056640625, -4.22900390625, -3.574951171875, -2.9208984375, -2.266845703125, -1.61279296875, -0.958740234375, -0.3046875, 0.349365234375, 1.00341796875, 1.657470703125, 2.3115234375, 2.965576171875, 3.61962890625, 4.273681640625, 4.927734375, 5.581787109375, 6.23583984375, 6.889892578125, 7.5439453125, 8.197998046875, 8.85205078125, 9.506103515625, 10.16015625, 10.814208984375, 11.46826171875, 12.122314453125, 12.7763671875, 13.430419921875, 14.08447265625, 14.738525390625, 15.392578125, 16.046630859375, 16.70068359375, 17.354736328125, 18.0087890625, 18.662841796875, 19.31689453125, 19.970947265625, 20.625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 10.0, 20.0, 53.0, 103.0, 191.0, 242.0, 200.0, 111.0, 47.0, 22.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.7401351928711, -84.49911499023438, -77.25808715820312, -70.0170669555664, -62.77604293823242, -55.53501892089844, -48.29399871826172, -41.052974700927734, -33.81195068359375, -26.570926666259766, -19.329904556274414, -12.088882446289062, -4.847858428955078, 2.3931655883789062, 9.634185791015625, 16.87520980834961, 24.116233825683594, 31.357257843017578, 38.59828186035156, 45.83930206298828, 53.080326080322266, 60.32135009765625, 67.56237030029297, 74.80339050292969, 82.04441833496094, 89.28543853759766, 96.5264663696289, 103.76748657226562, 111.00851440429688, 118.2495346069336, 125.49055480957031, 132.73158264160156, 139.97259521484375, 147.213623046875, 154.4546356201172, 161.69566345214844, 168.9366912841797, 176.17770385742188, 183.41873168945312, 190.65975952148438, 197.90078735351562, 205.14181518554688, 212.38282775878906, 219.6238555908203, 226.86488342285156, 234.10589599609375, 241.346923828125, 248.58795166015625, 255.82896423339844, 263.0699768066406, 270.3110046386719, 277.5520324707031, 284.7930603027344, 292.0340881347656, 299.27508544921875, 306.51611328125, 313.75714111328125, 320.9981689453125, 328.23919677734375, 335.480224609375, 342.7212219238281, 349.9622497558594, 357.2032775878906, 364.4443054199219, 371.6853332519531]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 3.0, 11.0, 10.0, 18.0, 13.0, 17.0, 24.0, 15.0, 26.0, 29.0, 16.0, 50.0, 41.0, 37.0, 45.0, 35.0, 47.0, 40.0, 35.0, 39.0, 44.0, 47.0, 46.0, 40.0, 40.0, 31.0, 27.0, 32.0, 29.0, 17.0, 17.0, 12.0, 11.0, 14.0, 8.0, 13.0, 8.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-72.28639221191406, -70.28898620605469, -68.29158020019531, -66.29417419433594, -64.29676055908203, -62.299354553222656, -60.30194854736328, -58.304542541503906, -56.30713653564453, -54.309730529785156, -52.312320709228516, -50.31491470336914, -48.317508697509766, -46.320098876953125, -44.32269287109375, -42.325286865234375, -40.327877044677734, -38.33047103881836, -36.33306121826172, -34.335655212402344, -32.33824920654297, -30.34084129333496, -28.343433380126953, -26.346027374267578, -24.34861946105957, -22.351211547851562, -20.353805541992188, -18.35639762878418, -16.358989715576172, -14.361583709716797, -12.364175796508789, -10.366768836975098, -8.36935806274414, -6.371951103210449, -4.3745436668396, -2.37713623046875, -0.3797292709350586, 1.6176776885986328, 3.6150856018066406, 5.612492561340332, 7.609899520874023, 9.607306480407715, 11.604713439941406, 13.602121353149414, 15.599528312683105, 17.596935272216797, 19.594343185424805, 21.591751098632812, 23.589157104492188, 25.586565017700195, 27.58397102355957, 29.581378936767578, 31.578784942626953, 33.576194763183594, 35.57360076904297, 37.571006774902344, 39.56841278076172, 41.565818786621094, 43.563228607177734, 45.56063461303711, 47.558040618896484, 49.555450439453125, 51.5528564453125, 53.550262451171875, 55.547672271728516]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 9.0, 2.0, 11.0, 8.0, 9.0, 12.0, 19.0, 12.0, 19.0, 20.0, 23.0, 24.0, 24.0, 32.0, 29.0, 48.0, 42.0, 41.0, 45.0, 47.0, 47.0, 38.0, 35.0, 52.0, 36.0, 37.0, 39.0, 30.0, 32.0, 21.0, 28.0, 19.0, 22.0, 12.0, 16.0, 8.0, 13.0, 11.0, 2.0, 3.0, 8.0, 6.0, 4.0, 7.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.841796875, -3.703338623046875, -3.56488037109375, -3.426422119140625, -3.2879638671875, -3.149505615234375, -3.01104736328125, -2.872589111328125, -2.734130859375, -2.595672607421875, -2.45721435546875, -2.318756103515625, -2.1802978515625, -2.041839599609375, -1.90338134765625, -1.764923095703125, -1.62646484375, -1.488006591796875, -1.34954833984375, -1.211090087890625, -1.0726318359375, -0.934173583984375, -0.79571533203125, -0.657257080078125, -0.518798828125, -0.380340576171875, -0.24188232421875, -0.103424072265625, 0.0350341796875, 0.173492431640625, 0.31195068359375, 0.450408935546875, 0.5888671875, 0.727325439453125, 0.86578369140625, 1.004241943359375, 1.1427001953125, 1.281158447265625, 1.41961669921875, 1.558074951171875, 1.696533203125, 1.834991455078125, 1.97344970703125, 2.111907958984375, 2.2503662109375, 2.388824462890625, 2.52728271484375, 2.665740966796875, 2.80419921875, 2.942657470703125, 3.08111572265625, 3.219573974609375, 3.3580322265625, 3.496490478515625, 3.63494873046875, 3.773406982421875, 3.911865234375, 4.050323486328125, 4.18878173828125, 4.327239990234375, 4.4656982421875, 4.604156494140625, 4.74261474609375, 4.881072998046875, 5.01953125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 6.0, 4.0, 8.0, 9.0, 12.0, 30.0, 31.0, 35.0, 68.0, 70.0, 116.0, 192.0, 250.0, 378.0, 594.0, 799.0, 1284.0, 2009.0, 3024.0, 5229.0, 9143.0, 16587.0, 32516.0, 65838.0, 136480.0, 260354.0, 251377.0, 129554.0, 63126.0, 31180.0, 15944.0, 8584.0, 5037.0, 3104.0, 1851.0, 1256.0, 800.0, 524.0, 356.0, 256.0, 172.0, 105.0, 78.0, 56.0, 49.0, 33.0, 20.0, 8.0, 8.0, 9.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.68798828125, -0.6664657592773438, -0.6449432373046875, -0.6234207153320312, -0.601898193359375, -0.5803756713867188, -0.5588531494140625, -0.5373306274414062, -0.51580810546875, -0.49428558349609375, -0.4727630615234375, -0.45124053955078125, -0.429718017578125, -0.40819549560546875, -0.3866729736328125, -0.36515045166015625, -0.3436279296875, -0.32210540771484375, -0.3005828857421875, -0.27906036376953125, -0.257537841796875, -0.23601531982421875, -0.2144927978515625, -0.19297027587890625, -0.17144775390625, -0.14992523193359375, -0.1284027099609375, -0.10688018798828125, -0.085357666015625, -0.06383514404296875, -0.0423126220703125, -0.02079010009765625, 0.000732421875, 0.02225494384765625, 0.0437774658203125, 0.06529998779296875, 0.086822509765625, 0.10834503173828125, 0.1298675537109375, 0.15139007568359375, 0.17291259765625, 0.19443511962890625, 0.2159576416015625, 0.23748016357421875, 0.259002685546875, 0.28052520751953125, 0.3020477294921875, 0.32357025146484375, 0.3450927734375, 0.36661529541015625, 0.3881378173828125, 0.40966033935546875, 0.431182861328125, 0.45270538330078125, 0.4742279052734375, 0.49575042724609375, 0.51727294921875, 0.5387954711914062, 0.5603179931640625, 0.5818405151367188, 0.603363037109375, 0.6248855590820312, 0.6464080810546875, 0.6679306030273438, 0.689453125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 4.0, 4.0, 3.0, 10.0, 6.0, 8.0, 12.0, 20.0, 16.0, 17.0, 18.0, 25.0, 22.0, 25.0, 22.0, 31.0, 32.0, 43.0, 42.0, 42.0, 48.0, 37.0, 1063.0, 44.0, 36.0, 44.0, 35.0, 29.0, 31.0, 37.0, 30.0, 32.0, 27.0, 22.0, 26.0, 17.0, 8.0, 6.0, 13.0, 3.0, 6.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.681640625, -2.593505859375, -2.50537109375, -2.417236328125, -2.3291015625, -2.240966796875, -2.15283203125, -2.064697265625, -1.9765625, -1.888427734375, -1.80029296875, -1.712158203125, -1.6240234375, -1.535888671875, -1.44775390625, -1.359619140625, -1.271484375, -1.183349609375, -1.09521484375, -1.007080078125, -0.9189453125, -0.830810546875, -0.74267578125, -0.654541015625, -0.56640625, -0.478271484375, -0.39013671875, -0.302001953125, -0.2138671875, -0.125732421875, -0.03759765625, 0.050537109375, 0.138671875, 0.226806640625, 0.31494140625, 0.403076171875, 0.4912109375, 0.579345703125, 0.66748046875, 0.755615234375, 0.84375, 0.931884765625, 1.02001953125, 1.108154296875, 1.1962890625, 1.284423828125, 1.37255859375, 1.460693359375, 1.548828125, 1.636962890625, 1.72509765625, 1.813232421875, 1.9013671875, 1.989501953125, 2.07763671875, 2.165771484375, 2.25390625, 2.342041015625, 2.43017578125, 2.518310546875, 2.6064453125, 2.694580078125, 2.78271484375, 2.870849609375, 2.958984375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 8.0, 2.0, 7.0, 10.0, 11.0, 14.0, 35.0, 48.0, 65.0, 89.0, 116.0, 197.0, 350.0, 456.0, 645.0, 922.0, 1528.0, 2295.0, 3670.0, 5718.0, 8933.0, 13705.0, 21650.0, 34749.0, 56974.0, 96793.0, 167428.0, 1253053.0, 172313.0, 99390.0, 58106.0, 35678.0, 22527.0, 14081.0, 8906.0, 5788.0, 3751.0, 2459.0, 1570.0, 1060.0, 627.0, 476.0, 316.0, 189.0, 130.0, 97.0, 70.0, 52.0, 26.0, 20.0, 6.0, 15.0, 7.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.287841796875, -0.278411865234375, -0.26898193359375, -0.259552001953125, -0.2501220703125, -0.240692138671875, -0.23126220703125, -0.221832275390625, -0.21240234375, -0.202972412109375, -0.19354248046875, -0.184112548828125, -0.1746826171875, -0.165252685546875, -0.15582275390625, -0.146392822265625, -0.136962890625, -0.127532958984375, -0.11810302734375, -0.108673095703125, -0.0992431640625, -0.089813232421875, -0.08038330078125, -0.070953369140625, -0.0615234375, -0.052093505859375, -0.04266357421875, -0.033233642578125, -0.0238037109375, -0.014373779296875, -0.00494384765625, 0.004486083984375, 0.013916015625, 0.023345947265625, 0.03277587890625, 0.042205810546875, 0.0516357421875, 0.061065673828125, 0.07049560546875, 0.079925537109375, 0.08935546875, 0.098785400390625, 0.10821533203125, 0.117645263671875, 0.1270751953125, 0.136505126953125, 0.14593505859375, 0.155364990234375, 0.164794921875, 0.174224853515625, 0.18365478515625, 0.193084716796875, 0.2025146484375, 0.211944580078125, 0.22137451171875, 0.230804443359375, 0.240234375, 0.249664306640625, 0.25909423828125, 0.268524169921875, 0.2779541015625, 0.287384033203125, 0.29681396484375, 0.306243896484375, 0.315673828125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 7.0, 4.0, 3.0, 9.0, 11.0, 16.0, 30.0, 23.0, 28.0, 43.0, 52.0, 42.0, 95.0, 150.0, 125.0, 68.0, 48.0, 41.0, 27.0, 42.0, 22.0, 21.0, 16.0, 14.0, 14.0, 6.0, 5.0, 7.0, 4.0, 2.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0237884521484375, -0.0230405330657959, -0.022292613983154297, -0.021544694900512695, -0.020796775817871094, -0.020048856735229492, -0.01930093765258789, -0.01855301856994629, -0.017805099487304688, -0.017057180404663086, -0.016309261322021484, -0.015561342239379883, -0.014813423156738281, -0.01406550407409668, -0.013317584991455078, -0.012569665908813477, -0.011821746826171875, -0.011073827743530273, -0.010325908660888672, -0.00957798957824707, -0.008830070495605469, -0.008082151412963867, -0.007334232330322266, -0.006586313247680664, -0.0058383941650390625, -0.005090475082397461, -0.004342555999755859, -0.003594636917114258, -0.0028467178344726562, -0.0020987987518310547, -0.0013508796691894531, -0.0006029605865478516, 0.00014495849609375, 0.0008928775787353516, 0.0016407966613769531, 0.0023887157440185547, 0.0031366348266601562, 0.003884553909301758, 0.004632472991943359, 0.005380392074584961, 0.0061283111572265625, 0.006876230239868164, 0.007624149322509766, 0.008372068405151367, 0.009119987487792969, 0.00986790657043457, 0.010615825653076172, 0.011363744735717773, 0.012111663818359375, 0.012859582901000977, 0.013607501983642578, 0.01435542106628418, 0.015103340148925781, 0.015851259231567383, 0.016599178314208984, 0.017347097396850586, 0.018095016479492188, 0.01884293556213379, 0.01959085464477539, 0.020338773727416992, 0.021086692810058594, 0.021834611892700195, 0.022582530975341797, 0.0233304500579834, 0.024078369140625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 4.0, 4.0, 7.0, 3.0, 7.0, 21.0, 26.0, 23.0, 28.0, 34.0, 55.0, 75.0, 119.0, 180.0, 805.0, 18203.0, 1018891.0, 8977.0, 538.0, 166.0, 92.0, 74.0, 71.0, 41.0, 30.0, 15.0, 16.0, 12.0, 7.0, 3.0, 8.0, 0.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51123046875, -0.49442291259765625, -0.4776153564453125, -0.46080780029296875, -0.444000244140625, -0.42719268798828125, -0.4103851318359375, -0.39357757568359375, -0.37677001953125, -0.35996246337890625, -0.3431549072265625, -0.32634735107421875, -0.309539794921875, -0.29273223876953125, -0.2759246826171875, -0.25911712646484375, -0.2423095703125, -0.22550201416015625, -0.2086944580078125, -0.19188690185546875, -0.175079345703125, -0.15827178955078125, -0.1414642333984375, -0.12465667724609375, -0.10784912109375, -0.09104156494140625, -0.0742340087890625, -0.05742645263671875, -0.040618896484375, -0.02381134033203125, -0.0070037841796875, 0.00980377197265625, 0.026611328125, 0.04341888427734375, 0.0602264404296875, 0.07703399658203125, 0.093841552734375, 0.11064910888671875, 0.1274566650390625, 0.14426422119140625, 0.16107177734375, 0.17787933349609375, 0.1946868896484375, 0.21149444580078125, 0.228302001953125, 0.24510955810546875, 0.2619171142578125, 0.27872467041015625, 0.2955322265625, 0.31233978271484375, 0.3291473388671875, 0.34595489501953125, 0.362762451171875, 0.37957000732421875, 0.3963775634765625, 0.41318511962890625, 0.42999267578125, 0.44680023193359375, 0.4636077880859375, 0.48041534423828125, 0.497222900390625, 0.5140304565429688, 0.5308380126953125, 0.5476455688476562, 0.564453125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 22.0, 109.0, 556.0, 239.0, 58.0, 16.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04319857805967331, -0.03673320636153221, -0.030267834663391113, -0.023802461102604866, -0.017337089404463768, -0.01087171584367752, -0.004406344145536423, 0.0020590275526046753, 0.008524399250745773, 0.014989770948886871, 0.02145514264702797, 0.027920516207814217, 0.034385889768600464, 0.04085126146674156, 0.04731663316488266, 0.05378200486302376, 0.060247376561164856, 0.06671275198459625, 0.07317811995744705, 0.07964349538087845, 0.08610886335372925, 0.09257423877716064, 0.09903961420059204, 0.10550498217344284, 0.11197035014629364, 0.11843572556972504, 0.12490109354257584, 0.13136646151542664, 0.13783183693885803, 0.14429721236228943, 0.15076258778572083, 0.15722796320915222, 0.16369332373142242, 0.17015869915485382, 0.17662407457828522, 0.18308943510055542, 0.18955481052398682, 0.1960201859474182, 0.2024855613708496, 0.208950936794281, 0.2154162973165512, 0.2218816727399826, 0.228347048163414, 0.2348124086856842, 0.2412777841091156, 0.247743159532547, 0.2542085349559784, 0.2606739103794098, 0.2671392858028412, 0.2736046612262726, 0.280070036649704, 0.2865354120731354, 0.2930007874965668, 0.2994661331176758, 0.3059315085411072, 0.3123968839645386, 0.31886225938796997, 0.32532763481140137, 0.33179301023483276, 0.33825838565826416, 0.34472376108169556, 0.35118913650512695, 0.35765448212623596, 0.36411985754966736, 0.37058523297309875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 7.0, 3.0, 8.0, 5.0, 8.0, 10.0, 12.0, 11.0, 16.0, 18.0, 17.0, 23.0, 29.0, 33.0, 23.0, 23.0, 35.0, 37.0, 45.0, 33.0, 38.0, 40.0, 36.0, 42.0, 34.0, 40.0, 35.0, 38.0, 27.0, 28.0, 22.0, 34.0, 36.0, 29.0, 22.0, 20.0, 16.0, 18.0, 13.0, 9.0, 6.0, 11.0, 4.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.041758060455322266, -0.04040367901325226, -0.03904929757118225, -0.03769491985440254, -0.036340538412332535, -0.03498615697026253, -0.03363177925348282, -0.03227739781141281, -0.030923016369342804, -0.029568634927272797, -0.02821425534784794, -0.02685987576842308, -0.025505494326353073, -0.024151112884283066, -0.022796733304858208, -0.02144235372543335, -0.020087972283363342, -0.018733590841293335, -0.017379211261868477, -0.01602483168244362, -0.014670450240373611, -0.013316069729626179, -0.011961689218878746, -0.010607308708131313, -0.00925292819738388, -0.007898547686636448, -0.006544167175889015, -0.0051897866651415825, -0.0038354061543941498, -0.002481025643646717, -0.0011266451328992844, 0.00022773537784814835, 0.001582115888595581, 0.0029364963993430138, 0.0042908769100904465, 0.005645257420837879, 0.006999637931585312, 0.008354018442332745, 0.009708398953080177, 0.01106277946382761, 0.012417159974575043, 0.013771540485322475, 0.015125920996069908, 0.016480300575494766, 0.017834682017564774, 0.01918906345963478, 0.02054344303905964, 0.021897822618484497, 0.023252204060554504, 0.02460658550262451, 0.02596096508204937, 0.027315344661474228, 0.028669726103544235, 0.030024107545614243, 0.03137848526239395, 0.03273286670446396, 0.034087248146533966, 0.03544162958860397, 0.03679601103067398, 0.03815038874745369, 0.0395047701895237, 0.040859151631593704, 0.04221352934837341, 0.04356791079044342, 0.04492229223251343]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 9.0, 2.0, 11.0, 8.0, 9.0, 12.0, 19.0, 12.0, 19.0, 20.0, 24.0, 23.0, 24.0, 32.0, 29.0, 48.0, 41.0, 41.0, 46.0, 47.0, 47.0, 38.0, 35.0, 52.0, 36.0, 37.0, 39.0, 30.0, 32.0, 21.0, 28.0, 19.0, 22.0, 12.0, 16.0, 8.0, 13.0, 11.0, 2.0, 3.0, 8.0, 6.0, 4.0, 7.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.841796875, -3.703338623046875, -3.56488037109375, -3.426422119140625, -3.2879638671875, -3.149505615234375, -3.01104736328125, -2.872589111328125, -2.734130859375, -2.595672607421875, -2.45721435546875, -2.318756103515625, -2.1802978515625, -2.041839599609375, -1.90338134765625, -1.764923095703125, -1.62646484375, -1.488006591796875, -1.34954833984375, -1.211090087890625, -1.0726318359375, -0.934173583984375, -0.79571533203125, -0.657257080078125, -0.518798828125, -0.380340576171875, -0.24188232421875, -0.103424072265625, 0.0350341796875, 0.173492431640625, 0.31195068359375, 0.450408935546875, 0.5888671875, 0.727325439453125, 0.86578369140625, 1.004241943359375, 1.1427001953125, 1.281158447265625, 1.41961669921875, 1.558074951171875, 1.696533203125, 1.834991455078125, 1.97344970703125, 2.111907958984375, 2.2503662109375, 2.388824462890625, 2.52728271484375, 2.665740966796875, 2.80419921875, 2.942657470703125, 3.08111572265625, 3.219573974609375, 3.3580322265625, 3.496490478515625, 3.63494873046875, 3.773406982421875, 3.911865234375, 4.050323486328125, 4.18878173828125, 4.327239990234375, 4.4656982421875, 4.604156494140625, 4.74261474609375, 4.881072998046875, 5.01953125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 5.0, 10.0, 12.0, 12.0, 22.0, 18.0, 33.0, 77.0, 77.0, 99.0, 175.0, 220.0, 283.0, 428.0, 581.0, 905.0, 1397.0, 2037.0, 3464.0, 5797.0, 15716.0, 705206.0, 286365.0, 11304.0, 5283.0, 3187.0, 1912.0, 1274.0, 796.0, 541.0, 382.0, 249.0, 182.0, 146.0, 93.0, 67.0, 44.0, 46.0, 27.0, 20.0, 16.0, 11.0, 8.0, 9.0, 5.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.921875, -18.3466796875, -17.771484375, -17.1962890625, -16.62109375, -16.0458984375, -15.470703125, -14.8955078125, -14.3203125, -13.7451171875, -13.169921875, -12.5947265625, -12.01953125, -11.4443359375, -10.869140625, -10.2939453125, -9.71875, -9.1435546875, -8.568359375, -7.9931640625, -7.41796875, -6.8427734375, -6.267578125, -5.6923828125, -5.1171875, -4.5419921875, -3.966796875, -3.3916015625, -2.81640625, -2.2412109375, -1.666015625, -1.0908203125, -0.515625, 0.0595703125, 0.634765625, 1.2099609375, 1.78515625, 2.3603515625, 2.935546875, 3.5107421875, 4.0859375, 4.6611328125, 5.236328125, 5.8115234375, 6.38671875, 6.9619140625, 7.537109375, 8.1123046875, 8.6875, 9.2626953125, 9.837890625, 10.4130859375, 10.98828125, 11.5634765625, 12.138671875, 12.7138671875, 13.2890625, 13.8642578125, 14.439453125, 15.0146484375, 15.58984375, 16.1650390625, 16.740234375, 17.3154296875, 17.890625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 9.0, 15.0, 13.0, 10.0, 24.0, 15.0, 20.0, 31.0, 31.0, 29.0, 43.0, 45.0, 50.0, 60.0, 80.0, 147.0, 1782.0, 156.0, 60.0, 59.0, 53.0, 40.0, 34.0, 38.0, 26.0, 28.0, 18.0, 32.0, 10.0, 9.0, 13.0, 13.0, 7.0, 6.0, 6.0, 7.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5234375, -13.9757080078125, -13.427978515625, -12.8802490234375, -12.33251953125, -11.7847900390625, -11.237060546875, -10.6893310546875, -10.1416015625, -9.5938720703125, -9.046142578125, -8.4984130859375, -7.95068359375, -7.4029541015625, -6.855224609375, -6.3074951171875, -5.759765625, -5.2120361328125, -4.664306640625, -4.1165771484375, -3.56884765625, -3.0211181640625, -2.473388671875, -1.9256591796875, -1.3779296875, -0.8302001953125, -0.282470703125, 0.2652587890625, 0.81298828125, 1.3607177734375, 1.908447265625, 2.4561767578125, 3.00390625, 3.5516357421875, 4.099365234375, 4.6470947265625, 5.19482421875, 5.7425537109375, 6.290283203125, 6.8380126953125, 7.3857421875, 7.9334716796875, 8.481201171875, 9.0289306640625, 9.57666015625, 10.1243896484375, 10.672119140625, 11.2198486328125, 11.767578125, 12.3153076171875, 12.863037109375, 13.4107666015625, 13.95849609375, 14.5062255859375, 15.053955078125, 15.6016845703125, 16.1494140625, 16.6971435546875, 17.244873046875, 17.7926025390625, 18.34033203125, 18.8880615234375, 19.435791015625, 19.9835205078125, 20.53125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 8.0, 7.0, 4.0, 6.0, 10.0, 10.0, 9.0, 15.0, 12.0, 26.0, 27.0, 35.0, 71.0, 106.0, 227.0, 430.0, 926.0, 1949.0, 4255.0, 11340.0, 60176.0, 2969445.0, 75349.0, 12444.0, 4788.0, 2010.0, 1027.0, 445.0, 214.0, 108.0, 65.0, 39.0, 20.0, 23.0, 15.0, 15.0, 10.0, 14.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0], "bins": [-31.34375, -30.48583984375, -29.6279296875, -28.77001953125, -27.912109375, -27.05419921875, -26.1962890625, -25.33837890625, -24.48046875, -23.62255859375, -22.7646484375, -21.90673828125, -21.048828125, -20.19091796875, -19.3330078125, -18.47509765625, -17.6171875, -16.75927734375, -15.9013671875, -15.04345703125, -14.185546875, -13.32763671875, -12.4697265625, -11.61181640625, -10.75390625, -9.89599609375, -9.0380859375, -8.18017578125, -7.322265625, -6.46435546875, -5.6064453125, -4.74853515625, -3.890625, -3.03271484375, -2.1748046875, -1.31689453125, -0.458984375, 0.39892578125, 1.2568359375, 2.11474609375, 2.97265625, 3.83056640625, 4.6884765625, 5.54638671875, 6.404296875, 7.26220703125, 8.1201171875, 8.97802734375, 9.8359375, 10.69384765625, 11.5517578125, 12.40966796875, 13.267578125, 14.12548828125, 14.9833984375, 15.84130859375, 16.69921875, 17.55712890625, 18.4150390625, 19.27294921875, 20.130859375, 20.98876953125, 21.8466796875, 22.70458984375, 23.5625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 16.0, 68.0, 209.0, 394.0, 247.0, 64.0, 12.0, 7.0], "bins": [-183.8159942626953, -180.72845458984375, -177.6409149169922, -174.55337524414062, -171.46583557128906, -168.3782958984375, -165.29075622558594, -162.20321655273438, -159.1156768798828, -156.02813720703125, -152.9405975341797, -149.85305786132812, -146.76551818847656, -143.677978515625, -140.59043884277344, -137.50289916992188, -134.41537475585938, -131.3278350830078, -128.24029541015625, -125.15275573730469, -122.06521606445312, -118.97767639160156, -115.89013671875, -112.80260467529297, -109.71505737304688, -106.62751770019531, -103.53997802734375, -100.45243835449219, -97.36489868164062, -94.27735900878906, -91.1898193359375, -88.10228729248047, -85.01473999023438, -81.92720031738281, -78.83966064453125, -75.75212097167969, -72.66458129882812, -69.57704162597656, -66.489501953125, -63.40196990966797, -60.314430236816406, -57.226890563964844, -54.13935089111328, -51.05181121826172, -47.96427536010742, -44.87673568725586, -41.7891960144043, -38.70166015625, -35.61412048339844, -32.526580810546875, -29.439043045043945, -26.351503372192383, -23.263965606689453, -20.17642593383789, -17.088886260986328, -14.001348495483398, -10.913806915283203, -7.826268196105957, -4.738729000091553, -1.6511898040771484, 1.4363489151000977, 4.523887634277344, 7.611427307128906, 10.698965072631836, 13.786504745483398]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 4.0, 13.0, 9.0, 10.0, 12.0, 17.0, 21.0, 12.0, 25.0, 18.0, 22.0, 20.0, 35.0, 33.0, 30.0, 37.0, 39.0, 49.0, 42.0, 43.0, 37.0, 42.0, 36.0, 48.0, 33.0, 31.0, 28.0, 28.0, 24.0, 35.0, 26.0, 19.0, 19.0, 14.0, 15.0, 9.0, 12.0, 8.0, 13.0, 7.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-46.28564453125, -44.646331787109375, -43.00701904296875, -41.367706298828125, -39.7283935546875, -38.089080810546875, -36.449771881103516, -34.81045913696289, -33.171146392822266, -31.53183364868164, -29.892520904541016, -28.253210067749023, -26.6138973236084, -24.974584579467773, -23.33527374267578, -21.695960998535156, -20.05664825439453, -18.417335510253906, -16.77802276611328, -15.138711929321289, -13.499399185180664, -11.860086441040039, -10.22077465057373, -8.581462860107422, -6.942150115966797, -5.30283784866333, -3.6635255813598633, -2.0242133140563965, -0.3849010467529297, 1.2544116973876953, 2.893723487854004, 4.5330352783203125, 6.1723480224609375, 7.811660289764404, 9.450972557067871, 11.09028434753418, 12.729597091674805, 14.36890983581543, 16.008220672607422, 17.647533416748047, 19.286846160888672, 20.926158905029297, 22.565471649169922, 24.204782485961914, 25.84409523010254, 27.483407974243164, 29.122718811035156, 30.76203155517578, 32.401344299316406, 34.04065704345703, 35.679969787597656, 37.31928253173828, 38.958595275878906, 40.59790802001953, 42.23721694946289, 43.876529693603516, 45.51584243774414, 47.155155181884766, 48.79446792602539, 50.433780670166016, 52.073089599609375, 53.71240234375, 55.351715087890625, 56.99102783203125, 58.630340576171875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 3.0, 6.0, 8.0, 15.0, 3.0, 14.0, 15.0, 16.0, 27.0, 12.0, 17.0, 32.0, 32.0, 24.0, 35.0, 35.0, 45.0, 42.0, 41.0, 47.0, 47.0, 39.0, 46.0, 34.0, 36.0, 48.0, 33.0, 25.0, 26.0, 29.0, 27.0, 21.0, 19.0, 15.0, 13.0, 10.0, 13.0, 13.0, 4.0, 5.0, 5.0, 8.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.75, -3.6099853515625, -3.469970703125, -3.3299560546875, -3.18994140625, -3.0499267578125, -2.909912109375, -2.7698974609375, -2.6298828125, -2.4898681640625, -2.349853515625, -2.2098388671875, -2.06982421875, -1.9298095703125, -1.789794921875, -1.6497802734375, -1.509765625, -1.3697509765625, -1.229736328125, -1.0897216796875, -0.94970703125, -0.8096923828125, -0.669677734375, -0.5296630859375, -0.3896484375, -0.2496337890625, -0.109619140625, 0.0303955078125, 0.17041015625, 0.3104248046875, 0.450439453125, 0.5904541015625, 0.73046875, 0.8704833984375, 1.010498046875, 1.1505126953125, 1.29052734375, 1.4305419921875, 1.570556640625, 1.7105712890625, 1.8505859375, 1.9906005859375, 2.130615234375, 2.2706298828125, 2.41064453125, 2.5506591796875, 2.690673828125, 2.8306884765625, 2.970703125, 3.1107177734375, 3.250732421875, 3.3907470703125, 3.53076171875, 3.6707763671875, 3.810791015625, 3.9508056640625, 4.0908203125, 4.2308349609375, 4.370849609375, 4.5108642578125, 4.65087890625, 4.7908935546875, 4.930908203125, 5.0709228515625, 5.2109375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 4.0, 4.0, 7.0, 5.0, 2.0, 18.0, 19.0, 31.0, 46.0, 67.0, 105.0, 173.0, 345.0, 519.0, 939.0, 1637.0, 3260.0, 6545.0, 15112.0, 41213.0, 194738.0, 3323244.0, 507179.0, 62338.0, 20150.0, 8180.0, 3904.0, 1917.0, 1078.0, 594.0, 308.0, 201.0, 129.0, 84.0, 48.0, 29.0, 28.0, 24.0, 19.0, 11.0, 8.0, 10.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-24.765625, -23.9833984375, -23.201171875, -22.4189453125, -21.63671875, -20.8544921875, -20.072265625, -19.2900390625, -18.5078125, -17.7255859375, -16.943359375, -16.1611328125, -15.37890625, -14.5966796875, -13.814453125, -13.0322265625, -12.25, -11.4677734375, -10.685546875, -9.9033203125, -9.12109375, -8.3388671875, -7.556640625, -6.7744140625, -5.9921875, -5.2099609375, -4.427734375, -3.6455078125, -2.86328125, -2.0810546875, -1.298828125, -0.5166015625, 0.265625, 1.0478515625, 1.830078125, 2.6123046875, 3.39453125, 4.1767578125, 4.958984375, 5.7412109375, 6.5234375, 7.3056640625, 8.087890625, 8.8701171875, 9.65234375, 10.4345703125, 11.216796875, 11.9990234375, 12.78125, 13.5634765625, 14.345703125, 15.1279296875, 15.91015625, 16.6923828125, 17.474609375, 18.2568359375, 19.0390625, 19.8212890625, 20.603515625, 21.3857421875, 22.16796875, 22.9501953125, 23.732421875, 24.5146484375, 25.296875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 3.0, 5.0, 2.0, 6.0, 17.0, 22.0, 13.0, 30.0, 35.0, 42.0, 65.0, 59.0, 114.0, 165.0, 291.0, 506.0, 734.0, 691.0, 393.0, 272.0, 167.0, 104.0, 81.0, 79.0, 44.0, 31.0, 29.0, 13.0, 20.0, 13.0, 11.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.953125, -20.35302734375, -19.7529296875, -19.15283203125, -18.552734375, -17.95263671875, -17.3525390625, -16.75244140625, -16.15234375, -15.55224609375, -14.9521484375, -14.35205078125, -13.751953125, -13.15185546875, -12.5517578125, -11.95166015625, -11.3515625, -10.75146484375, -10.1513671875, -9.55126953125, -8.951171875, -8.35107421875, -7.7509765625, -7.15087890625, -6.55078125, -5.95068359375, -5.3505859375, -4.75048828125, -4.150390625, -3.55029296875, -2.9501953125, -2.35009765625, -1.75, -1.14990234375, -0.5498046875, 0.05029296875, 0.650390625, 1.25048828125, 1.8505859375, 2.45068359375, 3.05078125, 3.65087890625, 4.2509765625, 4.85107421875, 5.451171875, 6.05126953125, 6.6513671875, 7.25146484375, 7.8515625, 8.45166015625, 9.0517578125, 9.65185546875, 10.251953125, 10.85205078125, 11.4521484375, 12.05224609375, 12.65234375, 13.25244140625, 13.8525390625, 14.45263671875, 15.052734375, 15.65283203125, 16.2529296875, 16.85302734375, 17.453125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 7.0, 9.0, 16.0, 22.0, 38.0, 59.0, 85.0, 197.0, 331.0, 578.0, 1030.0, 1994.0, 3894.0, 7796.0, 17017.0, 42084.0, 128873.0, 830890.0, 2717785.0, 313031.0, 76043.0, 28278.0, 12161.0, 5726.0, 2911.0, 1501.0, 837.0, 484.0, 254.0, 145.0, 79.0, 49.0, 27.0, 23.0, 10.0, 9.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.125, -26.166015625, -25.20703125, -24.248046875, -23.2890625, -22.330078125, -21.37109375, -20.412109375, -19.453125, -18.494140625, -17.53515625, -16.576171875, -15.6171875, -14.658203125, -13.69921875, -12.740234375, -11.78125, -10.822265625, -9.86328125, -8.904296875, -7.9453125, -6.986328125, -6.02734375, -5.068359375, -4.109375, -3.150390625, -2.19140625, -1.232421875, -0.2734375, 0.685546875, 1.64453125, 2.603515625, 3.5625, 4.521484375, 5.48046875, 6.439453125, 7.3984375, 8.357421875, 9.31640625, 10.275390625, 11.234375, 12.193359375, 13.15234375, 14.111328125, 15.0703125, 16.029296875, 16.98828125, 17.947265625, 18.90625, 19.865234375, 20.82421875, 21.783203125, 22.7421875, 23.701171875, 24.66015625, 25.619140625, 26.578125, 27.537109375, 28.49609375, 29.455078125, 30.4140625, 31.373046875, 32.33203125, 33.291015625, 34.25]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 11.0, 20.0, 43.0, 43.0, 85.0, 143.0, 166.0, 165.0, 106.0, 90.0, 60.0, 30.0, 23.0, 13.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-208.4460906982422, -203.45620727539062, -198.46632385253906, -193.4764404296875, -188.48655700683594, -183.49667358398438, -178.5067901611328, -173.51690673828125, -168.52703857421875, -163.5371551513672, -158.54727172851562, -153.55738830566406, -148.5675048828125, -143.57762145996094, -138.58773803710938, -133.59786987304688, -128.60797119140625, -123.61808776855469, -118.62820434570312, -113.63832092285156, -108.6484375, -103.65855407714844, -98.6686782836914, -93.67879486083984, -88.68891143798828, -83.69902801513672, -78.70914459228516, -73.7192611694336, -68.72938537597656, -63.739498138427734, -58.74961853027344, -53.759735107421875, -48.76984405517578, -43.77996063232422, -38.790077209472656, -33.80019760131836, -28.810314178466797, -23.820430755615234, -18.830549240112305, -13.840667724609375, -8.850784301757812, -3.8609018325805664, 1.1289806365966797, 6.118863105773926, 11.108745574951172, 16.098628997802734, 21.088510513305664, 26.078392028808594, 31.068275451660156, 36.05815887451172, 41.04804229736328, 46.03792190551758, 51.02780532836914, 56.0176887512207, 61.007568359375, 65.99745178222656, 70.98733520507812, 75.97721862792969, 80.96710205078125, 85.95698547363281, 90.94686889648438, 95.93675231933594, 100.92662811279297, 105.91651153564453, 110.9063949584961]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 9.0, 10.0, 11.0, 13.0, 12.0, 16.0, 16.0, 19.0, 25.0, 21.0, 29.0, 38.0, 25.0, 33.0, 28.0, 40.0, 34.0, 40.0, 48.0, 43.0, 39.0, 25.0, 48.0, 42.0, 44.0, 40.0, 41.0, 28.0, 28.0, 24.0, 21.0, 23.0, 13.0, 16.0, 15.0, 9.0, 15.0, 6.0, 4.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-57.133670806884766, -55.37603759765625, -53.61840057373047, -51.86076354980469, -50.10313034057617, -48.345497131347656, -46.587860107421875, -44.830223083496094, -43.07258987426758, -41.31495666503906, -39.55731964111328, -37.7996826171875, -36.042049407958984, -34.28441619873047, -32.52677917480469, -30.76914405822754, -29.01150894165039, -27.253873825073242, -25.496238708496094, -23.738603591918945, -21.980968475341797, -20.22333335876465, -18.4656982421875, -16.70806312561035, -14.950428009033203, -13.192792892456055, -11.435157775878906, -9.677522659301758, -7.919887542724609, -6.162252426147461, -4.4046173095703125, -2.646982192993164, -0.8893470764160156, 0.8682880401611328, 2.6259231567382812, 4.38355827331543, 6.141193389892578, 7.898828506469727, 9.656463623046875, 11.414098739624023, 13.171733856201172, 14.92936897277832, 16.68700408935547, 18.444639205932617, 20.202274322509766, 21.959909439086914, 23.717544555664062, 25.47517967224121, 27.23281478881836, 28.990449905395508, 30.748085021972656, 32.50572204589844, 34.26335525512695, 36.02098846435547, 37.77862548828125, 39.53626251220703, 41.29389572143555, 43.05152893066406, 44.809165954589844, 46.566802978515625, 48.32443618774414, 50.082069396972656, 51.83970642089844, 53.59734344482422, 55.354976654052734]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 4.0, 5.0, 0.0, 3.0, 6.0, 9.0, 12.0, 11.0, 7.0, 17.0, 15.0, 17.0, 23.0, 24.0, 28.0, 21.0, 25.0, 26.0, 35.0, 33.0, 32.0, 34.0, 36.0, 48.0, 40.0, 39.0, 36.0, 25.0, 44.0, 33.0, 29.0, 39.0, 31.0, 27.0, 24.0, 17.0, 16.0, 25.0, 12.0, 10.0, 14.0, 14.0, 14.0, 7.0, 8.0, 6.0, 5.0, 11.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.05078125, -3.9110107421875, -3.771240234375, -3.6314697265625, -3.49169921875, -3.3519287109375, -3.212158203125, -3.0723876953125, -2.9326171875, -2.7928466796875, -2.653076171875, -2.5133056640625, -2.37353515625, -2.2337646484375, -2.093994140625, -1.9542236328125, -1.814453125, -1.6746826171875, -1.534912109375, -1.3951416015625, -1.25537109375, -1.1156005859375, -0.975830078125, -0.8360595703125, -0.6962890625, -0.5565185546875, -0.416748046875, -0.2769775390625, -0.13720703125, 0.0025634765625, 0.142333984375, 0.2821044921875, 0.421875, 0.5616455078125, 0.701416015625, 0.8411865234375, 0.98095703125, 1.1207275390625, 1.260498046875, 1.4002685546875, 1.5400390625, 1.6798095703125, 1.819580078125, 1.9593505859375, 2.09912109375, 2.2388916015625, 2.378662109375, 2.5184326171875, 2.658203125, 2.7979736328125, 2.937744140625, 3.0775146484375, 3.21728515625, 3.3570556640625, 3.496826171875, 3.6365966796875, 3.7763671875, 3.9161376953125, 4.055908203125, 4.1956787109375, 4.33544921875, 4.4752197265625, 4.614990234375, 4.7547607421875, 4.89453125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 14.0, 15.0, 22.0, 35.0, 52.0, 54.0, 107.0, 137.0, 234.0, 331.0, 553.0, 905.0, 1398.0, 2376.0, 3908.0, 6875.0, 12767.0, 24757.0, 49987.0, 108597.0, 229573.0, 293144.0, 162490.0, 74775.0, 34981.0, 17618.0, 9632.0, 5263.0, 3031.0, 1760.0, 1091.0, 749.0, 447.0, 286.0, 190.0, 123.0, 85.0, 62.0, 39.0, 28.0, 21.0, 8.0, 12.0, 7.0, 1.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.84521484375, -0.8198013305664062, -0.7943878173828125, -0.7689743041992188, -0.743560791015625, -0.7181472778320312, -0.6927337646484375, -0.6673202514648438, -0.64190673828125, -0.6164932250976562, -0.5910797119140625, -0.5656661987304688, -0.540252685546875, -0.5148391723632812, -0.4894256591796875, -0.46401214599609375, -0.4385986328125, -0.41318511962890625, -0.3877716064453125, -0.36235809326171875, -0.336944580078125, -0.31153106689453125, -0.2861175537109375, -0.26070404052734375, -0.23529052734375, -0.20987701416015625, -0.1844635009765625, -0.15904998779296875, -0.133636474609375, -0.10822296142578125, -0.0828094482421875, -0.05739593505859375, -0.031982421875, -0.00656890869140625, 0.0188446044921875, 0.04425811767578125, 0.069671630859375, 0.09508514404296875, 0.1204986572265625, 0.14591217041015625, 0.17132568359375, 0.19673919677734375, 0.2221527099609375, 0.24756622314453125, 0.272979736328125, 0.29839324951171875, 0.3238067626953125, 0.34922027587890625, 0.3746337890625, 0.40004730224609375, 0.4254608154296875, 0.45087432861328125, 0.476287841796875, 0.5017013549804688, 0.5271148681640625, 0.5525283813476562, 0.57794189453125, 0.6033554077148438, 0.6287689208984375, 0.6541824340820312, 0.679595947265625, 0.7050094604492188, 0.7304229736328125, 0.7558364868164062, 0.78125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 2.0, 1.0, 4.0, 3.0, 7.0, 9.0, 8.0, 17.0, 16.0, 18.0, 18.0, 21.0, 26.0, 28.0, 32.0, 21.0, 32.0, 35.0, 35.0, 43.0, 47.0, 31.0, 35.0, 1057.0, 50.0, 39.0, 44.0, 40.0, 27.0, 24.0, 27.0, 36.0, 31.0, 23.0, 19.0, 26.0, 20.0, 11.0, 12.0, 12.0, 5.0, 8.0, 13.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.228515625, -3.12896728515625, -3.0294189453125, -2.92987060546875, -2.830322265625, -2.73077392578125, -2.6312255859375, -2.53167724609375, -2.43212890625, -2.33258056640625, -2.2330322265625, -2.13348388671875, -2.033935546875, -1.93438720703125, -1.8348388671875, -1.73529052734375, -1.6357421875, -1.53619384765625, -1.4366455078125, -1.33709716796875, -1.237548828125, -1.13800048828125, -1.0384521484375, -0.93890380859375, -0.83935546875, -0.73980712890625, -0.6402587890625, -0.54071044921875, -0.441162109375, -0.34161376953125, -0.2420654296875, -0.14251708984375, -0.04296875, 0.05657958984375, 0.1561279296875, 0.25567626953125, 0.355224609375, 0.45477294921875, 0.5543212890625, 0.65386962890625, 0.75341796875, 0.85296630859375, 0.9525146484375, 1.05206298828125, 1.151611328125, 1.25115966796875, 1.3507080078125, 1.45025634765625, 1.5498046875, 1.64935302734375, 1.7489013671875, 1.84844970703125, 1.947998046875, 2.04754638671875, 2.1470947265625, 2.24664306640625, 2.34619140625, 2.44573974609375, 2.5452880859375, 2.64483642578125, 2.744384765625, 2.84393310546875, 2.9434814453125, 3.04302978515625, 3.142578125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 6.0, 9.0, 7.0, 10.0, 19.0, 26.0, 38.0, 50.0, 89.0, 123.0, 183.0, 285.0, 385.0, 641.0, 820.0, 1280.0, 1889.0, 2879.0, 4254.0, 6424.0, 9418.0, 14609.0, 22916.0, 35865.0, 57745.0, 95520.0, 155039.0, 1232956.0, 174828.0, 104010.0, 63610.0, 39045.0, 25054.0, 15914.0, 10328.0, 6958.0, 4477.0, 3065.0, 2037.0, 1396.0, 949.0, 629.0, 448.0, 271.0, 204.0, 150.0, 81.0, 70.0, 50.0, 27.0, 18.0, 13.0, 7.0, 10.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.279052734375, -0.2699317932128906, -0.26081085205078125, -0.2516899108886719, -0.2425689697265625, -0.23344802856445312, -0.22432708740234375, -0.21520614624023438, -0.206085205078125, -0.19696426391601562, -0.18784332275390625, -0.17872238159179688, -0.1696014404296875, -0.16048049926757812, -0.15135955810546875, -0.14223861694335938, -0.13311767578125, -0.12399673461914062, -0.11487579345703125, -0.10575485229492188, -0.0966339111328125, -0.08751296997070312, -0.07839202880859375, -0.06927108764648438, -0.060150146484375, -0.051029205322265625, -0.04190826416015625, -0.032787322998046875, -0.0236663818359375, -0.014545440673828125, -0.00542449951171875, 0.003696441650390625, 0.0128173828125, 0.021938323974609375, 0.03105926513671875, 0.040180206298828125, 0.0493011474609375, 0.058422088623046875, 0.06754302978515625, 0.07666397094726562, 0.085784912109375, 0.09490585327148438, 0.10402679443359375, 0.11314773559570312, 0.1222686767578125, 0.13138961791992188, 0.14051055908203125, 0.14963150024414062, 0.15875244140625, 0.16787338256835938, 0.17699432373046875, 0.18611526489257812, 0.1952362060546875, 0.20435714721679688, 0.21347808837890625, 0.22259902954101562, 0.231719970703125, 0.24084091186523438, 0.24996185302734375, 0.2590827941894531, 0.2682037353515625, 0.2773246765136719, 0.28644561767578125, 0.2955665588378906, 0.3046875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 8.0, 1.0, 1.0, 8.0, 2.0, 8.0, 11.0, 13.0, 16.0, 13.0, 21.0, 33.0, 29.0, 27.0, 46.0, 38.0, 41.0, 50.0, 119.0, 90.0, 67.0, 34.0, 33.0, 45.0, 28.0, 35.0, 19.0, 22.0, 17.0, 20.0, 15.0, 13.0, 9.0, 14.0, 10.0, 10.0, 5.0, 5.0, 4.0, 4.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0244598388671875, -0.023715496063232422, -0.022971153259277344, -0.022226810455322266, -0.021482467651367188, -0.02073812484741211, -0.01999378204345703, -0.019249439239501953, -0.018505096435546875, -0.017760753631591797, -0.01701641082763672, -0.01627206802368164, -0.015527725219726562, -0.014783382415771484, -0.014039039611816406, -0.013294696807861328, -0.01255035400390625, -0.011806011199951172, -0.011061668395996094, -0.010317325592041016, -0.009572982788085938, -0.00882863998413086, -0.008084297180175781, -0.007339954376220703, -0.006595611572265625, -0.005851268768310547, -0.005106925964355469, -0.004362583160400391, -0.0036182403564453125, -0.0028738975524902344, -0.0021295547485351562, -0.0013852119445800781, -0.000640869140625, 0.00010347366333007812, 0.0008478164672851562, 0.0015921592712402344, 0.0023365020751953125, 0.0030808448791503906, 0.0038251876831054688, 0.004569530487060547, 0.005313873291015625, 0.006058216094970703, 0.006802558898925781, 0.007546901702880859, 0.008291244506835938, 0.009035587310791016, 0.009779930114746094, 0.010524272918701172, 0.01126861572265625, 0.012012958526611328, 0.012757301330566406, 0.013501644134521484, 0.014245986938476562, 0.01499032974243164, 0.01573467254638672, 0.016479015350341797, 0.017223358154296875, 0.017967700958251953, 0.01871204376220703, 0.01945638656616211, 0.020200729370117188, 0.020945072174072266, 0.021689414978027344, 0.022433757781982422, 0.0231781005859375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 8.0, 5.0, 7.0, 7.0, 7.0, 15.0, 17.0, 15.0, 11.0, 27.0, 23.0, 35.0, 55.0, 79.0, 121.0, 217.0, 609.0, 43068.0, 1001662.0, 1706.0, 315.0, 203.0, 92.0, 81.0, 50.0, 29.0, 27.0, 17.0, 9.0, 5.0, 6.0, 6.0, 6.0, 2.0, 0.0, 7.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.61376953125, -0.5941085815429688, -0.5744476318359375, -0.5547866821289062, -0.535125732421875, -0.5154647827148438, -0.4958038330078125, -0.47614288330078125, -0.45648193359375, -0.43682098388671875, -0.4171600341796875, -0.39749908447265625, -0.377838134765625, -0.35817718505859375, -0.3385162353515625, -0.31885528564453125, -0.2991943359375, -0.27953338623046875, -0.2598724365234375, -0.24021148681640625, -0.220550537109375, -0.20088958740234375, -0.1812286376953125, -0.16156768798828125, -0.14190673828125, -0.12224578857421875, -0.1025848388671875, -0.08292388916015625, -0.063262939453125, -0.04360198974609375, -0.0239410400390625, -0.00428009033203125, 0.015380859375, 0.03504180908203125, 0.0547027587890625, 0.07436370849609375, 0.094024658203125, 0.11368560791015625, 0.1333465576171875, 0.15300750732421875, 0.17266845703125, 0.19232940673828125, 0.2119903564453125, 0.23165130615234375, 0.251312255859375, 0.27097320556640625, 0.2906341552734375, 0.31029510498046875, 0.3299560546875, 0.34961700439453125, 0.3692779541015625, 0.38893890380859375, 0.408599853515625, 0.42826080322265625, 0.4479217529296875, 0.46758270263671875, 0.48724365234375, 0.5069046020507812, 0.5265655517578125, 0.5462265014648438, 0.565887451171875, 0.5855484008789062, 0.6052093505859375, 0.6248703002929688, 0.64453125]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 7.0, 28.0, 76.0, 426.0, 331.0, 92.0, 30.0, 14.0, 8.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03435846418142319, -0.027344107627868652, -0.020329751074314117, -0.013315392658114433, -0.006301036104559898, 0.0007133223116397858, 0.007727678865194321, 0.014742035418748856, 0.02175639197230339, 0.028770748525857925, 0.03578510507941246, 0.042799465358257294, 0.04981382191181183, 0.056828178465366364, 0.0638425350189209, 0.07085689157247543, 0.07787124812602997, 0.0848856046795845, 0.09189996123313904, 0.09891431778669357, 0.10592867434024811, 0.11294303834438324, 0.11995738744735718, 0.1269717514514923, 0.13398610055446625, 0.14100046455860138, 0.14801481366157532, 0.15502917766571045, 0.1620435267686844, 0.16905789077281952, 0.17607223987579346, 0.1830866038799286, 0.19010095298290253, 0.19711531698703766, 0.2041296660900116, 0.21114403009414673, 0.21815837919712067, 0.2251727432012558, 0.23218709230422974, 0.23920145630836487, 0.2462158054113388, 0.25323015451431274, 0.2602445185184479, 0.267258882522583, 0.27427324652671814, 0.2812875807285309, 0.288301944732666, 0.29531630873680115, 0.3023306727409363, 0.3093450367450714, 0.31635940074920654, 0.3233737349510193, 0.3303880989551544, 0.33740246295928955, 0.3444168269634247, 0.3514311611652374, 0.35844552516937256, 0.3654598891735077, 0.3724742531776428, 0.37948858737945557, 0.3865029513835907, 0.39351731538772583, 0.40053167939186096, 0.4075460135936737, 0.41456037759780884]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 10.0, 7.0, 6.0, 10.0, 11.0, 11.0, 10.0, 9.0, 15.0, 17.0, 13.0, 21.0, 28.0, 40.0, 35.0, 27.0, 38.0, 34.0, 40.0, 36.0, 36.0, 45.0, 43.0, 37.0, 26.0, 42.0, 26.0, 24.0, 34.0, 35.0, 31.0, 24.0, 28.0, 26.0, 22.0, 21.0, 14.0, 13.0, 15.0, 13.0, 6.0, 8.0, 4.0, 5.0, 7.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0731077790260315, -0.0709151029586792, -0.0687224268913269, -0.06652975082397461, -0.06433707475662231, -0.06214439496397972, -0.05995171517133713, -0.05775903910398483, -0.05556636303663254, -0.05337368696928024, -0.05118101090192795, -0.048988331109285355, -0.04679565504193306, -0.044602978974580765, -0.04241029918193817, -0.040217623114585876, -0.03802494704723358, -0.03583227097988129, -0.03363959491252899, -0.0314469151198864, -0.029254239052534103, -0.02706156298518181, -0.024868885055184364, -0.02267620712518692, -0.020483531057834625, -0.01829085499048233, -0.016098177060484886, -0.013905500061810017, -0.011712823063135147, -0.009520146064460278, -0.007327469065785408, -0.0051347920671105385, -0.002942115068435669, -0.0007494380697607994, 0.0014432389289140701, 0.0036359159275889397, 0.005828592926263809, 0.008021269924938679, 0.010213946923613548, 0.012406623922288418, 0.014599300920963287, 0.016791976988315582, 0.018984654918313026, 0.02117733284831047, 0.023370008915662766, 0.02556268498301506, 0.027755362913012505, 0.02994804084300995, 0.032140716910362244, 0.03433339297771454, 0.036526069045066833, 0.03871874883770943, 0.04091142490506172, 0.04310410097241402, 0.04529678076505661, 0.047489456832408905, 0.0496821328997612, 0.051874808967113495, 0.05406748503446579, 0.05626016482710838, 0.05845284089446068, 0.06064551696181297, 0.06283819675445557, 0.06503087282180786, 0.06722354888916016]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 4.0, 5.0, 0.0, 3.0, 6.0, 9.0, 12.0, 11.0, 7.0, 17.0, 15.0, 17.0, 23.0, 24.0, 27.0, 23.0, 24.0, 26.0, 35.0, 33.0, 32.0, 34.0, 36.0, 48.0, 40.0, 39.0, 35.0, 26.0, 44.0, 33.0, 29.0, 40.0, 30.0, 26.0, 25.0, 17.0, 16.0, 26.0, 11.0, 10.0, 14.0, 15.0, 13.0, 7.0, 8.0, 6.0, 5.0, 11.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.05078125, -3.9110107421875, -3.771240234375, -3.6314697265625, -3.49169921875, -3.3519287109375, -3.212158203125, -3.0723876953125, -2.9326171875, -2.7928466796875, -2.653076171875, -2.5133056640625, -2.37353515625, -2.2337646484375, -2.093994140625, -1.9542236328125, -1.814453125, -1.6746826171875, -1.534912109375, -1.3951416015625, -1.25537109375, -1.1156005859375, -0.975830078125, -0.8360595703125, -0.6962890625, -0.5565185546875, -0.416748046875, -0.2769775390625, -0.13720703125, 0.0025634765625, 0.142333984375, 0.2821044921875, 0.421875, 0.5616455078125, 0.701416015625, 0.8411865234375, 0.98095703125, 1.1207275390625, 1.260498046875, 1.4002685546875, 1.5400390625, 1.6798095703125, 1.819580078125, 1.9593505859375, 2.09912109375, 2.2388916015625, 2.378662109375, 2.5184326171875, 2.658203125, 2.7979736328125, 2.937744140625, 3.0775146484375, 3.21728515625, 3.3570556640625, 3.496826171875, 3.6365966796875, 3.7763671875, 3.9161376953125, 4.055908203125, 4.1956787109375, 4.33544921875, 4.4752197265625, 4.614990234375, 4.7547607421875, 4.89453125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 4.0, 6.0, 4.0, 2.0, 4.0, 6.0, 12.0, 13.0, 22.0, 42.0, 52.0, 76.0, 90.0, 143.0, 223.0, 367.0, 547.0, 957.0, 1596.0, 2927.0, 5560.0, 12551.0, 32508.0, 105519.0, 428770.0, 328548.0, 79910.0, 26492.0, 10486.0, 4868.0, 2463.0, 1441.0, 817.0, 495.0, 340.0, 219.0, 134.0, 99.0, 79.0, 48.0, 34.0, 22.0, 18.0, 16.0, 10.0, 4.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 3.0, 2.0], "bins": [-5.1796875, -5.03125, -4.8828125, -4.734375, -4.5859375, -4.4375, -4.2890625, -4.140625, -3.9921875, -3.84375, -3.6953125, -3.546875, -3.3984375, -3.25, -3.1015625, -2.953125, -2.8046875, -2.65625, -2.5078125, -2.359375, -2.2109375, -2.0625, -1.9140625, -1.765625, -1.6171875, -1.46875, -1.3203125, -1.171875, -1.0234375, -0.875, -0.7265625, -0.578125, -0.4296875, -0.28125, -0.1328125, 0.015625, 0.1640625, 0.3125, 0.4609375, 0.609375, 0.7578125, 0.90625, 1.0546875, 1.203125, 1.3515625, 1.5, 1.6484375, 1.796875, 1.9453125, 2.09375, 2.2421875, 2.390625, 2.5390625, 2.6875, 2.8359375, 2.984375, 3.1328125, 3.28125, 3.4296875, 3.578125, 3.7265625, 3.875, 4.0234375, 4.171875, 4.3203125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 6.0, 8.0, 8.0, 7.0, 11.0, 7.0, 16.0, 25.0, 19.0, 19.0, 20.0, 27.0, 32.0, 32.0, 39.0, 42.0, 36.0, 62.0, 127.0, 1555.0, 410.0, 92.0, 48.0, 50.0, 41.0, 41.0, 33.0, 38.0, 23.0, 33.0, 27.0, 16.0, 20.0, 16.0, 13.0, 14.0, 10.0, 13.0, 6.0, 0.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.78125, -17.224853515625, -16.66845703125, -16.112060546875, -15.5556640625, -14.999267578125, -14.44287109375, -13.886474609375, -13.330078125, -12.773681640625, -12.21728515625, -11.660888671875, -11.1044921875, -10.548095703125, -9.99169921875, -9.435302734375, -8.87890625, -8.322509765625, -7.76611328125, -7.209716796875, -6.6533203125, -6.096923828125, -5.54052734375, -4.984130859375, -4.427734375, -3.871337890625, -3.31494140625, -2.758544921875, -2.2021484375, -1.645751953125, -1.08935546875, -0.532958984375, 0.0234375, 0.579833984375, 1.13623046875, 1.692626953125, 2.2490234375, 2.805419921875, 3.36181640625, 3.918212890625, 4.474609375, 5.031005859375, 5.58740234375, 6.143798828125, 6.7001953125, 7.256591796875, 7.81298828125, 8.369384765625, 8.92578125, 9.482177734375, 10.03857421875, 10.594970703125, 11.1513671875, 11.707763671875, 12.26416015625, 12.820556640625, 13.376953125, 13.933349609375, 14.48974609375, 15.046142578125, 15.6025390625, 16.158935546875, 16.71533203125, 17.271728515625, 17.828125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 8.0, 2.0, 0.0, 7.0, 8.0, 11.0, 14.0, 14.0, 15.0, 18.0, 20.0, 30.0, 32.0, 52.0, 62.0, 106.0, 151.0, 221.0, 436.0, 1092.0, 7709.0, 993215.0, 2130679.0, 9375.0, 1259.0, 425.0, 237.0, 158.0, 100.0, 49.0, 47.0, 30.0, 25.0, 23.0, 15.0, 16.0, 12.0, 14.0, 8.0, 3.0, 4.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.015625, -27.14111328125, -26.2666015625, -25.39208984375, -24.517578125, -23.64306640625, -22.7685546875, -21.89404296875, -21.01953125, -20.14501953125, -19.2705078125, -18.39599609375, -17.521484375, -16.64697265625, -15.7724609375, -14.89794921875, -14.0234375, -13.14892578125, -12.2744140625, -11.39990234375, -10.525390625, -9.65087890625, -8.7763671875, -7.90185546875, -7.02734375, -6.15283203125, -5.2783203125, -4.40380859375, -3.529296875, -2.65478515625, -1.7802734375, -0.90576171875, -0.03125, 0.84326171875, 1.7177734375, 2.59228515625, 3.466796875, 4.34130859375, 5.2158203125, 6.09033203125, 6.96484375, 7.83935546875, 8.7138671875, 9.58837890625, 10.462890625, 11.33740234375, 12.2119140625, 13.08642578125, 13.9609375, 14.83544921875, 15.7099609375, 16.58447265625, 17.458984375, 18.33349609375, 19.2080078125, 20.08251953125, 20.95703125, 21.83154296875, 22.7060546875, 23.58056640625, 24.455078125, 25.32958984375, 26.2041015625, 27.07861328125, 27.953125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 204.0, 730.0, 79.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.94773864746094, -59.170570373535156, -54.39340591430664, -49.616241455078125, -44.839073181152344, -40.06190490722656, -35.28474044799805, -30.50757598876953, -25.73040771484375, -20.9532413482666, -16.176074981689453, -11.398908615112305, -6.621742248535156, -1.8445758819580078, 2.9325904846191406, 7.709754943847656, 12.486923217773438, 17.264089584350586, 22.041255950927734, 26.818422317504883, 31.59558868408203, 36.37275695800781, 41.14992141723633, 45.927085876464844, 50.704254150390625, 55.481422424316406, 60.25858688354492, 65.03575134277344, 69.81291961669922, 74.590087890625, 79.36724853515625, 84.14441680908203, 88.92160034179688, 93.69876861572266, 98.47593688964844, 103.25309753417969, 108.03026580810547, 112.80743408203125, 117.5845947265625, 122.36176300048828, 127.13893127441406, 131.9160919189453, 136.69326782226562, 141.47042846679688, 146.24758911132812, 151.02476501464844, 155.8019256591797, 160.5791015625, 165.35626220703125, 170.1334228515625, 174.9105987548828, 179.68775939941406, 184.46493530273438, 189.24209594726562, 194.01925659179688, 198.79641723632812, 203.57359313964844, 208.3507537841797, 213.1279296875, 217.90509033203125, 222.6822509765625, 227.4594268798828, 232.23658752441406, 237.01376342773438, 241.79092407226562]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 9.0, 7.0, 8.0, 10.0, 14.0, 11.0, 15.0, 14.0, 23.0, 25.0, 29.0, 39.0, 29.0, 42.0, 40.0, 48.0, 43.0, 40.0, 43.0, 45.0, 42.0, 70.0, 43.0, 39.0, 34.0, 40.0, 31.0, 22.0, 31.0, 22.0, 14.0, 16.0, 16.0, 14.0, 11.0, 6.0, 9.0, 6.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.020755767822266, -57.145050048828125, -55.26934051513672, -53.39363479614258, -51.51792526245117, -49.64221954345703, -47.766510009765625, -45.890804290771484, -44.015098571777344, -42.1393928527832, -40.2636833190918, -38.387977600097656, -36.51226806640625, -34.63656234741211, -32.76085662841797, -30.885147094726562, -29.009437561035156, -27.133729934692383, -25.25802230834961, -23.38231658935547, -21.506607055664062, -19.630901336669922, -17.75519371032715, -15.879486083984375, -14.003778457641602, -12.128070831298828, -10.252363204956055, -8.376656532287598, -6.500948905944824, -4.625241279602051, -2.7495346069335938, -0.8738269805908203, 1.0018844604492188, 2.877591848373413, 4.753299236297607, 6.629006385803223, 8.504714012145996, 10.38042163848877, 12.256128311157227, 14.1318359375, 16.007543563842773, 17.883251190185547, 19.75895881652832, 21.634666442871094, 23.510372161865234, 25.38608169555664, 27.26178741455078, 29.137495040893555, 31.013202667236328, 32.88890838623047, 34.764617919921875, 36.640323638916016, 38.51603317260742, 40.39173889160156, 42.26744842529297, 44.14315414428711, 46.01885986328125, 47.89456558227539, 49.7702751159668, 51.64598083496094, 53.521690368652344, 55.397396087646484, 57.273101806640625, 59.14881134033203, 61.02452087402344]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 11.0, 3.0, 10.0, 14.0, 13.0, 13.0, 16.0, 25.0, 21.0, 23.0, 30.0, 26.0, 21.0, 22.0, 40.0, 36.0, 41.0, 29.0, 45.0, 35.0, 49.0, 34.0, 36.0, 37.0, 42.0, 27.0, 38.0, 33.0, 29.0, 20.0, 20.0, 23.0, 20.0, 11.0, 13.0, 12.0, 13.0, 15.0, 12.0, 6.0, 7.0, 6.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.140625, -3.9949951171875, -3.849365234375, -3.7037353515625, -3.55810546875, -3.4124755859375, -3.266845703125, -3.1212158203125, -2.9755859375, -2.8299560546875, -2.684326171875, -2.5386962890625, -2.39306640625, -2.2474365234375, -2.101806640625, -1.9561767578125, -1.810546875, -1.6649169921875, -1.519287109375, -1.3736572265625, -1.22802734375, -1.0823974609375, -0.936767578125, -0.7911376953125, -0.6455078125, -0.4998779296875, -0.354248046875, -0.2086181640625, -0.06298828125, 0.0826416015625, 0.228271484375, 0.3739013671875, 0.51953125, 0.6651611328125, 0.810791015625, 0.9564208984375, 1.10205078125, 1.2476806640625, 1.393310546875, 1.5389404296875, 1.6845703125, 1.8302001953125, 1.975830078125, 2.1214599609375, 2.26708984375, 2.4127197265625, 2.558349609375, 2.7039794921875, 2.849609375, 2.9952392578125, 3.140869140625, 3.2864990234375, 3.43212890625, 3.5777587890625, 3.723388671875, 3.8690185546875, 4.0146484375, 4.1602783203125, 4.305908203125, 4.4515380859375, 4.59716796875, 4.7427978515625, 4.888427734375, 5.0340576171875, 5.1796875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 10.0, 23.0, 23.0, 32.0, 38.0, 57.0, 66.0, 91.0, 152.0, 242.0, 312.0, 458.0, 635.0, 972.0, 1421.0, 2167.0, 3338.0, 5403.0, 9163.0, 16504.0, 32474.0, 81077.0, 457554.0, 2830380.0, 582573.0, 89945.0, 35924.0, 17555.0, 9766.0, 5680.0, 3473.0, 2226.0, 1389.0, 951.0, 656.0, 440.0, 316.0, 222.0, 167.0, 119.0, 68.0, 46.0, 44.0, 34.0, 22.0, 20.0, 13.0, 7.0, 6.0, 6.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-15.5390625, -15.0303955078125, -14.521728515625, -14.0130615234375, -13.50439453125, -12.9957275390625, -12.487060546875, -11.9783935546875, -11.4697265625, -10.9610595703125, -10.452392578125, -9.9437255859375, -9.43505859375, -8.9263916015625, -8.417724609375, -7.9090576171875, -7.400390625, -6.8917236328125, -6.383056640625, -5.8743896484375, -5.36572265625, -4.8570556640625, -4.348388671875, -3.8397216796875, -3.3310546875, -2.8223876953125, -2.313720703125, -1.8050537109375, -1.29638671875, -0.7877197265625, -0.279052734375, 0.2296142578125, 0.73828125, 1.2469482421875, 1.755615234375, 2.2642822265625, 2.77294921875, 3.2816162109375, 3.790283203125, 4.2989501953125, 4.8076171875, 5.3162841796875, 5.824951171875, 6.3336181640625, 6.84228515625, 7.3509521484375, 7.859619140625, 8.3682861328125, 8.876953125, 9.3856201171875, 9.894287109375, 10.4029541015625, 10.91162109375, 11.4202880859375, 11.928955078125, 12.4376220703125, 12.9462890625, 13.4549560546875, 13.963623046875, 14.4722900390625, 14.98095703125, 15.4896240234375, 15.998291015625, 16.5069580078125, 17.015625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 6.0, 4.0, 5.0, 9.0, 17.0, 9.0, 19.0, 26.0, 27.0, 47.0, 50.0, 73.0, 93.0, 114.0, 194.0, 264.0, 404.0, 599.0, 610.0, 461.0, 297.0, 222.0, 144.0, 74.0, 77.0, 36.0, 46.0, 27.0, 28.0, 22.0, 24.0, 8.0, 8.0, 8.0, 8.0, 2.0, 4.0, 0.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-16.765625, -16.243896484375, -15.72216796875, -15.200439453125, -14.6787109375, -14.156982421875, -13.63525390625, -13.113525390625, -12.591796875, -12.070068359375, -11.54833984375, -11.026611328125, -10.5048828125, -9.983154296875, -9.46142578125, -8.939697265625, -8.41796875, -7.896240234375, -7.37451171875, -6.852783203125, -6.3310546875, -5.809326171875, -5.28759765625, -4.765869140625, -4.244140625, -3.722412109375, -3.20068359375, -2.678955078125, -2.1572265625, -1.635498046875, -1.11376953125, -0.592041015625, -0.0703125, 0.451416015625, 0.97314453125, 1.494873046875, 2.0166015625, 2.538330078125, 3.06005859375, 3.581787109375, 4.103515625, 4.625244140625, 5.14697265625, 5.668701171875, 6.1904296875, 6.712158203125, 7.23388671875, 7.755615234375, 8.27734375, 8.799072265625, 9.32080078125, 9.842529296875, 10.3642578125, 10.885986328125, 11.40771484375, 11.929443359375, 12.451171875, 12.972900390625, 13.49462890625, 14.016357421875, 14.5380859375, 15.059814453125, 15.58154296875, 16.103271484375, 16.625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 6.0, 2.0, 8.0, 9.0, 16.0, 26.0, 24.0, 42.0, 70.0, 85.0, 143.0, 196.0, 336.0, 595.0, 883.0, 1552.0, 2710.0, 4933.0, 9124.0, 18150.0, 37651.0, 89544.0, 312551.0, 2141917.0, 1245384.0, 199040.0, 67555.0, 29747.0, 14388.0, 7714.0, 4084.0, 2435.0, 1332.0, 743.0, 492.0, 278.0, 176.0, 134.0, 65.0, 51.0, 35.0, 20.0, 15.0, 6.0, 4.0, 11.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.203125, -23.46630859375, -22.7294921875, -21.99267578125, -21.255859375, -20.51904296875, -19.7822265625, -19.04541015625, -18.30859375, -17.57177734375, -16.8349609375, -16.09814453125, -15.361328125, -14.62451171875, -13.8876953125, -13.15087890625, -12.4140625, -11.67724609375, -10.9404296875, -10.20361328125, -9.466796875, -8.72998046875, -7.9931640625, -7.25634765625, -6.51953125, -5.78271484375, -5.0458984375, -4.30908203125, -3.572265625, -2.83544921875, -2.0986328125, -1.36181640625, -0.625, 0.11181640625, 0.8486328125, 1.58544921875, 2.322265625, 3.05908203125, 3.7958984375, 4.53271484375, 5.26953125, 6.00634765625, 6.7431640625, 7.47998046875, 8.216796875, 8.95361328125, 9.6904296875, 10.42724609375, 11.1640625, 11.90087890625, 12.6376953125, 13.37451171875, 14.111328125, 14.84814453125, 15.5849609375, 16.32177734375, 17.05859375, 17.79541015625, 18.5322265625, 19.26904296875, 20.005859375, 20.74267578125, 21.4794921875, 22.21630859375, 22.953125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 9.0, 13.0, 24.0, 32.0, 54.0, 91.0, 107.0, 123.0, 135.0, 138.0, 86.0, 71.0, 43.0, 32.0, 17.0, 11.0, 4.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.44300842285156, -163.2902374267578, -159.13746643066406, -154.9846954345703, -150.8319091796875, -146.67913818359375, -142.5263671875, -138.37359619140625, -134.2208251953125, -130.06805419921875, -125.915283203125, -121.76250457763672, -117.60973358154297, -113.45696258544922, -109.30418395996094, -105.15141296386719, -100.99864196777344, -96.84587097167969, -92.69309997558594, -88.54032135009766, -84.3875503540039, -80.23477935791016, -76.08200073242188, -71.92922973632812, -67.77645874023438, -63.623687744140625, -59.47091293334961, -55.318138122558594, -51.165367126464844, -47.012596130371094, -42.85982131958008, -38.70704650878906, -34.55426025390625, -30.401487350463867, -26.248714447021484, -22.0959415435791, -17.94316864013672, -13.790395736694336, -9.637622833251953, -5.48484992980957, -1.3320770263671875, 2.8206958770751953, 6.973468780517578, 11.126241683959961, 15.279014587402344, 19.431787490844727, 23.58456039428711, 27.737333297729492, 31.890106201171875, 36.042877197265625, 40.19565200805664, 44.348426818847656, 48.501197814941406, 52.653968811035156, 56.80674362182617, 60.95951843261719, 65.11228942871094, 69.26506042480469, 73.41783142089844, 77.57061004638672, 81.72338104248047, 85.87615203857422, 90.0289306640625, 94.18170166015625, 98.33447265625]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 7.0, 9.0, 7.0, 9.0, 11.0, 15.0, 15.0, 17.0, 17.0, 26.0, 29.0, 29.0, 29.0, 38.0, 33.0, 30.0, 27.0, 29.0, 41.0, 37.0, 35.0, 48.0, 50.0, 50.0, 29.0, 45.0, 31.0, 32.0, 32.0, 28.0, 26.0, 26.0, 13.0, 22.0, 22.0, 12.0, 8.0, 12.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-56.74903106689453, -55.08230209350586, -53.41557312011719, -51.748844146728516, -50.082115173339844, -48.41539001464844, -46.7486572265625, -45.081932067871094, -43.41520309448242, -41.74847412109375, -40.08174514770508, -38.415016174316406, -36.748287200927734, -35.08155822753906, -33.414833068847656, -31.748104095458984, -30.08137321472168, -28.414644241333008, -26.747915267944336, -25.081188201904297, -23.414459228515625, -21.747730255126953, -20.08100128173828, -18.41427230834961, -16.747543334960938, -15.080814361572266, -13.41408634185791, -11.747357368469238, -10.080629348754883, -8.413900375366211, -6.747171401977539, -5.080443382263184, -3.413715362548828, -1.746986746788025, -0.08025813102722168, 1.586470603942871, 3.2531991004943848, 4.919927597045898, 6.58665657043457, 8.253384590148926, 9.920113563537598, 11.58684253692627, 13.253570556640625, 14.920299530029297, 16.58702850341797, 18.25375747680664, 19.920486450195312, 21.58721351623535, 23.253942489624023, 24.920671463012695, 26.587400436401367, 28.254127502441406, 29.920856475830078, 31.58758544921875, 33.25431442260742, 34.921043395996094, 36.587772369384766, 38.25450134277344, 39.92123031616211, 41.58795928955078, 43.25468826293945, 44.921417236328125, 46.58814239501953, 48.2548713684082, 49.921600341796875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 5.0, 9.0, 5.0, 8.0, 14.0, 13.0, 17.0, 18.0, 19.0, 29.0, 19.0, 27.0, 31.0, 31.0, 31.0, 24.0, 32.0, 47.0, 40.0, 35.0, 40.0, 40.0, 40.0, 37.0, 26.0, 38.0, 26.0, 27.0, 31.0, 30.0, 28.0, 29.0, 20.0, 13.0, 18.0, 19.0, 10.0, 11.0, 12.0, 9.0, 12.0, 8.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 3.0, 4.0], "bins": [-5.515625, -5.358154296875, -5.20068359375, -5.043212890625, -4.8857421875, -4.728271484375, -4.57080078125, -4.413330078125, -4.255859375, -4.098388671875, -3.94091796875, -3.783447265625, -3.6259765625, -3.468505859375, -3.31103515625, -3.153564453125, -2.99609375, -2.838623046875, -2.68115234375, -2.523681640625, -2.3662109375, -2.208740234375, -2.05126953125, -1.893798828125, -1.736328125, -1.578857421875, -1.42138671875, -1.263916015625, -1.1064453125, -0.948974609375, -0.79150390625, -0.634033203125, -0.4765625, -0.319091796875, -0.16162109375, -0.004150390625, 0.1533203125, 0.310791015625, 0.46826171875, 0.625732421875, 0.783203125, 0.940673828125, 1.09814453125, 1.255615234375, 1.4130859375, 1.570556640625, 1.72802734375, 1.885498046875, 2.04296875, 2.200439453125, 2.35791015625, 2.515380859375, 2.6728515625, 2.830322265625, 2.98779296875, 3.145263671875, 3.302734375, 3.460205078125, 3.61767578125, 3.775146484375, 3.9326171875, 4.090087890625, 4.24755859375, 4.405029296875, 4.5625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 4.0, 10.0, 10.0, 9.0, 19.0, 26.0, 33.0, 61.0, 90.0, 140.0, 196.0, 304.0, 505.0, 836.0, 1280.0, 2097.0, 3407.0, 5577.0, 9655.0, 17543.0, 33118.0, 67051.0, 141722.0, 269894.0, 245062.0, 123937.0, 58703.0, 29514.0, 15700.0, 8674.0, 4999.0, 3157.0, 1881.0, 1239.0, 787.0, 431.0, 309.0, 200.0, 128.0, 78.0, 55.0, 40.0, 22.0, 18.0, 10.0, 6.0, 5.0, 11.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.91015625, -0.8824996948242188, -0.8548431396484375, -0.8271865844726562, -0.799530029296875, -0.7718734741210938, -0.7442169189453125, -0.7165603637695312, -0.68890380859375, -0.6612472534179688, -0.6335906982421875, -0.6059341430664062, -0.578277587890625, -0.5506210327148438, -0.5229644775390625, -0.49530792236328125, -0.4676513671875, -0.43999481201171875, -0.4123382568359375, -0.38468170166015625, -0.357025146484375, -0.32936859130859375, -0.3017120361328125, -0.27405548095703125, -0.24639892578125, -0.21874237060546875, -0.1910858154296875, -0.16342926025390625, -0.135772705078125, -0.10811614990234375, -0.0804595947265625, -0.05280303955078125, -0.025146484375, 0.00251007080078125, 0.0301666259765625, 0.05782318115234375, 0.085479736328125, 0.11313629150390625, 0.1407928466796875, 0.16844940185546875, 0.19610595703125, 0.22376251220703125, 0.2514190673828125, 0.27907562255859375, 0.306732177734375, 0.33438873291015625, 0.3620452880859375, 0.38970184326171875, 0.4173583984375, 0.44501495361328125, 0.4726715087890625, 0.5003280639648438, 0.527984619140625, 0.5556411743164062, 0.5832977294921875, 0.6109542846679688, 0.63861083984375, 0.6662673950195312, 0.6939239501953125, 0.7215805053710938, 0.749237060546875, 0.7768936157226562, 0.8045501708984375, 0.8322067260742188, 0.85986328125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 1.0, 6.0, 5.0, 10.0, 6.0, 8.0, 10.0, 13.0, 16.0, 20.0, 21.0, 25.0, 25.0, 26.0, 31.0, 32.0, 37.0, 36.0, 34.0, 37.0, 46.0, 44.0, 1057.0, 27.0, 44.0, 38.0, 35.0, 37.0, 31.0, 24.0, 34.0, 34.0, 25.0, 30.0, 28.0, 17.0, 9.0, 13.0, 13.0, 11.0, 5.0, 6.0, 7.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.73828125, -3.625732421875, -3.51318359375, -3.400634765625, -3.2880859375, -3.175537109375, -3.06298828125, -2.950439453125, -2.837890625, -2.725341796875, -2.61279296875, -2.500244140625, -2.3876953125, -2.275146484375, -2.16259765625, -2.050048828125, -1.9375, -1.824951171875, -1.71240234375, -1.599853515625, -1.4873046875, -1.374755859375, -1.26220703125, -1.149658203125, -1.037109375, -0.924560546875, -0.81201171875, -0.699462890625, -0.5869140625, -0.474365234375, -0.36181640625, -0.249267578125, -0.13671875, -0.024169921875, 0.08837890625, 0.200927734375, 0.3134765625, 0.426025390625, 0.53857421875, 0.651123046875, 0.763671875, 0.876220703125, 0.98876953125, 1.101318359375, 1.2138671875, 1.326416015625, 1.43896484375, 1.551513671875, 1.6640625, 1.776611328125, 1.88916015625, 2.001708984375, 2.1142578125, 2.226806640625, 2.33935546875, 2.451904296875, 2.564453125, 2.677001953125, 2.78955078125, 2.902099609375, 3.0146484375, 3.127197265625, 3.23974609375, 3.352294921875, 3.46484375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 3.0, 13.0, 18.0, 20.0, 21.0, 27.0, 57.0, 88.0, 111.0, 172.0, 273.0, 349.0, 560.0, 809.0, 1215.0, 1893.0, 2874.0, 4459.0, 6824.0, 11009.0, 17227.0, 27598.0, 44284.0, 74657.0, 126857.0, 407228.0, 1023594.0, 136106.0, 80281.0, 47795.0, 29500.0, 18603.0, 11454.0, 7348.0, 4719.0, 3055.0, 2015.0, 1292.0, 915.0, 587.0, 397.0, 248.0, 179.0, 128.0, 95.0, 63.0, 29.0, 23.0, 24.0, 12.0, 10.0, 6.0, 5.0, 2.0, 4.0, 2.0], "bins": [-0.345458984375, -0.33531951904296875, -0.3251800537109375, -0.31504058837890625, -0.304901123046875, -0.29476165771484375, -0.2846221923828125, -0.27448272705078125, -0.26434326171875, -0.25420379638671875, -0.2440643310546875, -0.23392486572265625, -0.223785400390625, -0.21364593505859375, -0.2035064697265625, -0.19336700439453125, -0.1832275390625, -0.17308807373046875, -0.1629486083984375, -0.15280914306640625, -0.142669677734375, -0.13253021240234375, -0.1223907470703125, -0.11225128173828125, -0.10211181640625, -0.09197235107421875, -0.0818328857421875, -0.07169342041015625, -0.061553955078125, -0.05141448974609375, -0.0412750244140625, -0.03113555908203125, -0.02099609375, -0.01085662841796875, -0.0007171630859375, 0.00942230224609375, 0.019561767578125, 0.02970123291015625, 0.0398406982421875, 0.04998016357421875, 0.06011962890625, 0.07025909423828125, 0.0803985595703125, 0.09053802490234375, 0.100677490234375, 0.11081695556640625, 0.1209564208984375, 0.13109588623046875, 0.1412353515625, 0.15137481689453125, 0.1615142822265625, 0.17165374755859375, 0.181793212890625, 0.19193267822265625, 0.2020721435546875, 0.21221160888671875, 0.22235107421875, 0.23249053955078125, 0.2426300048828125, 0.25276947021484375, 0.262908935546875, 0.27304840087890625, 0.2831878662109375, 0.29332733154296875, 0.303466796875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 3.0, 5.0, 3.0, 5.0, 7.0, 7.0, 8.0, 13.0, 14.0, 24.0, 20.0, 17.0, 20.0, 29.0, 23.0, 45.0, 51.0, 60.0, 50.0, 43.0, 54.0, 57.0, 66.0, 47.0, 39.0, 43.0, 31.0, 32.0, 33.0, 31.0, 19.0, 13.0, 11.0, 12.0, 12.0, 9.0, 3.0, 6.0, 2.0, 4.0, 2.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.038238525390625, -0.03709220886230469, -0.035945892333984375, -0.03479957580566406, -0.03365325927734375, -0.03250694274902344, -0.031360626220703125, -0.030214309692382812, -0.0290679931640625, -0.027921676635742188, -0.026775360107421875, -0.025629043579101562, -0.02448272705078125, -0.023336410522460938, -0.022190093994140625, -0.021043777465820312, -0.0198974609375, -0.018751144409179688, -0.017604827880859375, -0.016458511352539062, -0.01531219482421875, -0.014165878295898438, -0.013019561767578125, -0.011873245239257812, -0.0107269287109375, -0.009580612182617188, -0.008434295654296875, -0.0072879791259765625, -0.00614166259765625, -0.0049953460693359375, -0.003849029541015625, -0.0027027130126953125, -0.001556396484375, -0.0004100799560546875, 0.000736236572265625, 0.0018825531005859375, 0.00302886962890625, 0.0041751861572265625, 0.005321502685546875, 0.0064678192138671875, 0.0076141357421875, 0.008760452270507812, 0.009906768798828125, 0.011053085327148438, 0.01219940185546875, 0.013345718383789062, 0.014492034912109375, 0.015638351440429688, 0.01678466796875, 0.017930984497070312, 0.019077301025390625, 0.020223617553710938, 0.02136993408203125, 0.022516250610351562, 0.023662567138671875, 0.024808883666992188, 0.0259552001953125, 0.027101516723632812, 0.028247833251953125, 0.029394149780273438, 0.03054046630859375, 0.03168678283691406, 0.032833099365234375, 0.03397941589355469, 0.035125732421875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 8.0, 2.0, 2.0, 6.0, 2.0, 5.0, 5.0, 5.0, 10.0, 11.0, 15.0, 17.0, 20.0, 37.0, 34.0, 49.0, 62.0, 73.0, 100.0, 157.0, 230.0, 445.0, 2312.0, 828703.0, 213469.0, 1545.0, 437.0, 255.0, 151.0, 84.0, 64.0, 53.0, 32.0, 30.0, 36.0, 23.0, 11.0, 10.0, 7.0, 5.0, 8.0, 2.0, 2.0, 3.0, 9.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.7080078125, -0.6858291625976562, -0.6636505126953125, -0.6414718627929688, -0.619293212890625, -0.5971145629882812, -0.5749359130859375, -0.5527572631835938, -0.53057861328125, -0.5083999633789062, -0.4862213134765625, -0.46404266357421875, -0.441864013671875, -0.41968536376953125, -0.3975067138671875, -0.37532806396484375, -0.3531494140625, -0.33097076416015625, -0.3087921142578125, -0.28661346435546875, -0.264434814453125, -0.24225616455078125, -0.2200775146484375, -0.19789886474609375, -0.17572021484375, -0.15354156494140625, -0.1313629150390625, -0.10918426513671875, -0.087005615234375, -0.06482696533203125, -0.0426483154296875, -0.02046966552734375, 0.001708984375, 0.02388763427734375, 0.0460662841796875, 0.06824493408203125, 0.090423583984375, 0.11260223388671875, 0.1347808837890625, 0.15695953369140625, 0.17913818359375, 0.20131683349609375, 0.2234954833984375, 0.24567413330078125, 0.267852783203125, 0.29003143310546875, 0.3122100830078125, 0.33438873291015625, 0.3565673828125, 0.37874603271484375, 0.4009246826171875, 0.42310333251953125, 0.445281982421875, 0.46746063232421875, 0.4896392822265625, 0.5118179321289062, 0.53399658203125, 0.5561752319335938, 0.5783538818359375, 0.6005325317382812, 0.622711181640625, 0.6448898315429688, 0.6670684814453125, 0.6892471313476562, 0.71142578125]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 5.0, 6.0, 14.0, 72.0, 225.0, 464.0, 148.0, 37.0, 24.0, 11.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059545211493968964, -0.04999332129955292, -0.04044143110513687, -0.030889540910720825, -0.02133765071630478, -0.011785760521888733, -0.0022338703274726868, 0.007318019866943359, 0.016869910061359406, 0.02642180025577545, 0.0359736904501915, 0.045525580644607544, 0.05507747083902359, 0.06462936103343964, 0.07418125122785568, 0.08373314142227173, 0.09328503161668777, 0.10283692181110382, 0.11238881200551987, 0.12194070219993591, 0.13149258494377136, 0.141044482588768, 0.15059638023376465, 0.1601482629776001, 0.16970014572143555, 0.179252028465271, 0.18880392611026764, 0.19835582375526428, 0.20790770649909973, 0.21745958924293518, 0.22701148688793182, 0.23656338453292847, 0.24611526727676392, 0.25566715002059937, 0.2652190327644348, 0.27477094531059265, 0.2843228280544281, 0.29387471079826355, 0.3034266233444214, 0.31297850608825684, 0.3225303888320923, 0.33208227157592773, 0.3416341543197632, 0.351186066865921, 0.36073794960975647, 0.3702898323535919, 0.37984174489974976, 0.3893936276435852, 0.39894551038742065, 0.4084973931312561, 0.41804927587509155, 0.4276011884212494, 0.43715307116508484, 0.4467049539089203, 0.4562568664550781, 0.4658087491989136, 0.475360631942749, 0.4849125146865845, 0.4944643974304199, 0.5040162801742554, 0.5135681629180908, 0.523120105266571, 0.5326719880104065, 0.5422238707542419, 0.5517757534980774]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 5.0, 5.0, 4.0, 8.0, 7.0, 11.0, 11.0, 10.0, 8.0, 14.0, 16.0, 11.0, 19.0, 23.0, 25.0, 34.0, 29.0, 32.0, 22.0, 42.0, 27.0, 34.0, 38.0, 44.0, 33.0, 30.0, 51.0, 31.0, 26.0, 35.0, 33.0, 33.0, 33.0, 23.0, 19.0, 30.0, 22.0, 18.0, 18.0, 15.0, 12.0, 11.0, 7.0, 14.0, 5.0, 6.0, 5.0, 5.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11718302965164185, -0.1135890930891037, -0.10999515652656555, -0.106401227414608, -0.10280729085206985, -0.09921335428953171, -0.09561942517757416, -0.09202548861503601, -0.08843155205249786, -0.08483761548995972, -0.08124367892742157, -0.07764974981546402, -0.07405581325292587, -0.07046187669038773, -0.06686794757843018, -0.06327401101589203, -0.05968007445335388, -0.056086137890815735, -0.052492205053567886, -0.04889827221632004, -0.04530433565378189, -0.041710399091243744, -0.038116466253995895, -0.03452253341674805, -0.0309285968542099, -0.027334662154316902, -0.023740727454423904, -0.020146792754530907, -0.01655285805463791, -0.012958923354744911, -0.009364988654851913, -0.005771053954958916, -0.002177119255065918, 0.0014168154448270798, 0.0050107501447200775, 0.008604684844613075, 0.012198619544506073, 0.01579255424439907, 0.01938648894429207, 0.022980423644185066, 0.026574358344078064, 0.03016829304397106, 0.03376222774386406, 0.03735616058111191, 0.040950097143650055, 0.0445440337061882, 0.04813796654343605, 0.0517318993806839, 0.055325835943222046, 0.05891977250576019, 0.06251370906829834, 0.06610763818025589, 0.06970157474279404, 0.07329551130533218, 0.07688944041728973, 0.08048337697982788, 0.08407731354236603, 0.08767125010490417, 0.09126518666744232, 0.09485911577939987, 0.09845305234193802, 0.10204698890447617, 0.10564091801643372, 0.10923485457897186, 0.11282879114151001]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 10.0, 5.0, 8.0, 14.0, 13.0, 17.0, 17.0, 20.0, 29.0, 19.0, 27.0, 31.0, 29.0, 31.0, 24.0, 33.0, 47.0, 40.0, 35.0, 41.0, 38.0, 41.0, 38.0, 27.0, 36.0, 27.0, 25.0, 33.0, 30.0, 28.0, 28.0, 20.0, 14.0, 18.0, 19.0, 9.0, 12.0, 11.0, 10.0, 12.0, 8.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 3.0, 4.0], "bins": [-5.51953125, -5.362060546875, -5.20458984375, -5.047119140625, -4.8896484375, -4.732177734375, -4.57470703125, -4.417236328125, -4.259765625, -4.102294921875, -3.94482421875, -3.787353515625, -3.6298828125, -3.472412109375, -3.31494140625, -3.157470703125, -3.0, -2.842529296875, -2.68505859375, -2.527587890625, -2.3701171875, -2.212646484375, -2.05517578125, -1.897705078125, -1.740234375, -1.582763671875, -1.42529296875, -1.267822265625, -1.1103515625, -0.952880859375, -0.79541015625, -0.637939453125, -0.48046875, -0.322998046875, -0.16552734375, -0.008056640625, 0.1494140625, 0.306884765625, 0.46435546875, 0.621826171875, 0.779296875, 0.936767578125, 1.09423828125, 1.251708984375, 1.4091796875, 1.566650390625, 1.72412109375, 1.881591796875, 2.0390625, 2.196533203125, 2.35400390625, 2.511474609375, 2.6689453125, 2.826416015625, 2.98388671875, 3.141357421875, 3.298828125, 3.456298828125, 3.61376953125, 3.771240234375, 3.9287109375, 4.086181640625, 4.24365234375, 4.401123046875, 4.55859375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 3.0, 10.0, 16.0, 18.0, 18.0, 34.0, 45.0, 59.0, 84.0, 88.0, 158.0, 179.0, 271.0, 344.0, 456.0, 585.0, 819.0, 1135.0, 1458.0, 2140.0, 3242.0, 5139.0, 9829.0, 32298.0, 399085.0, 522380.0, 40596.0, 11029.0, 5455.0, 3306.0, 2237.0, 1594.0, 1120.0, 847.0, 622.0, 475.0, 328.0, 268.0, 187.0, 163.0, 115.0, 83.0, 66.0, 49.0, 34.0, 37.0, 15.0, 4.0, 8.0, 7.0, 9.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-12.5859375, -12.193359375, -11.80078125, -11.408203125, -11.015625, -10.623046875, -10.23046875, -9.837890625, -9.4453125, -9.052734375, -8.66015625, -8.267578125, -7.875, -7.482421875, -7.08984375, -6.697265625, -6.3046875, -5.912109375, -5.51953125, -5.126953125, -4.734375, -4.341796875, -3.94921875, -3.556640625, -3.1640625, -2.771484375, -2.37890625, -1.986328125, -1.59375, -1.201171875, -0.80859375, -0.416015625, -0.0234375, 0.369140625, 0.76171875, 1.154296875, 1.546875, 1.939453125, 2.33203125, 2.724609375, 3.1171875, 3.509765625, 3.90234375, 4.294921875, 4.6875, 5.080078125, 5.47265625, 5.865234375, 6.2578125, 6.650390625, 7.04296875, 7.435546875, 7.828125, 8.220703125, 8.61328125, 9.005859375, 9.3984375, 9.791015625, 10.18359375, 10.576171875, 10.96875, 11.361328125, 11.75390625, 12.146484375, 12.5390625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 14.0, 13.0, 14.0, 20.0, 19.0, 36.0, 27.0, 35.0, 32.0, 44.0, 46.0, 56.0, 61.0, 77.0, 150.0, 1620.0, 228.0, 82.0, 70.0, 50.0, 45.0, 46.0, 44.0, 39.0, 36.0, 26.0, 22.0, 27.0, 11.0, 16.0, 11.0, 12.0, 7.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.15625, -21.498779296875, -20.84130859375, -20.183837890625, -19.5263671875, -18.868896484375, -18.21142578125, -17.553955078125, -16.896484375, -16.239013671875, -15.58154296875, -14.924072265625, -14.2666015625, -13.609130859375, -12.95166015625, -12.294189453125, -11.63671875, -10.979248046875, -10.32177734375, -9.664306640625, -9.0068359375, -8.349365234375, -7.69189453125, -7.034423828125, -6.376953125, -5.719482421875, -5.06201171875, -4.404541015625, -3.7470703125, -3.089599609375, -2.43212890625, -1.774658203125, -1.1171875, -0.459716796875, 0.19775390625, 0.855224609375, 1.5126953125, 2.170166015625, 2.82763671875, 3.485107421875, 4.142578125, 4.800048828125, 5.45751953125, 6.114990234375, 6.7724609375, 7.429931640625, 8.08740234375, 8.744873046875, 9.40234375, 10.059814453125, 10.71728515625, 11.374755859375, 12.0322265625, 12.689697265625, 13.34716796875, 14.004638671875, 14.662109375, 15.319580078125, 15.97705078125, 16.634521484375, 17.2919921875, 17.949462890625, 18.60693359375, 19.264404296875, 19.921875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 8.0, 10.0, 14.0, 21.0, 26.0, 26.0, 42.0, 51.0, 101.0, 149.0, 253.0, 392.0, 854.0, 1488.0, 3040.0, 6595.0, 16415.0, 75739.0, 2829682.0, 172010.0, 22698.0, 8318.0, 3706.0, 1820.0, 972.0, 509.0, 272.0, 181.0, 92.0, 79.0, 36.0, 30.0, 24.0, 19.0, 9.0, 10.0, 5.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.859375, -28.91552734375, -27.9716796875, -27.02783203125, -26.083984375, -25.14013671875, -24.1962890625, -23.25244140625, -22.30859375, -21.36474609375, -20.4208984375, -19.47705078125, -18.533203125, -17.58935546875, -16.6455078125, -15.70166015625, -14.7578125, -13.81396484375, -12.8701171875, -11.92626953125, -10.982421875, -10.03857421875, -9.0947265625, -8.15087890625, -7.20703125, -6.26318359375, -5.3193359375, -4.37548828125, -3.431640625, -2.48779296875, -1.5439453125, -0.60009765625, 0.34375, 1.28759765625, 2.2314453125, 3.17529296875, 4.119140625, 5.06298828125, 6.0068359375, 6.95068359375, 7.89453125, 8.83837890625, 9.7822265625, 10.72607421875, 11.669921875, 12.61376953125, 13.5576171875, 14.50146484375, 15.4453125, 16.38916015625, 17.3330078125, 18.27685546875, 19.220703125, 20.16455078125, 21.1083984375, 22.05224609375, 22.99609375, 23.93994140625, 24.8837890625, 25.82763671875, 26.771484375, 27.71533203125, 28.6591796875, 29.60302734375, 30.546875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [23.0, 838.0, 155.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.15609359741211, -12.435873031616211, 5.2843475341796875, 23.004566192626953, 40.724788665771484, 58.445011138916016, 76.16522216796875, 93.88545227050781, 111.60566711425781, 129.3258819580078, 147.04611206054688, 164.76632690429688, 182.48654174804688, 200.20677185058594, 217.92698669433594, 235.647216796875, 253.367431640625, 271.087646484375, 288.807861328125, 306.528076171875, 324.2483215332031, 341.9685363769531, 359.6887512207031, 377.4089660644531, 395.12921142578125, 412.84942626953125, 430.56964111328125, 448.28985595703125, 466.0101013183594, 483.7303161621094, 501.4505310058594, 519.1707763671875, 536.8909301757812, 554.6111450195312, 572.3313598632812, 590.0515747070312, 607.7717895507812, 625.4920654296875, 643.2122802734375, 660.9324951171875, 678.6527099609375, 696.3729248046875, 714.0931396484375, 731.8133544921875, 749.5335693359375, 767.2537841796875, 784.9739990234375, 802.6942749023438, 820.4144287109375, 838.1346435546875, 855.8548583984375, 873.5750732421875, 891.2952880859375, 909.0155029296875, 926.7357177734375, 944.4559936523438, 962.1762084960938, 979.8964233398438, 997.6166381835938, 1015.3368530273438, 1033.05712890625, 1050.77734375, 1068.49755859375, 1086.2177734375, 1103.93798828125]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 5.0, 3.0, 5.0, 6.0, 11.0, 11.0, 10.0, 21.0, 11.0, 24.0, 20.0, 19.0, 27.0, 21.0, 31.0, 40.0, 30.0, 45.0, 40.0, 37.0, 39.0, 43.0, 37.0, 37.0, 37.0, 31.0, 36.0, 39.0, 26.0, 31.0, 25.0, 19.0, 26.0, 29.0, 25.0, 19.0, 17.0, 11.0, 13.0, 8.0, 8.0, 5.0, 6.0, 6.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.10598373413086, -56.234596252441406, -54.36320877075195, -52.4918212890625, -50.62043380737305, -48.749046325683594, -46.877655029296875, -45.00627136230469, -43.13488006591797, -41.263492584228516, -39.39210510253906, -37.52071762084961, -35.649330139160156, -33.7779426574707, -31.906553268432617, -30.035165786743164, -28.163780212402344, -26.29239273071289, -24.421005249023438, -22.549617767333984, -20.67823028564453, -18.806842803955078, -16.935453414916992, -15.064065933227539, -13.192678451538086, -11.321290969848633, -9.44990348815918, -7.57851505279541, -5.707127571105957, -3.835740089416504, -1.9643516540527344, -0.09296417236328125, 1.7784271240234375, 3.6498148441314697, 5.521202564239502, 7.392590522766113, 9.263978004455566, 11.13536548614502, 13.006753921508789, 14.878141403198242, 16.749528884887695, 18.62091636657715, 20.4923038482666, 22.363693237304688, 24.23508071899414, 26.106468200683594, 27.977855682373047, 29.8492431640625, 31.720630645751953, 33.592018127441406, 35.46340560913086, 37.33479309082031, 39.206180572509766, 41.07756805419922, 42.94895935058594, 44.820343017578125, 46.691734313964844, 48.5631217956543, 50.43450927734375, 52.3058967590332, 54.177284240722656, 56.04867172241211, 57.92005920410156, 59.79145050048828, 61.66283416748047]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 2.0, 11.0, 10.0, 8.0, 15.0, 13.0, 24.0, 19.0, 22.0, 28.0, 21.0, 27.0, 32.0, 33.0, 38.0, 39.0, 37.0, 36.0, 48.0, 44.0, 35.0, 45.0, 43.0, 30.0, 32.0, 32.0, 26.0, 29.0, 31.0, 24.0, 19.0, 20.0, 23.0, 18.0, 14.0, 10.0, 15.0, 10.0, 6.0, 9.0, 9.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.34588623046875, -5.1722412109375, -4.99859619140625, -4.824951171875, -4.65130615234375, -4.4776611328125, -4.30401611328125, -4.13037109375, -3.95672607421875, -3.7830810546875, -3.60943603515625, -3.435791015625, -3.26214599609375, -3.0885009765625, -2.91485595703125, -2.7412109375, -2.56756591796875, -2.3939208984375, -2.22027587890625, -2.046630859375, -1.87298583984375, -1.6993408203125, -1.52569580078125, -1.35205078125, -1.17840576171875, -1.0047607421875, -0.83111572265625, -0.657470703125, -0.48382568359375, -0.3101806640625, -0.13653564453125, 0.037109375, 0.21075439453125, 0.3843994140625, 0.55804443359375, 0.731689453125, 0.90533447265625, 1.0789794921875, 1.25262451171875, 1.42626953125, 1.59991455078125, 1.7735595703125, 1.94720458984375, 2.120849609375, 2.29449462890625, 2.4681396484375, 2.64178466796875, 2.8154296875, 2.98907470703125, 3.1627197265625, 3.33636474609375, 3.510009765625, 3.68365478515625, 3.8572998046875, 4.03094482421875, 4.20458984375, 4.37823486328125, 4.5518798828125, 4.72552490234375, 4.899169921875, 5.07281494140625, 5.2464599609375, 5.42010498046875, 5.59375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 11.0, 7.0, 9.0, 13.0, 20.0, 29.0, 52.0, 102.0, 144.0, 282.0, 539.0, 988.0, 2013.0, 4226.0, 10143.0, 26452.0, 97427.0, 1805913.0, 2092925.0, 105909.0, 28042.0, 10394.0, 4472.0, 1920.0, 1054.0, 507.0, 269.0, 153.0, 75.0, 59.0, 35.0, 32.0, 20.0, 15.0, 8.0, 3.0, 8.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.671875, -22.8271484375, -21.982421875, -21.1376953125, -20.29296875, -19.4482421875, -18.603515625, -17.7587890625, -16.9140625, -16.0693359375, -15.224609375, -14.3798828125, -13.53515625, -12.6904296875, -11.845703125, -11.0009765625, -10.15625, -9.3115234375, -8.466796875, -7.6220703125, -6.77734375, -5.9326171875, -5.087890625, -4.2431640625, -3.3984375, -2.5537109375, -1.708984375, -0.8642578125, -0.01953125, 0.8251953125, 1.669921875, 2.5146484375, 3.359375, 4.2041015625, 5.048828125, 5.8935546875, 6.73828125, 7.5830078125, 8.427734375, 9.2724609375, 10.1171875, 10.9619140625, 11.806640625, 12.6513671875, 13.49609375, 14.3408203125, 15.185546875, 16.0302734375, 16.875, 17.7197265625, 18.564453125, 19.4091796875, 20.25390625, 21.0986328125, 21.943359375, 22.7880859375, 23.6328125, 24.4775390625, 25.322265625, 26.1669921875, 27.01171875, 27.8564453125, 28.701171875, 29.5458984375, 30.390625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 11.0, 12.0, 10.0, 28.0, 26.0, 47.0, 65.0, 95.0, 122.0, 228.0, 348.0, 595.0, 783.0, 603.0, 400.0, 240.0, 147.0, 95.0, 47.0, 46.0, 35.0, 18.0, 26.0, 16.0, 6.0, 4.0, 10.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.328125, -15.63427734375, -14.9404296875, -14.24658203125, -13.552734375, -12.85888671875, -12.1650390625, -11.47119140625, -10.77734375, -10.08349609375, -9.3896484375, -8.69580078125, -8.001953125, -7.30810546875, -6.6142578125, -5.92041015625, -5.2265625, -4.53271484375, -3.8388671875, -3.14501953125, -2.451171875, -1.75732421875, -1.0634765625, -0.36962890625, 0.32421875, 1.01806640625, 1.7119140625, 2.40576171875, 3.099609375, 3.79345703125, 4.4873046875, 5.18115234375, 5.875, 6.56884765625, 7.2626953125, 7.95654296875, 8.650390625, 9.34423828125, 10.0380859375, 10.73193359375, 11.42578125, 12.11962890625, 12.8134765625, 13.50732421875, 14.201171875, 14.89501953125, 15.5888671875, 16.28271484375, 16.9765625, 17.67041015625, 18.3642578125, 19.05810546875, 19.751953125, 20.44580078125, 21.1396484375, 21.83349609375, 22.52734375, 23.22119140625, 23.9150390625, 24.60888671875, 25.302734375, 25.99658203125, 26.6904296875, 27.38427734375, 28.078125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 6.0, 12.0, 10.0, 11.0, 15.0, 31.0, 50.0, 67.0, 107.0, 202.0, 386.0, 757.0, 1468.0, 3340.0, 7570.0, 19028.0, 51094.0, 172584.0, 1372794.0, 2210842.0, 247825.0, 65421.0, 23484.0, 9376.0, 4040.0, 1832.0, 904.0, 411.0, 248.0, 145.0, 67.0, 50.0, 38.0, 22.0, 14.0, 8.0, 9.0, 8.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-34.875, -33.9599609375, -33.044921875, -32.1298828125, -31.21484375, -30.2998046875, -29.384765625, -28.4697265625, -27.5546875, -26.6396484375, -25.724609375, -24.8095703125, -23.89453125, -22.9794921875, -22.064453125, -21.1494140625, -20.234375, -19.3193359375, -18.404296875, -17.4892578125, -16.57421875, -15.6591796875, -14.744140625, -13.8291015625, -12.9140625, -11.9990234375, -11.083984375, -10.1689453125, -9.25390625, -8.3388671875, -7.423828125, -6.5087890625, -5.59375, -4.6787109375, -3.763671875, -2.8486328125, -1.93359375, -1.0185546875, -0.103515625, 0.8115234375, 1.7265625, 2.6416015625, 3.556640625, 4.4716796875, 5.38671875, 6.3017578125, 7.216796875, 8.1318359375, 9.046875, 9.9619140625, 10.876953125, 11.7919921875, 12.70703125, 13.6220703125, 14.537109375, 15.4521484375, 16.3671875, 17.2822265625, 18.197265625, 19.1123046875, 20.02734375, 20.9423828125, 21.857421875, 22.7724609375, 23.6875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 26.0, 28.0, 95.0, 112.0, 154.0, 197.0, 167.0, 104.0, 63.0, 25.0, 18.0, 10.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.56088256835938, -109.8447494506836, -104.12861633300781, -98.4124755859375, -92.69634246826172, -86.98020935058594, -81.26406860351562, -75.54793548583984, -69.83180236816406, -64.11566925048828, -58.399532318115234, -52.68339538574219, -46.967262268066406, -41.251129150390625, -35.53499221801758, -29.81885528564453, -24.10272216796875, -18.386587142944336, -12.670452117919922, -6.954317092895508, -1.2381820678710938, 4.47795295715332, 10.194087982177734, 15.910224914550781, 21.626358032226562, 27.342493057250977, 33.05862808227539, 38.77476501464844, 44.49089813232422, 50.20703125, 55.92316818237305, 61.639305114746094, 67.35545349121094, 73.07158660888672, 78.7877197265625, 84.50386047363281, 90.2199935913086, 95.93612670898438, 101.65226745605469, 107.36840057373047, 113.08453369140625, 118.80066680908203, 124.51679992675781, 130.23294067382812, 135.94906616210938, 141.6652069091797, 147.38134765625, 153.09747314453125, 158.81361389160156, 164.52975463867188, 170.24588012695312, 175.96202087402344, 181.67816162109375, 187.394287109375, 193.1104278564453, 198.82656860351562, 204.54269409179688, 210.2588348388672, 215.97496032714844, 221.69110107421875, 227.4072265625, 233.1233673095703, 238.83950805664062, 244.55563354492188, 250.2717742919922]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 10.0, 16.0, 19.0, 13.0, 15.0, 19.0, 34.0, 30.0, 25.0, 42.0, 36.0, 37.0, 36.0, 39.0, 44.0, 38.0, 53.0, 37.0, 55.0, 44.0, 35.0, 40.0, 38.0, 35.0, 17.0, 19.0, 20.0, 17.0, 25.0, 22.0, 10.0, 18.0, 7.0, 9.0, 5.0, 10.0, 4.0, 6.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.1502685546875, -53.32899475097656, -51.50772476196289, -49.68645095825195, -47.86518096923828, -46.043907165527344, -44.222633361816406, -42.40135955810547, -40.5800895690918, -38.75881576538086, -36.93754577636719, -35.11627197265625, -33.29499816894531, -31.47372817993164, -29.652454376220703, -27.8311824798584, -26.009910583496094, -24.18863868713379, -22.367366790771484, -20.546092987060547, -18.724821090698242, -16.903549194335938, -15.082276344299316, -13.261003494262695, -11.43973159790039, -9.618459701538086, -7.797186851501465, -5.975914478302002, -4.154642105102539, -2.3333702087402344, -0.5120973587036133, 1.3091754913330078, 3.1304473876953125, 4.951719760894775, 6.772992134094238, 8.59426498413086, 10.415536880493164, 12.236808776855469, 14.05808162689209, 15.879354476928711, 17.700626373291016, 19.52189826965332, 21.343170166015625, 23.164443969726562, 24.985715866088867, 26.806987762451172, 28.62826156616211, 30.449533462524414, 32.27080535888672, 34.092079162597656, 35.91334915161133, 37.734622955322266, 39.55589294433594, 41.377166748046875, 43.19844055175781, 45.01971435546875, 46.84098434448242, 48.66225814819336, 50.48352813720703, 52.30480194091797, 54.126075744628906, 55.94734573364258, 57.768619537353516, 59.58988952636719, 61.411163330078125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 8.0, 2.0, 2.0, 7.0, 8.0, 12.0, 16.0, 17.0, 17.0, 28.0, 27.0, 27.0, 24.0, 33.0, 34.0, 34.0, 42.0, 49.0, 39.0, 49.0, 36.0, 52.0, 40.0, 35.0, 37.0, 35.0, 40.0, 32.0, 27.0, 25.0, 24.0, 27.0, 12.0, 26.0, 17.0, 14.0, 9.0, 4.0, 6.0, 8.0, 8.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.6015625, -6.40594482421875, -6.2103271484375, -6.01470947265625, -5.819091796875, -5.62347412109375, -5.4278564453125, -5.23223876953125, -5.03662109375, -4.84100341796875, -4.6453857421875, -4.44976806640625, -4.254150390625, -4.05853271484375, -3.8629150390625, -3.66729736328125, -3.4716796875, -3.27606201171875, -3.0804443359375, -2.88482666015625, -2.689208984375, -2.49359130859375, -2.2979736328125, -2.10235595703125, -1.90673828125, -1.71112060546875, -1.5155029296875, -1.31988525390625, -1.124267578125, -0.92864990234375, -0.7330322265625, -0.53741455078125, -0.341796875, -0.14617919921875, 0.0494384765625, 0.24505615234375, 0.440673828125, 0.63629150390625, 0.8319091796875, 1.02752685546875, 1.22314453125, 1.41876220703125, 1.6143798828125, 1.80999755859375, 2.005615234375, 2.20123291015625, 2.3968505859375, 2.59246826171875, 2.7880859375, 2.98370361328125, 3.1793212890625, 3.37493896484375, 3.570556640625, 3.76617431640625, 3.9617919921875, 4.15740966796875, 4.35302734375, 4.54864501953125, 4.7442626953125, 4.93988037109375, 5.135498046875, 5.33111572265625, 5.5267333984375, 5.72235107421875, 5.91796875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 9.0, 21.0, 29.0, 46.0, 66.0, 96.0, 156.0, 262.0, 410.0, 667.0, 1117.0, 1983.0, 3221.0, 5633.0, 10150.0, 18607.0, 35083.0, 70112.0, 142614.0, 265691.0, 239743.0, 123494.0, 60715.0, 31063.0, 16100.0, 9126.0, 5044.0, 2913.0, 1675.0, 1085.0, 624.0, 336.0, 256.0, 148.0, 92.0, 55.0, 40.0, 17.0, 12.0, 19.0, 9.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.072265625, -1.0396728515625, -1.007080078125, -0.9744873046875, -0.94189453125, -0.9093017578125, -0.876708984375, -0.8441162109375, -0.8115234375, -0.7789306640625, -0.746337890625, -0.7137451171875, -0.68115234375, -0.6485595703125, -0.615966796875, -0.5833740234375, -0.55078125, -0.5181884765625, -0.485595703125, -0.4530029296875, -0.42041015625, -0.3878173828125, -0.355224609375, -0.3226318359375, -0.2900390625, -0.2574462890625, -0.224853515625, -0.1922607421875, -0.15966796875, -0.1270751953125, -0.094482421875, -0.0618896484375, -0.029296875, 0.0032958984375, 0.035888671875, 0.0684814453125, 0.10107421875, 0.1336669921875, 0.166259765625, 0.1988525390625, 0.2314453125, 0.2640380859375, 0.296630859375, 0.3292236328125, 0.36181640625, 0.3944091796875, 0.427001953125, 0.4595947265625, 0.4921875, 0.5247802734375, 0.557373046875, 0.5899658203125, 0.62255859375, 0.6551513671875, 0.687744140625, 0.7203369140625, 0.7529296875, 0.7855224609375, 0.818115234375, 0.8507080078125, 0.88330078125, 0.9158935546875, 0.948486328125, 0.9810791015625, 1.013671875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 4.0, 7.0, 4.0, 10.0, 4.0, 8.0, 11.0, 16.0, 8.0, 17.0, 19.0, 22.0, 22.0, 24.0, 33.0, 43.0, 35.0, 37.0, 33.0, 34.0, 40.0, 34.0, 1062.0, 57.0, 31.0, 41.0, 30.0, 47.0, 38.0, 34.0, 33.0, 27.0, 20.0, 24.0, 24.0, 11.0, 15.0, 14.0, 16.0, 8.0, 7.0, 4.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.12109375, -3.99267578125, -3.8642578125, -3.73583984375, -3.607421875, -3.47900390625, -3.3505859375, -3.22216796875, -3.09375, -2.96533203125, -2.8369140625, -2.70849609375, -2.580078125, -2.45166015625, -2.3232421875, -2.19482421875, -2.06640625, -1.93798828125, -1.8095703125, -1.68115234375, -1.552734375, -1.42431640625, -1.2958984375, -1.16748046875, -1.0390625, -0.91064453125, -0.7822265625, -0.65380859375, -0.525390625, -0.39697265625, -0.2685546875, -0.14013671875, -0.01171875, 0.11669921875, 0.2451171875, 0.37353515625, 0.501953125, 0.63037109375, 0.7587890625, 0.88720703125, 1.015625, 1.14404296875, 1.2724609375, 1.40087890625, 1.529296875, 1.65771484375, 1.7861328125, 1.91455078125, 2.04296875, 2.17138671875, 2.2998046875, 2.42822265625, 2.556640625, 2.68505859375, 2.8134765625, 2.94189453125, 3.0703125, 3.19873046875, 3.3271484375, 3.45556640625, 3.583984375, 3.71240234375, 3.8408203125, 3.96923828125, 4.09765625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 19.0, 39.0, 46.0, 69.0, 93.0, 144.0, 256.0, 408.0, 650.0, 888.0, 1467.0, 2379.0, 3718.0, 5644.0, 9121.0, 14783.0, 24456.0, 39420.0, 68037.0, 120006.0, 318229.0, 1120238.0, 156727.0, 83833.0, 49084.0, 29167.0, 17876.0, 11330.0, 6892.0, 4430.0, 2691.0, 1819.0, 1153.0, 722.0, 481.0, 299.0, 189.0, 112.0, 71.0, 55.0, 30.0, 23.0, 14.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.342041015625, -0.3303260803222656, -0.31861114501953125, -0.3068962097167969, -0.2951812744140625, -0.2834663391113281, -0.27175140380859375, -0.2600364685058594, -0.248321533203125, -0.23660659790039062, -0.22489166259765625, -0.21317672729492188, -0.2014617919921875, -0.18974685668945312, -0.17803192138671875, -0.16631698608398438, -0.15460205078125, -0.14288711547851562, -0.13117218017578125, -0.11945724487304688, -0.1077423095703125, -0.09602737426757812, -0.08431243896484375, -0.07259750366210938, -0.060882568359375, -0.049167633056640625, -0.03745269775390625, -0.025737762451171875, -0.0140228271484375, -0.002307891845703125, 0.00940704345703125, 0.021121978759765625, 0.0328369140625, 0.044551849365234375, 0.05626678466796875, 0.06798171997070312, 0.0796966552734375, 0.09141159057617188, 0.10312652587890625, 0.11484146118164062, 0.126556396484375, 0.13827133178710938, 0.14998626708984375, 0.16170120239257812, 0.1734161376953125, 0.18513107299804688, 0.19684600830078125, 0.20856094360351562, 0.22027587890625, 0.23199081420898438, 0.24370574951171875, 0.2554206848144531, 0.2671356201171875, 0.2788505554199219, 0.29056549072265625, 0.3022804260253906, 0.313995361328125, 0.3257102966308594, 0.33742523193359375, 0.3491401672363281, 0.3608551025390625, 0.3725700378417969, 0.38428497314453125, 0.3959999084472656, 0.40771484375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 6.0, 8.0, 13.0, 14.0, 14.0, 21.0, 33.0, 45.0, 37.0, 68.0, 78.0, 64.0, 78.0, 79.0, 88.0, 64.0, 57.0, 59.0, 33.0, 24.0, 16.0, 22.0, 11.0, 8.0, 11.0, 3.0, 4.0, 7.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0], "bins": [-0.1048583984375, -0.1016702651977539, -0.09848213195800781, -0.09529399871826172, -0.09210586547851562, -0.08891773223876953, -0.08572959899902344, -0.08254146575927734, -0.07935333251953125, -0.07616519927978516, -0.07297706604003906, -0.06978893280029297, -0.06660079956054688, -0.06341266632080078, -0.06022453308105469, -0.057036399841308594, -0.0538482666015625, -0.050660133361816406, -0.04747200012207031, -0.04428386688232422, -0.041095733642578125, -0.03790760040283203, -0.03471946716308594, -0.031531333923339844, -0.02834320068359375, -0.025155067443847656, -0.021966934204101562, -0.01877880096435547, -0.015590667724609375, -0.012402534484863281, -0.009214401245117188, -0.006026268005371094, -0.002838134765625, 0.00034999847412109375, 0.0035381317138671875, 0.006726264953613281, 0.009914398193359375, 0.013102531433105469, 0.016290664672851562, 0.019478797912597656, 0.02266693115234375, 0.025855064392089844, 0.029043197631835938, 0.03223133087158203, 0.035419464111328125, 0.03860759735107422, 0.04179573059082031, 0.044983863830566406, 0.0481719970703125, 0.051360130310058594, 0.05454826354980469, 0.05773639678955078, 0.060924530029296875, 0.06411266326904297, 0.06730079650878906, 0.07048892974853516, 0.07367706298828125, 0.07686519622802734, 0.08005332946777344, 0.08324146270751953, 0.08642959594726562, 0.08961772918701172, 0.09280586242675781, 0.0959939956665039, 0.09918212890625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 4.0, 5.0, 4.0, 8.0, 3.0, 15.0, 11.0, 17.0, 31.0, 32.0, 46.0, 82.0, 126.0, 196.0, 562.0, 5405.0, 993088.0, 46770.0, 1365.0, 289.0, 169.0, 96.0, 57.0, 47.0, 36.0, 15.0, 14.0, 11.0, 11.0, 7.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.0703125, -2.005096435546875, -1.93988037109375, -1.874664306640625, -1.8094482421875, -1.744232177734375, -1.67901611328125, -1.613800048828125, -1.548583984375, -1.483367919921875, -1.41815185546875, -1.352935791015625, -1.2877197265625, -1.222503662109375, -1.15728759765625, -1.092071533203125, -1.02685546875, -0.961639404296875, -0.89642333984375, -0.831207275390625, -0.7659912109375, -0.700775146484375, -0.63555908203125, -0.570343017578125, -0.505126953125, -0.439910888671875, -0.37469482421875, -0.309478759765625, -0.2442626953125, -0.179046630859375, -0.11383056640625, -0.048614501953125, 0.0166015625, 0.081817626953125, 0.14703369140625, 0.212249755859375, 0.2774658203125, 0.342681884765625, 0.40789794921875, 0.473114013671875, 0.538330078125, 0.603546142578125, 0.66876220703125, 0.733978271484375, 0.7991943359375, 0.864410400390625, 0.92962646484375, 0.994842529296875, 1.06005859375, 1.125274658203125, 1.19049072265625, 1.255706787109375, 1.3209228515625, 1.386138916015625, 1.45135498046875, 1.516571044921875, 1.581787109375, 1.647003173828125, 1.71221923828125, 1.777435302734375, 1.8426513671875, 1.907867431640625, 1.97308349609375, 2.038299560546875, 2.103515625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 15.0, 17.0, 29.0, 43.0, 64.0, 112.0, 278.0, 185.0, 102.0, 56.0, 33.0, 16.0, 16.0, 6.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19301098585128784, -0.1807277500629425, -0.16844452917575836, -0.15616129338741302, -0.14387807250022888, -0.13159483671188354, -0.11931160092353821, -0.10702837258577347, -0.09474514424800873, -0.08246191591024399, -0.07017868757247925, -0.05789545178413391, -0.04561222344636917, -0.03332899510860443, -0.021045759320259094, -0.008762530982494354, 0.0035206973552703857, 0.015803927555680275, 0.028087157756090164, 0.0403703898191452, 0.05265361815690994, 0.06493684649467468, 0.07722008228302002, 0.08950331062078476, 0.1017865389585495, 0.11406976729631424, 0.12635299563407898, 0.13863623142242432, 0.15091946721076965, 0.1632026880979538, 0.17548592388629913, 0.18776914477348328, 0.2000523805618286, 0.21233561635017395, 0.2246188372373581, 0.23690207302570343, 0.24918529391288757, 0.2614685297012329, 0.27375176548957825, 0.2860350012779236, 0.29831820726394653, 0.31060144305229187, 0.3228846788406372, 0.33516788482666016, 0.3474511206150055, 0.35973435640335083, 0.37201759219169617, 0.3843008279800415, 0.39658406376838684, 0.4088672995567322, 0.4211505353450775, 0.43343377113342285, 0.4457169771194458, 0.45800021290779114, 0.4702834486961365, 0.4825666844844818, 0.49484992027282715, 0.5071331262588501, 0.5194163918495178, 0.5316995978355408, 0.5439828634262085, 0.5562660694122314, 0.5685492753982544, 0.5808325409889221, 0.5931157469749451]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 5.0, 6.0, 5.0, 12.0, 12.0, 9.0, 14.0, 11.0, 16.0, 19.0, 14.0, 20.0, 25.0, 23.0, 29.0, 41.0, 31.0, 39.0, 28.0, 46.0, 42.0, 42.0, 30.0, 34.0, 31.0, 37.0, 26.0, 35.0, 23.0, 43.0, 22.0, 29.0, 23.0, 23.0, 20.0, 22.0, 15.0, 15.0, 20.0, 12.0, 6.0, 10.0, 4.0, 8.0, 7.0, 1.0, 2.0, 5.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.2616593837738037, -0.2540225386619568, -0.24638566374778748, -0.23874881863594055, -0.23111195862293243, -0.22347509860992432, -0.2158382534980774, -0.20820139348506927, -0.20056453347206116, -0.19292767345905304, -0.18529081344604492, -0.177653968334198, -0.17001710832118988, -0.16238024830818176, -0.15474340319633484, -0.14710654318332672, -0.1394696831703186, -0.13183282315731049, -0.12419597059488297, -0.11655911803245544, -0.10892225801944733, -0.10128539800643921, -0.09364854544401169, -0.08601169288158417, -0.07837483286857605, -0.07073797285556793, -0.06310112029314041, -0.05546426400542259, -0.04782740771770477, -0.040190551429986954, -0.032553695142269135, -0.024916838854551315, -0.017279982566833496, -0.009643126279115677, -0.0020062699913978577, 0.0056305862963199615, 0.01326744258403778, 0.0209042988717556, 0.02854115515947342, 0.03617801144719124, 0.04381486773490906, 0.05145172402262688, 0.059088580310344696, 0.06672543287277222, 0.07436229288578033, 0.08199915289878845, 0.08963600546121597, 0.0972728580236435, 0.10490971803665161, 0.11254657804965973, 0.12018343061208725, 0.12782028317451477, 0.1354571431875229, 0.143094003200531, 0.15073084831237793, 0.15836770832538605, 0.16600456833839417, 0.17364142835140228, 0.1812782883644104, 0.18891513347625732, 0.19655199348926544, 0.20418885350227356, 0.21182569861412048, 0.2194625586271286, 0.22709941864013672]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 7.0, 3.0, 2.0, 7.0, 7.0, 12.0, 17.0, 17.0, 15.0, 29.0, 27.0, 27.0, 24.0, 30.0, 38.0, 34.0, 38.0, 52.0, 37.0, 50.0, 36.0, 53.0, 40.0, 35.0, 35.0, 38.0, 40.0, 32.0, 27.0, 24.0, 24.0, 27.0, 13.0, 26.0, 16.0, 15.0, 8.0, 5.0, 6.0, 8.0, 7.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.61328125, -6.41754150390625, -6.2218017578125, -6.02606201171875, -5.830322265625, -5.63458251953125, -5.4388427734375, -5.24310302734375, -5.04736328125, -4.85162353515625, -4.6558837890625, -4.46014404296875, -4.264404296875, -4.06866455078125, -3.8729248046875, -3.67718505859375, -3.4814453125, -3.28570556640625, -3.0899658203125, -2.89422607421875, -2.698486328125, -2.50274658203125, -2.3070068359375, -2.11126708984375, -1.91552734375, -1.71978759765625, -1.5240478515625, -1.32830810546875, -1.132568359375, -0.93682861328125, -0.7410888671875, -0.54534912109375, -0.349609375, -0.15386962890625, 0.0418701171875, 0.23760986328125, 0.433349609375, 0.62908935546875, 0.8248291015625, 1.02056884765625, 1.21630859375, 1.41204833984375, 1.6077880859375, 1.80352783203125, 1.999267578125, 2.19500732421875, 2.3907470703125, 2.58648681640625, 2.7822265625, 2.97796630859375, 3.1737060546875, 3.36944580078125, 3.565185546875, 3.76092529296875, 3.9566650390625, 4.15240478515625, 4.34814453125, 4.54388427734375, 4.7396240234375, 4.93536376953125, 5.131103515625, 5.32684326171875, 5.5225830078125, 5.71832275390625, 5.9140625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 1.0, 11.0, 19.0, 24.0, 28.0, 45.0, 59.0, 92.0, 163.0, 211.0, 334.0, 491.0, 676.0, 1008.0, 1475.0, 2145.0, 3230.0, 5312.0, 11837.0, 54249.0, 624269.0, 291217.0, 29684.0, 8605.0, 4458.0, 2890.0, 1896.0, 1265.0, 940.0, 594.0, 456.0, 277.0, 183.0, 138.0, 81.0, 52.0, 54.0, 32.0, 13.0, 15.0, 12.0, 8.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.9375, -14.453125, -13.96875, -13.484375, -13.0, -12.515625, -12.03125, -11.546875, -11.0625, -10.578125, -10.09375, -9.609375, -9.125, -8.640625, -8.15625, -7.671875, -7.1875, -6.703125, -6.21875, -5.734375, -5.25, -4.765625, -4.28125, -3.796875, -3.3125, -2.828125, -2.34375, -1.859375, -1.375, -0.890625, -0.40625, 0.078125, 0.5625, 1.046875, 1.53125, 2.015625, 2.5, 2.984375, 3.46875, 3.953125, 4.4375, 4.921875, 5.40625, 5.890625, 6.375, 6.859375, 7.34375, 7.828125, 8.3125, 8.796875, 9.28125, 9.765625, 10.25, 10.734375, 11.21875, 11.703125, 12.1875, 12.671875, 13.15625, 13.640625, 14.125, 14.609375, 15.09375, 15.578125, 16.0625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 1.0, 3.0, 5.0, 9.0, 6.0, 6.0, 6.0, 11.0, 10.0, 16.0, 14.0, 17.0, 23.0, 19.0, 23.0, 17.0, 32.0, 34.0, 30.0, 49.0, 40.0, 53.0, 97.0, 189.0, 1487.0, 283.0, 108.0, 69.0, 52.0, 44.0, 45.0, 25.0, 34.0, 27.0, 26.0, 24.0, 18.0, 17.0, 12.0, 11.0, 22.0, 5.0, 9.0, 6.0, 5.0, 3.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0], "bins": [-21.46875, -20.866943359375, -20.26513671875, -19.663330078125, -19.0615234375, -18.459716796875, -17.85791015625, -17.256103515625, -16.654296875, -16.052490234375, -15.45068359375, -14.848876953125, -14.2470703125, -13.645263671875, -13.04345703125, -12.441650390625, -11.83984375, -11.238037109375, -10.63623046875, -10.034423828125, -9.4326171875, -8.830810546875, -8.22900390625, -7.627197265625, -7.025390625, -6.423583984375, -5.82177734375, -5.219970703125, -4.6181640625, -4.016357421875, -3.41455078125, -2.812744140625, -2.2109375, -1.609130859375, -1.00732421875, -0.405517578125, 0.1962890625, 0.798095703125, 1.39990234375, 2.001708984375, 2.603515625, 3.205322265625, 3.80712890625, 4.408935546875, 5.0107421875, 5.612548828125, 6.21435546875, 6.816162109375, 7.41796875, 8.019775390625, 8.62158203125, 9.223388671875, 9.8251953125, 10.427001953125, 11.02880859375, 11.630615234375, 12.232421875, 12.834228515625, 13.43603515625, 14.037841796875, 14.6396484375, 15.241455078125, 15.84326171875, 16.445068359375, 17.046875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 4.0, 6.0, 9.0, 10.0, 11.0, 19.0, 10.0, 12.0, 28.0, 39.0, 49.0, 70.0, 91.0, 156.0, 253.0, 506.0, 1023.0, 2720.0, 8317.0, 43147.0, 2194949.0, 854143.0, 29294.0, 6442.0, 2293.0, 907.0, 447.0, 240.0, 130.0, 96.0, 56.0, 43.0, 41.0, 30.0, 19.0, 20.0, 14.0, 15.0, 5.0, 7.0, 5.0, 9.0, 7.0, 5.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.40625, -26.42431640625, -25.4423828125, -24.46044921875, -23.478515625, -22.49658203125, -21.5146484375, -20.53271484375, -19.55078125, -18.56884765625, -17.5869140625, -16.60498046875, -15.623046875, -14.64111328125, -13.6591796875, -12.67724609375, -11.6953125, -10.71337890625, -9.7314453125, -8.74951171875, -7.767578125, -6.78564453125, -5.8037109375, -4.82177734375, -3.83984375, -2.85791015625, -1.8759765625, -0.89404296875, 0.087890625, 1.06982421875, 2.0517578125, 3.03369140625, 4.015625, 4.99755859375, 5.9794921875, 6.96142578125, 7.943359375, 8.92529296875, 9.9072265625, 10.88916015625, 11.87109375, 12.85302734375, 13.8349609375, 14.81689453125, 15.798828125, 16.78076171875, 17.7626953125, 18.74462890625, 19.7265625, 20.70849609375, 21.6904296875, 22.67236328125, 23.654296875, 24.63623046875, 25.6181640625, 26.60009765625, 27.58203125, 28.56396484375, 29.5458984375, 30.52783203125, 31.509765625, 32.49169921875, 33.4736328125, 34.45556640625, 35.4375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 10.0, 11.0, 29.0, 29.0, 46.0, 73.0, 117.0, 129.0, 115.0, 115.0, 97.0, 80.0, 59.0, 48.0, 22.0, 8.0, 9.0, 6.0, 1.0, 3.0, 0.0, 1.0], "bins": [-71.45100402832031, -70.0322494506836, -68.6135025024414, -67.19474792480469, -65.7760009765625, -64.35724639892578, -62.938499450683594, -61.51974868774414, -60.10099792480469, -58.682247161865234, -57.26349639892578, -55.84474563598633, -54.425994873046875, -53.00724411010742, -51.58849334716797, -50.169742584228516, -48.75099182128906, -47.33224105834961, -45.913490295410156, -44.4947395324707, -43.07598876953125, -41.6572380065918, -40.238487243652344, -38.81973648071289, -37.40098190307617, -35.98223114013672, -34.563480377197266, -33.14472961425781, -31.72597885131836, -30.307228088378906, -28.888477325439453, -27.4697265625, -26.05097770690918, -24.632226943969727, -23.213476181030273, -21.79472541809082, -20.375974655151367, -18.957223892211914, -17.538471221923828, -16.119720458984375, -14.700970649719238, -13.282219886779785, -11.863469123840332, -10.444717407226562, -9.02596664428711, -7.6072163581848145, -6.188465118408203, -4.76971435546875, -3.350963592529297, -1.9322127103805542, -0.5134618282318115, 0.9052891731262207, 2.324039936065674, 3.742790699005127, 5.161541938781738, 6.580292701721191, 7.9990434646606445, 9.417794227600098, 10.83654499053955, 12.25529670715332, 13.674047470092773, 15.092798233032227, 16.51154899597168, 17.930299758911133, 19.349050521850586]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 7.0, 6.0, 16.0, 10.0, 17.0, 18.0, 18.0, 17.0, 21.0, 26.0, 30.0, 23.0, 34.0, 34.0, 32.0, 40.0, 28.0, 34.0, 36.0, 36.0, 35.0, 47.0, 36.0, 40.0, 40.0, 35.0, 36.0, 31.0, 34.0, 31.0, 20.0, 25.0, 16.0, 16.0, 9.0, 12.0, 7.0, 7.0, 5.0, 7.0, 6.0, 5.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-57.27606201171875, -55.533939361572266, -53.79182052612305, -52.04969787597656, -50.307579040527344, -48.56545639038086, -46.823333740234375, -45.081214904785156, -43.33909225463867, -41.59696960449219, -39.85485076904297, -38.112728118896484, -36.37060546875, -34.62848663330078, -32.8863639831543, -31.144243240356445, -29.402122497558594, -27.660001754760742, -25.91788101196289, -24.175758361816406, -22.433637619018555, -20.691516876220703, -18.94939422607422, -17.207273483276367, -15.465152740478516, -13.723031997680664, -11.980910301208496, -10.238788604736328, -8.496667861938477, -6.754547119140625, -5.012425422668457, -3.270303726196289, -1.5281829833984375, 0.21393823623657227, 1.956059455871582, 3.698180675506592, 5.440301895141602, 7.182422637939453, 8.924544334411621, 10.666666030883789, 12.40878677368164, 14.150907516479492, 15.89302921295166, 17.635150909423828, 19.37727165222168, 21.11939239501953, 22.861515045166016, 24.603635787963867, 26.34575653076172, 28.08787727355957, 29.829998016357422, 31.572120666503906, 33.314239501953125, 35.05636215209961, 36.798484802246094, 38.54060363769531, 40.2827262878418, 42.02484893798828, 43.7669677734375, 45.509090423583984, 47.25121307373047, 48.99333190917969, 50.73545455932617, 52.477577209472656, 54.219696044921875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 4.0, 5.0, 2.0, 9.0, 9.0, 12.0, 14.0, 19.0, 28.0, 20.0, 26.0, 31.0, 23.0, 25.0, 36.0, 40.0, 34.0, 50.0, 41.0, 59.0, 43.0, 42.0, 36.0, 37.0, 34.0, 32.0, 40.0, 33.0, 26.0, 24.0, 25.0, 24.0, 26.0, 18.0, 16.0, 12.0, 6.0, 6.0, 4.0, 5.0, 8.0, 8.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.03515625, -6.8370361328125, -6.638916015625, -6.4407958984375, -6.24267578125, -6.0445556640625, -5.846435546875, -5.6483154296875, -5.4501953125, -5.2520751953125, -5.053955078125, -4.8558349609375, -4.65771484375, -4.4595947265625, -4.261474609375, -4.0633544921875, -3.865234375, -3.6671142578125, -3.468994140625, -3.2708740234375, -3.07275390625, -2.8746337890625, -2.676513671875, -2.4783935546875, -2.2802734375, -2.0821533203125, -1.884033203125, -1.6859130859375, -1.48779296875, -1.2896728515625, -1.091552734375, -0.8934326171875, -0.6953125, -0.4971923828125, -0.299072265625, -0.1009521484375, 0.09716796875, 0.2952880859375, 0.493408203125, 0.6915283203125, 0.8896484375, 1.0877685546875, 1.285888671875, 1.4840087890625, 1.68212890625, 1.8802490234375, 2.078369140625, 2.2764892578125, 2.474609375, 2.6727294921875, 2.870849609375, 3.0689697265625, 3.26708984375, 3.4652099609375, 3.663330078125, 3.8614501953125, 4.0595703125, 4.2576904296875, 4.455810546875, 4.6539306640625, 4.85205078125, 5.0501708984375, 5.248291015625, 5.4464111328125, 5.64453125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 8.0, 13.0, 18.0, 24.0, 34.0, 42.0, 62.0, 97.0, 159.0, 211.0, 365.0, 533.0, 866.0, 1494.0, 2693.0, 4783.0, 9357.0, 20046.0, 49415.0, 206343.0, 2092413.0, 1571433.0, 154918.0, 42346.0, 17741.0, 8435.0, 4417.0, 2365.0, 1331.0, 846.0, 527.0, 335.0, 180.0, 137.0, 87.0, 67.0, 38.0, 36.0, 16.0, 11.0, 14.0, 9.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.125, -16.552734375, -15.98046875, -15.408203125, -14.8359375, -14.263671875, -13.69140625, -13.119140625, -12.546875, -11.974609375, -11.40234375, -10.830078125, -10.2578125, -9.685546875, -9.11328125, -8.541015625, -7.96875, -7.396484375, -6.82421875, -6.251953125, -5.6796875, -5.107421875, -4.53515625, -3.962890625, -3.390625, -2.818359375, -2.24609375, -1.673828125, -1.1015625, -0.529296875, 0.04296875, 0.615234375, 1.1875, 1.759765625, 2.33203125, 2.904296875, 3.4765625, 4.048828125, 4.62109375, 5.193359375, 5.765625, 6.337890625, 6.91015625, 7.482421875, 8.0546875, 8.626953125, 9.19921875, 9.771484375, 10.34375, 10.916015625, 11.48828125, 12.060546875, 12.6328125, 13.205078125, 13.77734375, 14.349609375, 14.921875, 15.494140625, 16.06640625, 16.638671875, 17.2109375, 17.783203125, 18.35546875, 18.927734375, 19.5]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 1.0, 5.0, 4.0, 10.0, 11.0, 13.0, 14.0, 17.0, 36.0, 45.0, 45.0, 65.0, 95.0, 128.0, 181.0, 276.0, 419.0, 558.0, 613.0, 457.0, 336.0, 196.0, 151.0, 98.0, 82.0, 50.0, 44.0, 28.0, 26.0, 13.0, 20.0, 13.0, 4.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.265625, -16.712158203125, -16.15869140625, -15.605224609375, -15.0517578125, -14.498291015625, -13.94482421875, -13.391357421875, -12.837890625, -12.284423828125, -11.73095703125, -11.177490234375, -10.6240234375, -10.070556640625, -9.51708984375, -8.963623046875, -8.41015625, -7.856689453125, -7.30322265625, -6.749755859375, -6.1962890625, -5.642822265625, -5.08935546875, -4.535888671875, -3.982421875, -3.428955078125, -2.87548828125, -2.322021484375, -1.7685546875, -1.215087890625, -0.66162109375, -0.108154296875, 0.4453125, 0.998779296875, 1.55224609375, 2.105712890625, 2.6591796875, 3.212646484375, 3.76611328125, 4.319580078125, 4.873046875, 5.426513671875, 5.97998046875, 6.533447265625, 7.0869140625, 7.640380859375, 8.19384765625, 8.747314453125, 9.30078125, 9.854248046875, 10.40771484375, 10.961181640625, 11.5146484375, 12.068115234375, 12.62158203125, 13.175048828125, 13.728515625, 14.281982421875, 14.83544921875, 15.388916015625, 15.9423828125, 16.495849609375, 17.04931640625, 17.602783203125, 18.15625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 8.0, 25.0, 24.0, 44.0, 69.0, 99.0, 174.0, 252.0, 498.0, 813.0, 1450.0, 2621.0, 4954.0, 9908.0, 20682.0, 47786.0, 134025.0, 644431.0, 2510797.0, 599983.0, 129101.0, 46126.0, 20149.0, 9595.0, 4754.0, 2493.0, 1413.0, 788.0, 453.0, 296.0, 159.0, 117.0, 68.0, 46.0, 23.0, 24.0, 8.0, 7.0, 3.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.953125, -25.2216796875, -24.490234375, -23.7587890625, -23.02734375, -22.2958984375, -21.564453125, -20.8330078125, -20.1015625, -19.3701171875, -18.638671875, -17.9072265625, -17.17578125, -16.4443359375, -15.712890625, -14.9814453125, -14.25, -13.5185546875, -12.787109375, -12.0556640625, -11.32421875, -10.5927734375, -9.861328125, -9.1298828125, -8.3984375, -7.6669921875, -6.935546875, -6.2041015625, -5.47265625, -4.7412109375, -4.009765625, -3.2783203125, -2.546875, -1.8154296875, -1.083984375, -0.3525390625, 0.37890625, 1.1103515625, 1.841796875, 2.5732421875, 3.3046875, 4.0361328125, 4.767578125, 5.4990234375, 6.23046875, 6.9619140625, 7.693359375, 8.4248046875, 9.15625, 9.8876953125, 10.619140625, 11.3505859375, 12.08203125, 12.8134765625, 13.544921875, 14.2763671875, 15.0078125, 15.7392578125, 16.470703125, 17.2021484375, 17.93359375, 18.6650390625, 19.396484375, 20.1279296875, 20.859375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 6.0, 9.0, 11.0, 17.0, 22.0, 31.0, 40.0, 59.0, 58.0, 82.0, 93.0, 99.0, 87.0, 89.0, 81.0, 56.0, 53.0, 25.0, 21.0, 18.0, 14.0, 7.0, 7.0, 5.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.526580810546875, -48.63359451293945, -45.74060821533203, -42.84762191772461, -39.95463562011719, -37.061649322509766, -34.168663024902344, -31.275676727294922, -28.3826904296875, -25.489704132080078, -22.596717834472656, -19.703731536865234, -16.810745239257812, -13.91775894165039, -11.024772644042969, -8.131786346435547, -5.238800048828125, -2.345813751220703, 0.5471725463867188, 3.4401588439941406, 6.3331451416015625, 9.226131439208984, 12.119117736816406, 15.012104034423828, 17.90509033203125, 20.798076629638672, 23.691062927246094, 26.584049224853516, 29.477035522460938, 32.37002182006836, 35.26300811767578, 38.1559944152832, 41.048980712890625, 43.94196701049805, 46.83495330810547, 49.72793960571289, 52.62092590332031, 55.513912200927734, 58.406898498535156, 61.29988479614258, 64.19287109375, 67.08586120605469, 69.97884368896484, 72.871826171875, 75.76481628417969, 78.65780639648438, 81.55078887939453, 84.44377136230469, 87.33676147460938, 90.22975158691406, 93.12273406982422, 96.01571655273438, 98.90870666503906, 101.80169677734375, 104.6946792602539, 107.58766174316406, 110.48065185546875, 113.37364196777344, 116.2666244506836, 119.15960693359375, 122.05259704589844, 124.94558715820312, 127.83856964111328, 130.73155212402344, 133.62454223632812]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 6.0, 5.0, 11.0, 9.0, 6.0, 15.0, 20.0, 18.0, 24.0, 29.0, 31.0, 34.0, 40.0, 36.0, 53.0, 39.0, 54.0, 55.0, 57.0, 52.0, 45.0, 44.0, 43.0, 42.0, 40.0, 31.0, 21.0, 31.0, 28.0, 23.0, 16.0, 9.0, 8.0, 4.0, 7.0, 5.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.716678619384766, -57.68655014038086, -55.65642166137695, -53.62629318237305, -51.59616470336914, -49.566036224365234, -47.535911560058594, -45.50578308105469, -43.47565460205078, -41.445526123046875, -39.41539764404297, -37.38526916503906, -35.355140686035156, -33.32501220703125, -31.294885635375977, -29.26475715637207, -27.23462677001953, -25.204498291015625, -23.17436981201172, -21.144241333007812, -19.114112854003906, -17.083984375, -15.053857803344727, -13.02372932434082, -10.993600845336914, -8.963472366333008, -6.93334436416626, -4.903216361999512, -2.8730878829956055, -0.8429594039916992, 1.1871681213378906, 3.217296600341797, 5.247428894042969, 7.277557373046875, 9.307685852050781, 11.337813377380371, 13.367941856384277, 15.398070335388184, 17.428197860717773, 19.45832633972168, 21.488454818725586, 23.518583297729492, 25.5487117767334, 27.578838348388672, 29.608966827392578, 31.639095306396484, 33.66922378540039, 35.6993522644043, 37.7294807434082, 39.75960922241211, 41.789737701416016, 43.81986618041992, 45.84999465942383, 47.880123138427734, 49.910247802734375, 51.94037628173828, 53.97050476074219, 56.000633239746094, 58.03076171875, 60.060890197753906, 62.09101867675781, 64.12114715576172, 66.15127563476562, 68.18140411376953, 70.21153259277344]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 4.0, 10.0, 10.0, 7.0, 11.0, 13.0, 12.0, 12.0, 18.0, 22.0, 29.0, 38.0, 33.0, 28.0, 39.0, 34.0, 39.0, 52.0, 48.0, 44.0, 47.0, 41.0, 40.0, 34.0, 37.0, 31.0, 33.0, 36.0, 32.0, 18.0, 25.0, 20.0, 15.0, 17.0, 12.0, 13.0, 6.0, 7.0, 6.0, 6.0, 4.0, 4.0, 6.0, 2.0, 1.0, 0.0, 5.0], "bins": [-7.48046875, -7.2774658203125, -7.074462890625, -6.8714599609375, -6.66845703125, -6.4654541015625, -6.262451171875, -6.0594482421875, -5.8564453125, -5.6534423828125, -5.450439453125, -5.2474365234375, -5.04443359375, -4.8414306640625, -4.638427734375, -4.4354248046875, -4.232421875, -4.0294189453125, -3.826416015625, -3.6234130859375, -3.42041015625, -3.2174072265625, -3.014404296875, -2.8114013671875, -2.6083984375, -2.4053955078125, -2.202392578125, -1.9993896484375, -1.79638671875, -1.5933837890625, -1.390380859375, -1.1873779296875, -0.984375, -0.7813720703125, -0.578369140625, -0.3753662109375, -0.17236328125, 0.0306396484375, 0.233642578125, 0.4366455078125, 0.6396484375, 0.8426513671875, 1.045654296875, 1.2486572265625, 1.45166015625, 1.6546630859375, 1.857666015625, 2.0606689453125, 2.263671875, 2.4666748046875, 2.669677734375, 2.8726806640625, 3.07568359375, 3.2786865234375, 3.481689453125, 3.6846923828125, 3.8876953125, 4.0906982421875, 4.293701171875, 4.4967041015625, 4.69970703125, 4.9027099609375, 5.105712890625, 5.3087158203125, 5.51171875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 2.0, 6.0, 6.0, 25.0, 24.0, 33.0, 65.0, 62.0, 119.0, 186.0, 246.0, 371.0, 635.0, 848.0, 1303.0, 2130.0, 3310.0, 5220.0, 8614.0, 14124.0, 24186.0, 42488.0, 77162.0, 140210.0, 232712.0, 213107.0, 122195.0, 67094.0, 37190.0, 21456.0, 12674.0, 7682.0, 4643.0, 2939.0, 1820.0, 1265.0, 819.0, 507.0, 349.0, 220.0, 160.0, 113.0, 80.0, 52.0, 37.0, 29.0, 7.0, 10.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.150390625, -1.1131439208984375, -1.075897216796875, -1.0386505126953125, -1.00140380859375, -0.9641571044921875, -0.926910400390625, -0.8896636962890625, -0.8524169921875, -0.8151702880859375, -0.777923583984375, -0.7406768798828125, -0.70343017578125, -0.6661834716796875, -0.628936767578125, -0.5916900634765625, -0.554443359375, -0.5171966552734375, -0.479949951171875, -0.4427032470703125, -0.40545654296875, -0.3682098388671875, -0.330963134765625, -0.2937164306640625, -0.2564697265625, -0.2192230224609375, -0.181976318359375, -0.1447296142578125, -0.10748291015625, -0.0702362060546875, -0.032989501953125, 0.0042572021484375, 0.04150390625, 0.0787506103515625, 0.115997314453125, 0.1532440185546875, 0.19049072265625, 0.2277374267578125, 0.264984130859375, 0.3022308349609375, 0.3394775390625, 0.3767242431640625, 0.413970947265625, 0.4512176513671875, 0.48846435546875, 0.5257110595703125, 0.562957763671875, 0.6002044677734375, 0.637451171875, 0.6746978759765625, 0.711944580078125, 0.7491912841796875, 0.78643798828125, 0.8236846923828125, 0.860931396484375, 0.8981781005859375, 0.9354248046875, 0.9726715087890625, 1.009918212890625, 1.0471649169921875, 1.08441162109375, 1.1216583251953125, 1.158905029296875, 1.1961517333984375, 1.2333984375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 2.0, 7.0, 3.0, 5.0, 5.0, 10.0, 9.0, 16.0, 14.0, 16.0, 13.0, 19.0, 26.0, 24.0, 20.0, 30.0, 31.0, 29.0, 35.0, 26.0, 32.0, 39.0, 39.0, 34.0, 1057.0, 37.0, 40.0, 40.0, 32.0, 27.0, 30.0, 34.0, 25.0, 18.0, 21.0, 24.0, 22.0, 19.0, 23.0, 20.0, 18.0, 12.0, 11.0, 4.0, 4.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.626953125, -3.506256103515625, -3.38555908203125, -3.264862060546875, -3.1441650390625, -3.023468017578125, -2.90277099609375, -2.782073974609375, -2.661376953125, -2.540679931640625, -2.41998291015625, -2.299285888671875, -2.1785888671875, -2.057891845703125, -1.93719482421875, -1.816497802734375, -1.69580078125, -1.575103759765625, -1.45440673828125, -1.333709716796875, -1.2130126953125, -1.092315673828125, -0.97161865234375, -0.850921630859375, -0.730224609375, -0.609527587890625, -0.48883056640625, -0.368133544921875, -0.2474365234375, -0.126739501953125, -0.00604248046875, 0.114654541015625, 0.2353515625, 0.356048583984375, 0.47674560546875, 0.597442626953125, 0.7181396484375, 0.838836669921875, 0.95953369140625, 1.080230712890625, 1.200927734375, 1.321624755859375, 1.44232177734375, 1.563018798828125, 1.6837158203125, 1.804412841796875, 1.92510986328125, 2.045806884765625, 2.16650390625, 2.287200927734375, 2.40789794921875, 2.528594970703125, 2.6492919921875, 2.769989013671875, 2.89068603515625, 3.011383056640625, 3.132080078125, 3.252777099609375, 3.37347412109375, 3.494171142578125, 3.6148681640625, 3.735565185546875, 3.85626220703125, 3.976959228515625, 4.09765625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 8.0, 11.0, 11.0, 20.0, 27.0, 34.0, 56.0, 76.0, 101.0, 204.0, 271.0, 455.0, 733.0, 1111.0, 1890.0, 3352.0, 6129.0, 10973.0, 20779.0, 39234.0, 79302.0, 176744.0, 1143632.0, 360488.0, 126102.0, 58994.0, 30294.0, 15891.0, 8599.0, 4880.0, 2747.0, 1465.0, 935.0, 539.0, 353.0, 219.0, 129.0, 116.0, 63.0, 35.0, 32.0, 25.0, 20.0, 12.0, 6.0, 12.0, 6.0, 5.0, 7.0, 1.0, 0.0, 2.0], "bins": [-0.65234375, -0.6335983276367188, -0.6148529052734375, -0.5961074829101562, -0.577362060546875, -0.5586166381835938, -0.5398712158203125, -0.5211257934570312, -0.50238037109375, -0.48363494873046875, -0.4648895263671875, -0.44614410400390625, -0.427398681640625, -0.40865325927734375, -0.3899078369140625, -0.37116241455078125, -0.3524169921875, -0.33367156982421875, -0.3149261474609375, -0.29618072509765625, -0.277435302734375, -0.25868988037109375, -0.2399444580078125, -0.22119903564453125, -0.20245361328125, -0.18370819091796875, -0.1649627685546875, -0.14621734619140625, -0.127471923828125, -0.10872650146484375, -0.0899810791015625, -0.07123565673828125, -0.052490234375, -0.03374481201171875, -0.0149993896484375, 0.00374603271484375, 0.022491455078125, 0.04123687744140625, 0.0599822998046875, 0.07872772216796875, 0.09747314453125, 0.11621856689453125, 0.1349639892578125, 0.15370941162109375, 0.172454833984375, 0.19120025634765625, 0.2099456787109375, 0.22869110107421875, 0.2474365234375, 0.26618194580078125, 0.2849273681640625, 0.30367279052734375, 0.322418212890625, 0.34116363525390625, 0.3599090576171875, 0.37865447998046875, 0.39739990234375, 0.41614532470703125, 0.4348907470703125, 0.45363616943359375, 0.472381591796875, 0.49112701416015625, 0.5098724365234375, 0.5286178588867188, 0.54736328125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 5.0, 3.0, 13.0, 6.0, 15.0, 4.0, 16.0, 15.0, 16.0, 26.0, 24.0, 46.0, 50.0, 80.0, 138.0, 170.0, 80.0, 63.0, 48.0, 25.0, 26.0, 18.0, 19.0, 14.0, 14.0, 14.0, 4.0, 3.0, 9.0, 5.0, 3.0, 3.0, 1.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.267822265625, -0.2599773406982422, -0.2521324157714844, -0.24428749084472656, -0.23644256591796875, -0.22859764099121094, -0.22075271606445312, -0.2129077911376953, -0.2050628662109375, -0.1972179412841797, -0.18937301635742188, -0.18152809143066406, -0.17368316650390625, -0.16583824157714844, -0.15799331665039062, -0.1501483917236328, -0.142303466796875, -0.1344585418701172, -0.12661361694335938, -0.11876869201660156, -0.11092376708984375, -0.10307884216308594, -0.09523391723632812, -0.08738899230957031, -0.0795440673828125, -0.07169914245605469, -0.06385421752929688, -0.05600929260253906, -0.04816436767578125, -0.04031944274902344, -0.032474517822265625, -0.024629592895507812, -0.01678466796875, -0.008939743041992188, -0.001094818115234375, 0.0067501068115234375, 0.01459503173828125, 0.022439956665039062, 0.030284881591796875, 0.03812980651855469, 0.0459747314453125, 0.05381965637207031, 0.061664581298828125, 0.06950950622558594, 0.07735443115234375, 0.08519935607910156, 0.09304428100585938, 0.10088920593261719, 0.108734130859375, 0.11657905578613281, 0.12442398071289062, 0.13226890563964844, 0.14011383056640625, 0.14795875549316406, 0.15580368041992188, 0.1636486053466797, 0.1714935302734375, 0.1793384552001953, 0.18718338012695312, 0.19502830505371094, 0.20287322998046875, 0.21071815490722656, 0.21856307983398438, 0.2264080047607422, 0.2342529296875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 2.0, 4.0, 7.0, 9.0, 7.0, 5.0, 17.0, 27.0, 31.0, 36.0, 52.0, 81.0, 94.0, 194.0, 425.0, 3604.0, 948206.0, 93417.0, 1493.0, 319.0, 177.0, 99.0, 64.0, 36.0, 34.0, 26.0, 10.0, 17.0, 10.0, 12.0, 4.0, 6.0, 3.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.4765625, -4.32659912109375, -4.1766357421875, -4.02667236328125, -3.876708984375, -3.72674560546875, -3.5767822265625, -3.42681884765625, -3.27685546875, -3.12689208984375, -2.9769287109375, -2.82696533203125, -2.677001953125, -2.52703857421875, -2.3770751953125, -2.22711181640625, -2.0771484375, -1.92718505859375, -1.7772216796875, -1.62725830078125, -1.477294921875, -1.32733154296875, -1.1773681640625, -1.02740478515625, -0.87744140625, -0.72747802734375, -0.5775146484375, -0.42755126953125, -0.277587890625, -0.12762451171875, 0.0223388671875, 0.17230224609375, 0.322265625, 0.47222900390625, 0.6221923828125, 0.77215576171875, 0.922119140625, 1.07208251953125, 1.2220458984375, 1.37200927734375, 1.52197265625, 1.67193603515625, 1.8218994140625, 1.97186279296875, 2.121826171875, 2.27178955078125, 2.4217529296875, 2.57171630859375, 2.7216796875, 2.87164306640625, 3.0216064453125, 3.17156982421875, 3.321533203125, 3.47149658203125, 3.6214599609375, 3.77142333984375, 3.92138671875, 4.07135009765625, 4.2213134765625, 4.37127685546875, 4.521240234375, 4.67120361328125, 4.8211669921875, 4.97113037109375, 5.12109375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 7.0, 8.0, 19.0, 26.0, 59.0, 90.0, 237.0, 310.0, 116.0, 60.0, 32.0, 20.0, 9.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3423917293548584, -1.3018056154251099, -1.2612195014953613, -1.2206332683563232, -1.1800471544265747, -1.1394610404968262, -1.0988749265670776, -1.058288812637329, -1.017702579498291, -0.9771164655685425, -0.9365302920341492, -0.8959441781044006, -0.8553580045700073, -0.8147718906402588, -0.7741857767105103, -0.7335996627807617, -0.6930135488510132, -0.6524274349212646, -0.6118412613868713, -0.5712551474571228, -0.5306689739227295, -0.49008285999298096, -0.4494967460632324, -0.4089106023311615, -0.3683244585990906, -0.32773831486701965, -0.28715217113494873, -0.2465660572052002, -0.20597991347312927, -0.16539376974105835, -0.12480764091014862, -0.08422151207923889, -0.04363536834716797, -0.003049232065677643, 0.03753690421581268, 0.07812304049730301, 0.11870917677879333, 0.15929532051086426, 0.199881449341774, 0.24046757817268372, 0.28105372190475464, 0.32163986563682556, 0.3622260093688965, 0.402812123298645, 0.44339826703071594, 0.48398441076278687, 0.5245705246925354, 0.5651566982269287, 0.6057428121566772, 0.6463289260864258, 0.6869150996208191, 0.7275012135505676, 0.7680873870849609, 0.8086735010147095, 0.849259614944458, 0.8898457288742065, 0.9304319024085999, 0.9710180163383484, 1.0116041898727417, 1.0521903038024902, 1.0927764177322388, 1.1333625316619873, 1.1739487648010254, 1.214534878730774, 1.2551209926605225]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 8.0, 7.0, 1.0, 4.0, 3.0, 3.0, 11.0, 9.0, 20.0, 19.0, 19.0, 22.0, 10.0, 22.0, 28.0, 20.0, 27.0, 44.0, 27.0, 35.0, 38.0, 50.0, 48.0, 48.0, 31.0, 40.0, 33.0, 49.0, 38.0, 31.0, 45.0, 20.0, 27.0, 16.0, 21.0, 23.0, 23.0, 20.0, 13.0, 11.0, 10.0, 7.0, 5.0, 8.0, 5.0, 5.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0], "bins": [-0.7208524346351624, -0.7001281976699829, -0.6794039607048035, -0.658679723739624, -0.6379554867744446, -0.6172312498092651, -0.5965070128440857, -0.5757827758789062, -0.5550585389137268, -0.5343343019485474, -0.5136100649833679, -0.4928858280181885, -0.47216159105300903, -0.4514373540878296, -0.43071311712265015, -0.4099888801574707, -0.38926464319229126, -0.3685404062271118, -0.3478161692619324, -0.32709193229675293, -0.3063676953315735, -0.28564345836639404, -0.2649192214012146, -0.24419498443603516, -0.2234707474708557, -0.20274651050567627, -0.18202227354049683, -0.16129803657531738, -0.14057379961013794, -0.1198495626449585, -0.09912532567977905, -0.07840108871459961, -0.057676851749420166, -0.03695261478424072, -0.01622837781906128, 0.004495859146118164, 0.025220096111297607, 0.04594433307647705, 0.0666685700416565, 0.08739280700683594, 0.10811704397201538, 0.12884128093719482, 0.14956551790237427, 0.1702897548675537, 0.19101399183273315, 0.2117382287979126, 0.23246246576309204, 0.2531867027282715, 0.2739109396934509, 0.29463517665863037, 0.3153594136238098, 0.33608365058898926, 0.3568078875541687, 0.37753212451934814, 0.3982563614845276, 0.41898059844970703, 0.4397048354148865, 0.4604290723800659, 0.48115330934524536, 0.5018775463104248, 0.5226017832756042, 0.5433260202407837, 0.5640502572059631, 0.5847744941711426, 0.605498731136322]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 10.0, 7.0, 10.0, 13.0, 11.0, 10.0, 13.0, 18.0, 22.0, 29.0, 37.0, 34.0, 30.0, 35.0, 35.0, 41.0, 55.0, 45.0, 44.0, 47.0, 41.0, 40.0, 35.0, 39.0, 28.0, 35.0, 35.0, 33.0, 17.0, 27.0, 17.0, 16.0, 17.0, 10.0, 14.0, 7.0, 6.0, 7.0, 5.0, 4.0, 4.0, 7.0, 1.0, 1.0, 1.0, 4.0], "bins": [-7.50390625, -7.30023193359375, -7.0965576171875, -6.89288330078125, -6.689208984375, -6.48553466796875, -6.2818603515625, -6.07818603515625, -5.87451171875, -5.67083740234375, -5.4671630859375, -5.26348876953125, -5.059814453125, -4.85614013671875, -4.6524658203125, -4.44879150390625, -4.2451171875, -4.04144287109375, -3.8377685546875, -3.63409423828125, -3.430419921875, -3.22674560546875, -3.0230712890625, -2.81939697265625, -2.61572265625, -2.41204833984375, -2.2083740234375, -2.00469970703125, -1.801025390625, -1.59735107421875, -1.3936767578125, -1.19000244140625, -0.986328125, -0.78265380859375, -0.5789794921875, -0.37530517578125, -0.171630859375, 0.03204345703125, 0.2357177734375, 0.43939208984375, 0.64306640625, 0.84674072265625, 1.0504150390625, 1.25408935546875, 1.457763671875, 1.66143798828125, 1.8651123046875, 2.06878662109375, 2.2724609375, 2.47613525390625, 2.6798095703125, 2.88348388671875, 3.087158203125, 3.29083251953125, 3.4945068359375, 3.69818115234375, 3.90185546875, 4.10552978515625, 4.3092041015625, 4.51287841796875, 4.716552734375, 4.92022705078125, 5.1239013671875, 5.32757568359375, 5.53125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 12.0, 9.0, 10.0, 19.0, 16.0, 21.0, 40.0, 56.0, 66.0, 98.0, 148.0, 191.0, 258.0, 352.0, 500.0, 627.0, 924.0, 1297.0, 1945.0, 2902.0, 4716.0, 7849.0, 16736.0, 49871.0, 231793.0, 527118.0, 135576.0, 33800.0, 12692.0, 6528.0, 3917.0, 2574.0, 1710.0, 1185.0, 823.0, 614.0, 396.0, 312.0, 256.0, 143.0, 115.0, 75.0, 65.0, 47.0, 41.0, 30.0, 26.0, 16.0, 18.0, 11.0, 6.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-8.5234375, -8.25146484375, -7.9794921875, -7.70751953125, -7.435546875, -7.16357421875, -6.8916015625, -6.61962890625, -6.34765625, -6.07568359375, -5.8037109375, -5.53173828125, -5.259765625, -4.98779296875, -4.7158203125, -4.44384765625, -4.171875, -3.89990234375, -3.6279296875, -3.35595703125, -3.083984375, -2.81201171875, -2.5400390625, -2.26806640625, -1.99609375, -1.72412109375, -1.4521484375, -1.18017578125, -0.908203125, -0.63623046875, -0.3642578125, -0.09228515625, 0.1796875, 0.45166015625, 0.7236328125, 0.99560546875, 1.267578125, 1.53955078125, 1.8115234375, 2.08349609375, 2.35546875, 2.62744140625, 2.8994140625, 3.17138671875, 3.443359375, 3.71533203125, 3.9873046875, 4.25927734375, 4.53125, 4.80322265625, 5.0751953125, 5.34716796875, 5.619140625, 5.89111328125, 6.1630859375, 6.43505859375, 6.70703125, 6.97900390625, 7.2509765625, 7.52294921875, 7.794921875, 8.06689453125, 8.3388671875, 8.61083984375, 8.8828125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 0.0, 5.0, 5.0, 2.0, 12.0, 11.0, 7.0, 10.0, 15.0, 14.0, 24.0, 13.0, 22.0, 24.0, 30.0, 30.0, 36.0, 35.0, 37.0, 47.0, 45.0, 87.0, 225.0, 1492.0, 271.0, 91.0, 48.0, 51.0, 37.0, 32.0, 39.0, 34.0, 37.0, 22.0, 19.0, 15.0, 24.0, 15.0, 15.0, 10.0, 12.0, 11.0, 15.0, 5.0, 8.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.9375, -17.331298828125, -16.72509765625, -16.118896484375, -15.5126953125, -14.906494140625, -14.30029296875, -13.694091796875, -13.087890625, -12.481689453125, -11.87548828125, -11.269287109375, -10.6630859375, -10.056884765625, -9.45068359375, -8.844482421875, -8.23828125, -7.632080078125, -7.02587890625, -6.419677734375, -5.8134765625, -5.207275390625, -4.60107421875, -3.994873046875, -3.388671875, -2.782470703125, -2.17626953125, -1.570068359375, -0.9638671875, -0.357666015625, 0.24853515625, 0.854736328125, 1.4609375, 2.067138671875, 2.67333984375, 3.279541015625, 3.8857421875, 4.491943359375, 5.09814453125, 5.704345703125, 6.310546875, 6.916748046875, 7.52294921875, 8.129150390625, 8.7353515625, 9.341552734375, 9.94775390625, 10.553955078125, 11.16015625, 11.766357421875, 12.37255859375, 12.978759765625, 13.5849609375, 14.191162109375, 14.79736328125, 15.403564453125, 16.009765625, 16.615966796875, 17.22216796875, 17.828369140625, 18.4345703125, 19.040771484375, 19.64697265625, 20.253173828125, 20.859375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 4.0, 4.0, 5.0, 6.0, 4.0, 13.0, 11.0, 14.0, 10.0, 15.0, 21.0, 19.0, 25.0, 33.0, 41.0, 59.0, 103.0, 115.0, 185.0, 288.0, 517.0, 1079.0, 3037.0, 14597.0, 434921.0, 2652179.0, 30305.0, 4885.0, 1446.0, 681.0, 368.0, 208.0, 110.0, 102.0, 56.0, 59.0, 34.0, 30.0, 30.0, 18.0, 16.0, 7.0, 8.0, 10.0, 14.0, 3.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-39.34375, -38.1923828125, -37.041015625, -35.8896484375, -34.73828125, -33.5869140625, -32.435546875, -31.2841796875, -30.1328125, -28.9814453125, -27.830078125, -26.6787109375, -25.52734375, -24.3759765625, -23.224609375, -22.0732421875, -20.921875, -19.7705078125, -18.619140625, -17.4677734375, -16.31640625, -15.1650390625, -14.013671875, -12.8623046875, -11.7109375, -10.5595703125, -9.408203125, -8.2568359375, -7.10546875, -5.9541015625, -4.802734375, -3.6513671875, -2.5, -1.3486328125, -0.197265625, 0.9541015625, 2.10546875, 3.2568359375, 4.408203125, 5.5595703125, 6.7109375, 7.8623046875, 9.013671875, 10.1650390625, 11.31640625, 12.4677734375, 13.619140625, 14.7705078125, 15.921875, 17.0732421875, 18.224609375, 19.3759765625, 20.52734375, 21.6787109375, 22.830078125, 23.9814453125, 25.1328125, 26.2841796875, 27.435546875, 28.5869140625, 29.73828125, 30.8896484375, 32.041015625, 33.1923828125, 34.34375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 793.0, 217.0, 2.0], "bins": [-854.281005859375, -840.447265625, -826.6135864257812, -812.7798461914062, -798.9461669921875, -785.1124267578125, -771.2787475585938, -757.4450073242188, -743.611328125, -729.777587890625, -715.9439086914062, -702.1101684570312, -688.2764892578125, -674.4427490234375, -660.6090698242188, -646.7753295898438, -632.9415893554688, -619.1078491210938, -605.274169921875, -591.4404296875, -577.6067504882812, -563.7730102539062, -549.9393310546875, -536.1055908203125, -522.2718505859375, -508.4381408691406, -494.60443115234375, -480.7707214355469, -466.93701171875, -453.103271484375, -439.2695617675781, -425.43585205078125, -411.6021423339844, -397.7684326171875, -383.9347229003906, -370.10101318359375, -356.26727294921875, -342.43359375, -328.599853515625, -314.7661437988281, -300.93243408203125, -287.0987243652344, -273.2650146484375, -259.4313049316406, -245.5975799560547, -231.7638702392578, -217.93014526367188, -204.096435546875, -190.2627410888672, -176.4290313720703, -162.59530639648438, -148.7615966796875, -134.92788696289062, -121.09417724609375, -107.26045989990234, -93.42674255371094, -79.59302520751953, -65.75930786132812, -51.92559814453125, -38.09188461303711, -24.25817108154297, -10.424461364746094, 3.4092559814453125, 17.24297332763672, 31.07668113708496]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 8.0, 3.0, 9.0, 8.0, 14.0, 19.0, 15.0, 15.0, 17.0, 17.0, 28.0, 19.0, 26.0, 40.0, 33.0, 37.0, 33.0, 42.0, 47.0, 47.0, 31.0, 45.0, 24.0, 19.0, 42.0, 25.0, 38.0, 34.0, 28.0, 30.0, 26.0, 20.0, 25.0, 14.0, 23.0, 13.0, 9.0, 10.0, 6.0, 11.0, 14.0, 8.0, 4.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-47.142913818359375, -45.61171340942383, -44.08051300048828, -42.549312591552734, -41.01811218261719, -39.48691177368164, -37.955711364746094, -36.42450714111328, -34.893310546875, -33.36211013793945, -31.830909729003906, -30.29970932006836, -28.768508911132812, -27.237308502197266, -25.706106185913086, -24.17490577697754, -22.64370346069336, -21.112503051757812, -19.581302642822266, -18.05010223388672, -16.518901824951172, -14.987700462341309, -13.456499099731445, -11.925298690795898, -10.394098281860352, -8.862897872924805, -7.3316969871521, -5.8004961013793945, -4.269295692443848, -2.738095283508301, -1.2068939208984375, 0.3243064880371094, 1.8555068969726562, 3.3867075443267822, 4.917908191680908, 6.449109077453613, 7.98030948638916, 9.511509895324707, 11.04271125793457, 12.573911666870117, 14.105112075805664, 15.636312484741211, 17.167512893676758, 18.698715209960938, 20.229915618896484, 21.76111602783203, 23.292316436767578, 24.823516845703125, 26.354717254638672, 27.88591766357422, 29.417118072509766, 30.948318481445312, 32.47951889038086, 34.010719299316406, 35.54192352294922, 37.0731201171875, 38.60432434082031, 40.13552474975586, 41.666725158691406, 43.19792556762695, 44.7291259765625, 46.26032638549805, 47.791526794433594, 49.322731018066406, 50.85392761230469]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 2.0, 4.0, 15.0, 8.0, 10.0, 6.0, 10.0, 12.0, 10.0, 20.0, 29.0, 25.0, 30.0, 36.0, 32.0, 27.0, 37.0, 37.0, 37.0, 65.0, 54.0, 63.0, 30.0, 43.0, 33.0, 34.0, 40.0, 34.0, 35.0, 20.0, 29.0, 26.0, 13.0, 14.0, 15.0, 15.0, 11.0, 7.0, 8.0, 5.0, 4.0, 8.0, 1.0, 6.0, 2.0, 0.0, 1.0, 2.0], "bins": [-7.80859375, -7.5965576171875, -7.384521484375, -7.1724853515625, -6.96044921875, -6.7484130859375, -6.536376953125, -6.3243408203125, -6.1123046875, -5.9002685546875, -5.688232421875, -5.4761962890625, -5.26416015625, -5.0521240234375, -4.840087890625, -4.6280517578125, -4.416015625, -4.2039794921875, -3.991943359375, -3.7799072265625, -3.56787109375, -3.3558349609375, -3.143798828125, -2.9317626953125, -2.7197265625, -2.5076904296875, -2.295654296875, -2.0836181640625, -1.87158203125, -1.6595458984375, -1.447509765625, -1.2354736328125, -1.0234375, -0.8114013671875, -0.599365234375, -0.3873291015625, -0.17529296875, 0.0367431640625, 0.248779296875, 0.4608154296875, 0.6728515625, 0.8848876953125, 1.096923828125, 1.3089599609375, 1.52099609375, 1.7330322265625, 1.945068359375, 2.1571044921875, 2.369140625, 2.5811767578125, 2.793212890625, 3.0052490234375, 3.21728515625, 3.4293212890625, 3.641357421875, 3.8533935546875, 4.0654296875, 4.2774658203125, 4.489501953125, 4.7015380859375, 4.91357421875, 5.1256103515625, 5.337646484375, 5.5496826171875, 5.76171875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 8.0, 5.0, 14.0, 12.0, 26.0, 44.0, 47.0, 85.0, 114.0, 189.0, 276.0, 559.0, 970.0, 1831.0, 3765.0, 8287.0, 20583.0, 64948.0, 556522.0, 3144163.0, 311988.0, 49479.0, 16786.0, 6747.0, 3196.0, 1577.0, 837.0, 474.0, 267.0, 161.0, 105.0, 57.0, 53.0, 29.0, 22.0, 16.0, 12.0, 6.0, 7.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.890625, -25.115478515625, -24.34033203125, -23.565185546875, -22.7900390625, -22.014892578125, -21.23974609375, -20.464599609375, -19.689453125, -18.914306640625, -18.13916015625, -17.364013671875, -16.5888671875, -15.813720703125, -15.03857421875, -14.263427734375, -13.48828125, -12.713134765625, -11.93798828125, -11.162841796875, -10.3876953125, -9.612548828125, -8.83740234375, -8.062255859375, -7.287109375, -6.511962890625, -5.73681640625, -4.961669921875, -4.1865234375, -3.411376953125, -2.63623046875, -1.861083984375, -1.0859375, -0.310791015625, 0.46435546875, 1.239501953125, 2.0146484375, 2.789794921875, 3.56494140625, 4.340087890625, 5.115234375, 5.890380859375, 6.66552734375, 7.440673828125, 8.2158203125, 8.990966796875, 9.76611328125, 10.541259765625, 11.31640625, 12.091552734375, 12.86669921875, 13.641845703125, 14.4169921875, 15.192138671875, 15.96728515625, 16.742431640625, 17.517578125, 18.292724609375, 19.06787109375, 19.843017578125, 20.6181640625, 21.393310546875, 22.16845703125, 22.943603515625, 23.71875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 1.0, 3.0, 13.0, 8.0, 19.0, 26.0, 38.0, 73.0, 79.0, 140.0, 240.0, 426.0, 718.0, 856.0, 604.0, 322.0, 198.0, 126.0, 56.0, 42.0, 29.0, 19.0, 12.0, 12.0, 5.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.234375, -20.426025390625, -19.61767578125, -18.809326171875, -18.0009765625, -17.192626953125, -16.38427734375, -15.575927734375, -14.767578125, -13.959228515625, -13.15087890625, -12.342529296875, -11.5341796875, -10.725830078125, -9.91748046875, -9.109130859375, -8.30078125, -7.492431640625, -6.68408203125, -5.875732421875, -5.0673828125, -4.259033203125, -3.45068359375, -2.642333984375, -1.833984375, -1.025634765625, -0.21728515625, 0.591064453125, 1.3994140625, 2.207763671875, 3.01611328125, 3.824462890625, 4.6328125, 5.441162109375, 6.24951171875, 7.057861328125, 7.8662109375, 8.674560546875, 9.48291015625, 10.291259765625, 11.099609375, 11.907958984375, 12.71630859375, 13.524658203125, 14.3330078125, 15.141357421875, 15.94970703125, 16.758056640625, 17.56640625, 18.374755859375, 19.18310546875, 19.991455078125, 20.7998046875, 21.608154296875, 22.41650390625, 23.224853515625, 24.033203125, 24.841552734375, 25.64990234375, 26.458251953125, 27.2666015625, 28.074951171875, 28.88330078125, 29.691650390625, 30.5]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 7.0, 16.0, 17.0, 36.0, 54.0, 114.0, 168.0, 381.0, 981.0, 2916.0, 11145.0, 60151.0, 947518.0, 3013689.0, 130292.0, 19545.0, 4642.0, 1500.0, 534.0, 237.0, 140.0, 63.0, 55.0, 23.0, 21.0, 10.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.625, -55.06005859375, -53.4951171875, -51.93017578125, -50.365234375, -48.80029296875, -47.2353515625, -45.67041015625, -44.10546875, -42.54052734375, -40.9755859375, -39.41064453125, -37.845703125, -36.28076171875, -34.7158203125, -33.15087890625, -31.5859375, -30.02099609375, -28.4560546875, -26.89111328125, -25.326171875, -23.76123046875, -22.1962890625, -20.63134765625, -19.06640625, -17.50146484375, -15.9365234375, -14.37158203125, -12.806640625, -11.24169921875, -9.6767578125, -8.11181640625, -6.546875, -4.98193359375, -3.4169921875, -1.85205078125, -0.287109375, 1.27783203125, 2.8427734375, 4.40771484375, 5.97265625, 7.53759765625, 9.1025390625, 10.66748046875, 12.232421875, 13.79736328125, 15.3623046875, 16.92724609375, 18.4921875, 20.05712890625, 21.6220703125, 23.18701171875, 24.751953125, 26.31689453125, 27.8818359375, 29.44677734375, 31.01171875, 32.57666015625, 34.1416015625, 35.70654296875, 37.271484375, 38.83642578125, 40.4013671875, 41.96630859375, 43.53125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 5.0, 7.0, 13.0, 13.0, 19.0, 21.0, 33.0, 39.0, 57.0, 61.0, 61.0, 85.0, 83.0, 77.0, 88.0, 64.0, 79.0, 45.0, 38.0, 33.0, 16.0, 26.0, 16.0, 10.0, 7.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-98.3864974975586, -95.80854797363281, -93.23059844970703, -90.65264892578125, -88.07469940185547, -85.49674987792969, -82.9188003540039, -80.34085083007812, -77.76290130615234, -75.18495178222656, -72.60700225830078, -70.029052734375, -67.45110321044922, -64.87315368652344, -62.295204162597656, -59.717254638671875, -57.139305114746094, -54.56135559082031, -51.98340606689453, -49.40545654296875, -46.82750701904297, -44.24955749511719, -41.671607971191406, -39.093658447265625, -36.515708923339844, -33.93775939941406, -31.35980987548828, -28.7818603515625, -26.20391082763672, -23.625961303710938, -21.048011779785156, -18.470062255859375, -15.892112731933594, -13.314163208007812, -10.736213684082031, -8.15826416015625, -5.580314636230469, -3.0023651123046875, -0.42441558837890625, 2.153533935546875, 4.731483459472656, 7.3094329833984375, 9.887382507324219, 12.46533203125, 15.043281555175781, 17.621231079101562, 20.199180603027344, 22.777130126953125, 25.355079650878906, 27.933029174804688, 30.51097869873047, 33.08892822265625, 35.66687774658203, 38.24482727050781, 40.822776794433594, 43.400726318359375, 45.978675842285156, 48.55662536621094, 51.13457489013672, 53.7125244140625, 56.29047393798828, 58.86842346191406, 61.446372985839844, 64.02432250976562, 66.6022720336914]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 8.0, 3.0, 7.0, 10.0, 13.0, 9.0, 11.0, 10.0, 14.0, 11.0, 20.0, 19.0, 22.0, 33.0, 31.0, 30.0, 37.0, 37.0, 37.0, 29.0, 41.0, 47.0, 38.0, 45.0, 34.0, 27.0, 34.0, 36.0, 42.0, 21.0, 33.0, 26.0, 23.0, 20.0, 24.0, 15.0, 20.0, 19.0, 12.0, 9.0, 14.0, 12.0, 7.0, 4.0, 1.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.45613098144531, -48.80888366699219, -47.16163635253906, -45.51438903808594, -43.86714172363281, -42.21989440917969, -40.57264709472656, -38.92539978027344, -37.27815246582031, -35.63090515136719, -33.98365783691406, -32.33641052246094, -30.689163208007812, -29.041915893554688, -27.39466667175293, -25.747419357299805, -24.100170135498047, -22.452922821044922, -20.805675506591797, -19.158428192138672, -17.511180877685547, -15.863932609558105, -14.216684341430664, -12.569437026977539, -10.922189712524414, -9.274942398071289, -7.627694606781006, -5.980446815490723, -4.333199501037598, -2.6859521865844727, -1.0387039184570312, 0.6085433959960938, 2.2557907104492188, 3.903038263320923, 5.550285816192627, 7.19753360748291, 8.844780921936035, 10.49202823638916, 12.139276504516602, 13.786523818969727, 15.433771133422852, 17.081018447875977, 18.7282657623291, 20.37551498413086, 22.022762298583984, 23.67000961303711, 25.317256927490234, 26.96450424194336, 28.611751556396484, 30.25899887084961, 31.906246185302734, 33.55349349975586, 35.200740814208984, 36.84798812866211, 38.4952392578125, 40.142486572265625, 41.78973388671875, 43.436981201171875, 45.084228515625, 46.731475830078125, 48.37872314453125, 50.025970458984375, 51.6732177734375, 53.320465087890625, 54.96771240234375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 9.0, 3.0, 3.0, 9.0, 11.0, 7.0, 12.0, 8.0, 12.0, 9.0, 15.0, 20.0, 20.0, 32.0, 24.0, 26.0, 33.0, 41.0, 41.0, 49.0, 38.0, 45.0, 48.0, 33.0, 47.0, 39.0, 40.0, 41.0, 29.0, 24.0, 34.0, 33.0, 27.0, 26.0, 21.0, 15.0, 15.0, 10.0, 10.0, 10.0, 7.0, 6.0, 7.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0], "bins": [-7.6953125, -7.48626708984375, -7.2772216796875, -7.06817626953125, -6.859130859375, -6.65008544921875, -6.4410400390625, -6.23199462890625, -6.02294921875, -5.81390380859375, -5.6048583984375, -5.39581298828125, -5.186767578125, -4.97772216796875, -4.7686767578125, -4.55963134765625, -4.3505859375, -4.14154052734375, -3.9324951171875, -3.72344970703125, -3.514404296875, -3.30535888671875, -3.0963134765625, -2.88726806640625, -2.67822265625, -2.46917724609375, -2.2601318359375, -2.05108642578125, -1.842041015625, -1.63299560546875, -1.4239501953125, -1.21490478515625, -1.005859375, -0.79681396484375, -0.5877685546875, -0.37872314453125, -0.169677734375, 0.03936767578125, 0.2484130859375, 0.45745849609375, 0.66650390625, 0.87554931640625, 1.0845947265625, 1.29364013671875, 1.502685546875, 1.71173095703125, 1.9207763671875, 2.12982177734375, 2.3388671875, 2.54791259765625, 2.7569580078125, 2.96600341796875, 3.175048828125, 3.38409423828125, 3.5931396484375, 3.80218505859375, 4.01123046875, 4.22027587890625, 4.4293212890625, 4.63836669921875, 4.847412109375, 5.05645751953125, 5.2655029296875, 5.47454833984375, 5.68359375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 8.0, 14.0, 16.0, 19.0, 40.0, 60.0, 80.0, 134.0, 201.0, 368.0, 569.0, 917.0, 1605.0, 2521.0, 4078.0, 6978.0, 12025.0, 21066.0, 38319.0, 72346.0, 139654.0, 247485.0, 229488.0, 124483.0, 65094.0, 34856.0, 19083.0, 10968.0, 6290.0, 3803.0, 2325.0, 1439.0, 849.0, 496.0, 338.0, 202.0, 121.0, 74.0, 56.0, 28.0, 12.0, 11.0, 14.0, 6.0, 7.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.140625, -1.103729248046875, -1.06683349609375, -1.029937744140625, -0.9930419921875, -0.956146240234375, -0.91925048828125, -0.882354736328125, -0.845458984375, -0.808563232421875, -0.77166748046875, -0.734771728515625, -0.6978759765625, -0.660980224609375, -0.62408447265625, -0.587188720703125, -0.55029296875, -0.513397216796875, -0.47650146484375, -0.439605712890625, -0.4027099609375, -0.365814208984375, -0.32891845703125, -0.292022705078125, -0.255126953125, -0.218231201171875, -0.18133544921875, -0.144439697265625, -0.1075439453125, -0.070648193359375, -0.03375244140625, 0.003143310546875, 0.0400390625, 0.076934814453125, 0.11383056640625, 0.150726318359375, 0.1876220703125, 0.224517822265625, 0.26141357421875, 0.298309326171875, 0.335205078125, 0.372100830078125, 0.40899658203125, 0.445892333984375, 0.4827880859375, 0.519683837890625, 0.55657958984375, 0.593475341796875, 0.63037109375, 0.667266845703125, 0.70416259765625, 0.741058349609375, 0.7779541015625, 0.814849853515625, 0.85174560546875, 0.888641357421875, 0.925537109375, 0.962432861328125, 0.99932861328125, 1.036224365234375, 1.0731201171875, 1.110015869140625, 1.14691162109375, 1.183807373046875, 1.220703125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 5.0, 9.0, 10.0, 6.0, 21.0, 19.0, 18.0, 22.0, 27.0, 16.0, 21.0, 25.0, 26.0, 20.0, 47.0, 48.0, 34.0, 43.0, 42.0, 1066.0, 44.0, 36.0, 31.0, 25.0, 47.0, 44.0, 30.0, 26.0, 31.0, 24.0, 24.0, 18.0, 17.0, 19.0, 16.0, 11.0, 7.0, 7.0, 5.0, 3.0, 9.0, 3.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.37890625, -4.24139404296875, -4.1038818359375, -3.96636962890625, -3.828857421875, -3.69134521484375, -3.5538330078125, -3.41632080078125, -3.27880859375, -3.14129638671875, -3.0037841796875, -2.86627197265625, -2.728759765625, -2.59124755859375, -2.4537353515625, -2.31622314453125, -2.1787109375, -2.04119873046875, -1.9036865234375, -1.76617431640625, -1.628662109375, -1.49114990234375, -1.3536376953125, -1.21612548828125, -1.07861328125, -0.94110107421875, -0.8035888671875, -0.66607666015625, -0.528564453125, -0.39105224609375, -0.2535400390625, -0.11602783203125, 0.021484375, 0.15899658203125, 0.2965087890625, 0.43402099609375, 0.571533203125, 0.70904541015625, 0.8465576171875, 0.98406982421875, 1.12158203125, 1.25909423828125, 1.3966064453125, 1.53411865234375, 1.671630859375, 1.80914306640625, 1.9466552734375, 2.08416748046875, 2.2216796875, 2.35919189453125, 2.4967041015625, 2.63421630859375, 2.771728515625, 2.90924072265625, 3.0467529296875, 3.18426513671875, 3.32177734375, 3.45928955078125, 3.5968017578125, 3.73431396484375, 3.871826171875, 4.00933837890625, 4.1468505859375, 4.28436279296875, 4.421875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 11.0, 17.0, 19.0, 33.0, 55.0, 60.0, 113.0, 163.0, 210.0, 312.0, 432.0, 629.0, 1027.0, 1663.0, 2398.0, 3921.0, 6175.0, 9613.0, 15854.0, 25496.0, 42040.0, 70857.0, 120373.0, 287802.0, 1138285.0, 149152.0, 86457.0, 51826.0, 30916.0, 19062.0, 11650.0, 7396.0, 4564.0, 2889.0, 1919.0, 1232.0, 817.0, 564.0, 367.0, 247.0, 180.0, 97.0, 74.0, 44.0, 36.0, 24.0, 21.0, 18.0, 6.0, 4.0, 3.0, 5.0, 1.0, 2.0], "bins": [-0.4111328125, -0.39910888671875, -0.3870849609375, -0.37506103515625, -0.363037109375, -0.35101318359375, -0.3389892578125, -0.32696533203125, -0.31494140625, -0.30291748046875, -0.2908935546875, -0.27886962890625, -0.266845703125, -0.25482177734375, -0.2427978515625, -0.23077392578125, -0.21875, -0.20672607421875, -0.1947021484375, -0.18267822265625, -0.170654296875, -0.15863037109375, -0.1466064453125, -0.13458251953125, -0.12255859375, -0.11053466796875, -0.0985107421875, -0.08648681640625, -0.074462890625, -0.06243896484375, -0.0504150390625, -0.03839111328125, -0.0263671875, -0.01434326171875, -0.0023193359375, 0.00970458984375, 0.021728515625, 0.03375244140625, 0.0457763671875, 0.05780029296875, 0.06982421875, 0.08184814453125, 0.0938720703125, 0.10589599609375, 0.117919921875, 0.12994384765625, 0.1419677734375, 0.15399169921875, 0.166015625, 0.17803955078125, 0.1900634765625, 0.20208740234375, 0.214111328125, 0.22613525390625, 0.2381591796875, 0.25018310546875, 0.26220703125, 0.27423095703125, 0.2862548828125, 0.29827880859375, 0.310302734375, 0.32232666015625, 0.3343505859375, 0.34637451171875, 0.3583984375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 7.0, 8.0, 11.0, 11.0, 14.0, 9.0, 21.0, 13.0, 20.0, 18.0, 20.0, 37.0, 51.0, 63.0, 53.0, 46.0, 48.0, 45.0, 49.0, 40.0, 45.0, 55.0, 39.0, 37.0, 43.0, 22.0, 34.0, 24.0, 14.0, 13.0, 11.0, 11.0, 9.0, 8.0, 9.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.06640625, -0.06417655944824219, -0.061946868896484375, -0.05971717834472656, -0.05748748779296875, -0.05525779724121094, -0.053028106689453125, -0.05079841613769531, -0.0485687255859375, -0.04633903503417969, -0.044109344482421875, -0.04187965393066406, -0.03964996337890625, -0.03742027282714844, -0.035190582275390625, -0.03296089172363281, -0.030731201171875, -0.028501510620117188, -0.026271820068359375, -0.024042129516601562, -0.02181243896484375, -0.019582748413085938, -0.017353057861328125, -0.015123367309570312, -0.0128936767578125, -0.010663986206054688, -0.008434295654296875, -0.0062046051025390625, -0.00397491455078125, -0.0017452239990234375, 0.000484466552734375, 0.0027141571044921875, 0.00494384765625, 0.0071735382080078125, 0.009403228759765625, 0.011632919311523438, 0.01386260986328125, 0.016092300415039062, 0.018321990966796875, 0.020551681518554688, 0.0227813720703125, 0.025011062622070312, 0.027240753173828125, 0.029470443725585938, 0.03170013427734375, 0.03392982482910156, 0.036159515380859375, 0.03838920593261719, 0.040618896484375, 0.04284858703613281, 0.045078277587890625, 0.04730796813964844, 0.04953765869140625, 0.05176734924316406, 0.053997039794921875, 0.05622673034667969, 0.0584564208984375, 0.06068611145019531, 0.06291580200195312, 0.06514549255371094, 0.06737518310546875, 0.06960487365722656, 0.07183456420898438, 0.07406425476074219, 0.0762939453125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 8.0, 7.0, 10.0, 14.0, 13.0, 15.0, 20.0, 27.0, 45.0, 48.0, 60.0, 56.0, 135.0, 220.0, 409.0, 2091.0, 78093.0, 957944.0, 7696.0, 761.0, 277.0, 161.0, 100.0, 73.0, 46.0, 34.0, 27.0, 18.0, 24.0, 19.0, 11.0, 11.0, 10.0, 7.0, 12.0, 3.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.5185546875, -1.4741973876953125, -1.429840087890625, -1.3854827880859375, -1.34112548828125, -1.2967681884765625, -1.252410888671875, -1.2080535888671875, -1.1636962890625, -1.1193389892578125, -1.074981689453125, -1.0306243896484375, -0.98626708984375, -0.9419097900390625, -0.897552490234375, -0.8531951904296875, -0.808837890625, -0.7644805908203125, -0.720123291015625, -0.6757659912109375, -0.63140869140625, -0.5870513916015625, -0.542694091796875, -0.4983367919921875, -0.4539794921875, -0.4096221923828125, -0.365264892578125, -0.3209075927734375, -0.27655029296875, -0.2321929931640625, -0.187835693359375, -0.1434783935546875, -0.09912109375, -0.0547637939453125, -0.010406494140625, 0.0339508056640625, 0.07830810546875, 0.1226654052734375, 0.167022705078125, 0.2113800048828125, 0.2557373046875, 0.3000946044921875, 0.344451904296875, 0.3888092041015625, 0.43316650390625, 0.4775238037109375, 0.521881103515625, 0.5662384033203125, 0.610595703125, 0.6549530029296875, 0.699310302734375, 0.7436676025390625, 0.78802490234375, 0.8323822021484375, 0.876739501953125, 0.9210968017578125, 0.9654541015625, 1.0098114013671875, 1.054168701171875, 1.0985260009765625, 1.14288330078125, 1.1872406005859375, 1.231597900390625, 1.2759552001953125, 1.3203125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 5.0, 10.0, 40.0, 89.0, 388.0, 342.0, 89.0, 34.0, 11.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17508479952812195, -0.14563986659049988, -0.11619493365287781, -0.08675000071525574, -0.05730506777763367, -0.027860134840011597, 0.0015847980976104736, 0.031029731035232544, 0.060474663972854614, 0.08991959691047668, 0.11936452984809875, 0.14880946278572083, 0.1782543957233429, 0.20769932866096497, 0.23714426159858704, 0.2665891945362091, 0.2960341274738312, 0.32547906041145325, 0.3549239933490753, 0.3843689262866974, 0.41381385922431946, 0.44325879216194153, 0.4727037250995636, 0.5021486282348633, 0.5315935611724854, 0.5610384941101074, 0.5904834270477295, 0.6199283599853516, 0.6493732929229736, 0.6788182258605957, 0.7082631587982178, 0.7377080917358398, 0.7671530246734619, 0.796597957611084, 0.826042890548706, 0.8554878234863281, 0.8849327564239502, 0.9143776893615723, 0.9438226222991943, 0.9732675552368164, 1.0027124881744385, 1.0321574211120605, 1.0616023540496826, 1.0910472869873047, 1.1204922199249268, 1.1499371528625488, 1.179382085800171, 1.208827018737793, 1.238271951675415, 1.267716884613037, 1.2971618175506592, 1.3266067504882812, 1.3560516834259033, 1.3854966163635254, 1.4149415493011475, 1.4443864822387695, 1.4738314151763916, 1.5032763481140137, 1.5327212810516357, 1.5621662139892578, 1.5916111469268799, 1.621056079864502, 1.650501012802124, 1.679945945739746, 1.7093908786773682]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 3.0, 11.0, 7.0, 5.0, 11.0, 11.0, 12.0, 9.0, 16.0, 14.0, 16.0, 21.0, 20.0, 20.0, 32.0, 35.0, 31.0, 24.0, 26.0, 41.0, 38.0, 34.0, 40.0, 34.0, 37.0, 39.0, 40.0, 40.0, 30.0, 32.0, 37.0, 24.0, 21.0, 28.0, 34.0, 17.0, 17.0, 13.0, 13.0, 14.0, 7.0, 7.0, 8.0, 4.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 6.0, 2.0, 1.0], "bins": [-0.2874789237976074, -0.27904948592185974, -0.27062007784843445, -0.26219063997268677, -0.2537612318992615, -0.2453317940235138, -0.2369023710489273, -0.22847294807434082, -0.22004352509975433, -0.21161410212516785, -0.20318467915058136, -0.19475525617599487, -0.1863258183002472, -0.1778964102268219, -0.16946697235107422, -0.16103754937648773, -0.15260812640190125, -0.14417870342731476, -0.13574928045272827, -0.12731985747814178, -0.1188904270529747, -0.11046100407838821, -0.10203157365322113, -0.09360215067863464, -0.08517272770404816, -0.07674330472946167, -0.06831388175487518, -0.0598844513297081, -0.05145502835512161, -0.043025605380535126, -0.03459617868065834, -0.026166751980781555, -0.01773732900619507, -0.009307904168963432, -0.0008784793317317963, 0.00755094550549984, 0.015980370342731476, 0.024409793317317963, 0.03283922001719475, 0.04126864671707153, 0.04969806969165802, 0.05812749266624451, 0.066556915640831, 0.07498634606599808, 0.08341576904058456, 0.09184519201517105, 0.10027462244033813, 0.10870404541492462, 0.11713346838951111, 0.1255628913640976, 0.13399231433868408, 0.14242173731327057, 0.15085116028785706, 0.15928059816360474, 0.16771002113819122, 0.1761394441127777, 0.1845688670873642, 0.19299829006195068, 0.20142771303653717, 0.20985713601112366, 0.21828657388687134, 0.22671598196029663, 0.2351454198360443, 0.2435748428106308, 0.2520042657852173]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 9.0, 3.0, 3.0, 9.0, 11.0, 7.0, 12.0, 8.0, 12.0, 9.0, 15.0, 21.0, 19.0, 32.0, 24.0, 27.0, 33.0, 40.0, 39.0, 51.0, 38.0, 46.0, 46.0, 35.0, 47.0, 36.0, 43.0, 42.0, 28.0, 24.0, 32.0, 34.0, 28.0, 26.0, 20.0, 15.0, 16.0, 9.0, 10.0, 10.0, 7.0, 7.0, 6.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0], "bins": [-7.69921875, -7.49005126953125, -7.2808837890625, -7.07171630859375, -6.862548828125, -6.65338134765625, -6.4442138671875, -6.23504638671875, -6.02587890625, -5.81671142578125, -5.6075439453125, -5.39837646484375, -5.189208984375, -4.98004150390625, -4.7708740234375, -4.56170654296875, -4.3525390625, -4.14337158203125, -3.9342041015625, -3.72503662109375, -3.515869140625, -3.30670166015625, -3.0975341796875, -2.88836669921875, -2.67919921875, -2.47003173828125, -2.2608642578125, -2.05169677734375, -1.842529296875, -1.63336181640625, -1.4241943359375, -1.21502685546875, -1.005859375, -0.79669189453125, -0.5875244140625, -0.37835693359375, -0.169189453125, 0.03997802734375, 0.2491455078125, 0.45831298828125, 0.66748046875, 0.87664794921875, 1.0858154296875, 1.29498291015625, 1.504150390625, 1.71331787109375, 1.9224853515625, 2.13165283203125, 2.3408203125, 2.54998779296875, 2.7591552734375, 2.96832275390625, 3.177490234375, 3.38665771484375, 3.5958251953125, 3.80499267578125, 4.01416015625, 4.22332763671875, 4.4324951171875, 4.64166259765625, 4.850830078125, 5.05999755859375, 5.2691650390625, 5.47833251953125, 5.6875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 6.0, 16.0, 14.0, 20.0, 28.0, 38.0, 52.0, 79.0, 109.0, 137.0, 208.0, 274.0, 363.0, 552.0, 682.0, 1003.0, 1332.0, 1886.0, 2429.0, 3527.0, 5366.0, 9080.0, 19869.0, 54726.0, 224417.0, 504071.0, 139584.0, 39462.0, 15270.0, 7765.0, 4621.0, 3147.0, 2364.0, 1608.0, 1171.0, 873.0, 668.0, 472.0, 363.0, 262.0, 181.0, 129.0, 97.0, 76.0, 56.0, 35.0, 17.0, 27.0, 11.0, 7.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0], "bins": [-8.96875, -8.6998291015625, -8.430908203125, -8.1619873046875, -7.89306640625, -7.6241455078125, -7.355224609375, -7.0863037109375, -6.8173828125, -6.5484619140625, -6.279541015625, -6.0106201171875, -5.74169921875, -5.4727783203125, -5.203857421875, -4.9349365234375, -4.666015625, -4.3970947265625, -4.128173828125, -3.8592529296875, -3.59033203125, -3.3214111328125, -3.052490234375, -2.7835693359375, -2.5146484375, -2.2457275390625, -1.976806640625, -1.7078857421875, -1.43896484375, -1.1700439453125, -0.901123046875, -0.6322021484375, -0.36328125, -0.0943603515625, 0.174560546875, 0.4434814453125, 0.71240234375, 0.9813232421875, 1.250244140625, 1.5191650390625, 1.7880859375, 2.0570068359375, 2.325927734375, 2.5948486328125, 2.86376953125, 3.1326904296875, 3.401611328125, 3.6705322265625, 3.939453125, 4.2083740234375, 4.477294921875, 4.7462158203125, 5.01513671875, 5.2840576171875, 5.552978515625, 5.8218994140625, 6.0908203125, 6.3597412109375, 6.628662109375, 6.8975830078125, 7.16650390625, 7.4354248046875, 7.704345703125, 7.9732666015625, 8.2421875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 7.0, 8.0, 9.0, 20.0, 17.0, 13.0, 31.0, 14.0, 30.0, 31.0, 27.0, 43.0, 38.0, 57.0, 44.0, 77.0, 159.0, 1552.0, 300.0, 101.0, 71.0, 54.0, 48.0, 40.0, 36.0, 34.0, 29.0, 20.0, 20.0, 14.0, 18.0, 17.0, 14.0, 8.0, 15.0, 6.0, 2.0, 6.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.390625, -19.65673828125, -18.9228515625, -18.18896484375, -17.455078125, -16.72119140625, -15.9873046875, -15.25341796875, -14.51953125, -13.78564453125, -13.0517578125, -12.31787109375, -11.583984375, -10.85009765625, -10.1162109375, -9.38232421875, -8.6484375, -7.91455078125, -7.1806640625, -6.44677734375, -5.712890625, -4.97900390625, -4.2451171875, -3.51123046875, -2.77734375, -2.04345703125, -1.3095703125, -0.57568359375, 0.158203125, 0.89208984375, 1.6259765625, 2.35986328125, 3.09375, 3.82763671875, 4.5615234375, 5.29541015625, 6.029296875, 6.76318359375, 7.4970703125, 8.23095703125, 8.96484375, 9.69873046875, 10.4326171875, 11.16650390625, 11.900390625, 12.63427734375, 13.3681640625, 14.10205078125, 14.8359375, 15.56982421875, 16.3037109375, 17.03759765625, 17.771484375, 18.50537109375, 19.2392578125, 19.97314453125, 20.70703125, 21.44091796875, 22.1748046875, 22.90869140625, 23.642578125, 24.37646484375, 25.1103515625, 25.84423828125, 26.578125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 13.0, 22.0, 15.0, 26.0, 30.0, 31.0, 53.0, 79.0, 111.0, 144.0, 261.0, 433.0, 1149.0, 4233.0, 23021.0, 2182775.0, 908671.0, 18739.0, 3719.0, 1001.0, 420.0, 227.0, 158.0, 100.0, 57.0, 43.0, 35.0, 32.0, 27.0, 17.0, 19.0, 10.0, 3.0, 7.0, 7.0, 2.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.8125, -41.3828125, -39.953125, -38.5234375, -37.09375, -35.6640625, -34.234375, -32.8046875, -31.375, -29.9453125, -28.515625, -27.0859375, -25.65625, -24.2265625, -22.796875, -21.3671875, -19.9375, -18.5078125, -17.078125, -15.6484375, -14.21875, -12.7890625, -11.359375, -9.9296875, -8.5, -7.0703125, -5.640625, -4.2109375, -2.78125, -1.3515625, 0.078125, 1.5078125, 2.9375, 4.3671875, 5.796875, 7.2265625, 8.65625, 10.0859375, 11.515625, 12.9453125, 14.375, 15.8046875, 17.234375, 18.6640625, 20.09375, 21.5234375, 22.953125, 24.3828125, 25.8125, 27.2421875, 28.671875, 30.1015625, 31.53125, 32.9609375, 34.390625, 35.8203125, 37.25, 38.6796875, 40.109375, 41.5390625, 42.96875, 44.3984375, 45.828125, 47.2578125, 48.6875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 54.0, 760.0, 204.0], "bins": [-727.6083374023438, -715.9910278320312, -704.3737182617188, -692.7564697265625, -681.13916015625, -669.5218505859375, -657.904541015625, -646.2872314453125, -634.669921875, -623.0526123046875, -611.435302734375, -599.8180541992188, -588.2007446289062, -576.5834350585938, -564.9661254882812, -553.3488159179688, -541.7315673828125, -530.1142578125, -518.4969482421875, -506.8796691894531, -495.26239013671875, -483.64508056640625, -472.02777099609375, -460.41046142578125, -448.7931823730469, -437.1758728027344, -425.55859375, -413.9412841796875, -402.323974609375, -390.7066955566406, -379.0893859863281, -367.47210693359375, -355.85479736328125, -344.23748779296875, -332.6202087402344, -321.0028991699219, -309.3856201171875, -297.768310546875, -286.1510009765625, -274.53369140625, -262.9164123535156, -251.2991180419922, -239.68182373046875, -228.06451416015625, -216.4472198486328, -204.82992553710938, -193.21261596679688, -181.59532165527344, -169.97804260253906, -158.36074829101562, -146.74343872070312, -135.1261444091797, -123.50885009765625, -111.89155578613281, -100.27425384521484, -88.65695190429688, -77.03965759277344, -65.42236328125, -53.80506134033203, -42.18776321411133, -30.570465087890625, -18.953166961669922, -7.335868835449219, 4.28143310546875, 15.898731231689453]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 2.0, 6.0, 6.0, 4.0, 13.0, 15.0, 14.0, 11.0, 26.0, 21.0, 26.0, 21.0, 16.0, 26.0, 25.0, 34.0, 34.0, 36.0, 35.0, 38.0, 35.0, 41.0, 34.0, 35.0, 40.0, 29.0, 34.0, 40.0, 30.0, 29.0, 28.0, 37.0, 24.0, 21.0, 17.0, 19.0, 15.0, 13.0, 7.0, 11.0, 14.0, 8.0, 9.0, 2.0, 3.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-57.890052795410156, -56.039669036865234, -54.18928527832031, -52.338905334472656, -50.488521575927734, -48.63813781738281, -46.787757873535156, -44.937374114990234, -43.08699035644531, -41.23660659790039, -39.38622283935547, -37.53584289550781, -35.68545913696289, -33.83507537841797, -31.98469352722168, -30.13431167602539, -28.28392791748047, -26.433544158935547, -24.583162307739258, -22.73278045654297, -20.882396697998047, -19.032012939453125, -17.181631088256836, -15.33124828338623, -13.480865478515625, -11.63048267364502, -9.780099868774414, -7.929717063903809, -6.079334259033203, -4.228951454162598, -2.378568649291992, -0.5281858444213867, 1.3222007751464844, 3.17258358001709, 5.022966384887695, 6.873349189758301, 8.723731994628906, 10.574114799499512, 12.424497604370117, 14.274880409240723, 16.125263214111328, 17.97564697265625, 19.82602882385254, 21.676410675048828, 23.52679443359375, 25.377178192138672, 27.22756004333496, 29.07794189453125, 30.928325653076172, 32.778709411621094, 34.62908935546875, 36.47947311401367, 38.329856872558594, 40.180240631103516, 42.03062438964844, 43.881004333496094, 45.731388092041016, 47.58177185058594, 49.432151794433594, 51.282535552978516, 53.13291931152344, 54.98330307006836, 56.83368682861328, 58.68406677246094, 60.53445053100586]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 7.0, 5.0, 4.0, 10.0, 9.0, 10.0, 8.0, 10.0, 13.0, 14.0, 24.0, 19.0, 17.0, 33.0, 36.0, 30.0, 35.0, 41.0, 33.0, 43.0, 37.0, 51.0, 42.0, 52.0, 40.0, 47.0, 36.0, 22.0, 29.0, 38.0, 27.0, 25.0, 20.0, 28.0, 13.0, 13.0, 21.0, 11.0, 12.0, 5.0, 7.0, 8.0, 6.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0], "bins": [-8.0703125, -7.852783203125, -7.63525390625, -7.417724609375, -7.2001953125, -6.982666015625, -6.76513671875, -6.547607421875, -6.330078125, -6.112548828125, -5.89501953125, -5.677490234375, -5.4599609375, -5.242431640625, -5.02490234375, -4.807373046875, -4.58984375, -4.372314453125, -4.15478515625, -3.937255859375, -3.7197265625, -3.502197265625, -3.28466796875, -3.067138671875, -2.849609375, -2.632080078125, -2.41455078125, -2.197021484375, -1.9794921875, -1.761962890625, -1.54443359375, -1.326904296875, -1.109375, -0.891845703125, -0.67431640625, -0.456787109375, -0.2392578125, -0.021728515625, 0.19580078125, 0.413330078125, 0.630859375, 0.848388671875, 1.06591796875, 1.283447265625, 1.5009765625, 1.718505859375, 1.93603515625, 2.153564453125, 2.37109375, 2.588623046875, 2.80615234375, 3.023681640625, 3.2412109375, 3.458740234375, 3.67626953125, 3.893798828125, 4.111328125, 4.328857421875, 4.54638671875, 4.763916015625, 4.9814453125, 5.198974609375, 5.41650390625, 5.634033203125, 5.8515625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 6.0, 5.0, 6.0, 8.0, 7.0, 14.0, 14.0, 26.0, 37.0, 67.0, 87.0, 154.0, 252.0, 446.0, 817.0, 1420.0, 2754.0, 5599.0, 12068.0, 28660.0, 95322.0, 798084.0, 2727034.0, 414070.0, 65984.0, 22244.0, 9582.0, 4466.0, 2273.0, 1134.0, 656.0, 397.0, 213.0, 124.0, 82.0, 48.0, 38.0, 29.0, 18.0, 10.0, 12.0, 7.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.75, -17.124267578125, -16.49853515625, -15.872802734375, -15.2470703125, -14.621337890625, -13.99560546875, -13.369873046875, -12.744140625, -12.118408203125, -11.49267578125, -10.866943359375, -10.2412109375, -9.615478515625, -8.98974609375, -8.364013671875, -7.73828125, -7.112548828125, -6.48681640625, -5.861083984375, -5.2353515625, -4.609619140625, -3.98388671875, -3.358154296875, -2.732421875, -2.106689453125, -1.48095703125, -0.855224609375, -0.2294921875, 0.396240234375, 1.02197265625, 1.647705078125, 2.2734375, 2.899169921875, 3.52490234375, 4.150634765625, 4.7763671875, 5.402099609375, 6.02783203125, 6.653564453125, 7.279296875, 7.905029296875, 8.53076171875, 9.156494140625, 9.7822265625, 10.407958984375, 11.03369140625, 11.659423828125, 12.28515625, 12.910888671875, 13.53662109375, 14.162353515625, 14.7880859375, 15.413818359375, 16.03955078125, 16.665283203125, 17.291015625, 17.916748046875, 18.54248046875, 19.168212890625, 19.7939453125, 20.419677734375, 21.04541015625, 21.671142578125, 22.296875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 7.0, 9.0, 13.0, 19.0, 29.0, 48.0, 69.0, 91.0, 167.0, 291.0, 429.0, 652.0, 753.0, 552.0, 328.0, 211.0, 116.0, 104.0, 61.0, 35.0, 19.0, 15.0, 17.0, 9.0, 10.0, 11.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.21875, -31.473388671875, -30.72802734375, -29.982666015625, -29.2373046875, -28.491943359375, -27.74658203125, -27.001220703125, -26.255859375, -25.510498046875, -24.76513671875, -24.019775390625, -23.2744140625, -22.529052734375, -21.78369140625, -21.038330078125, -20.29296875, -19.547607421875, -18.80224609375, -18.056884765625, -17.3115234375, -16.566162109375, -15.82080078125, -15.075439453125, -14.330078125, -13.584716796875, -12.83935546875, -12.093994140625, -11.3486328125, -10.603271484375, -9.85791015625, -9.112548828125, -8.3671875, -7.621826171875, -6.87646484375, -6.131103515625, -5.3857421875, -4.640380859375, -3.89501953125, -3.149658203125, -2.404296875, -1.658935546875, -0.91357421875, -0.168212890625, 0.5771484375, 1.322509765625, 2.06787109375, 2.813232421875, 3.55859375, 4.303955078125, 5.04931640625, 5.794677734375, 6.5400390625, 7.285400390625, 8.03076171875, 8.776123046875, 9.521484375, 10.266845703125, 11.01220703125, 11.757568359375, 12.5029296875, 13.248291015625, 13.99365234375, 14.739013671875, 15.484375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 8.0, 13.0, 8.0, 30.0, 29.0, 53.0, 68.0, 88.0, 170.0, 361.0, 791.0, 1867.0, 5089.0, 15984.0, 62787.0, 431453.0, 3090150.0, 491118.0, 68356.0, 16779.0, 5478.0, 1972.0, 836.0, 353.0, 177.0, 115.0, 49.0, 32.0, 24.0, 19.0, 8.0, 8.0, 9.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.609375, -24.520751953125, -23.43212890625, -22.343505859375, -21.2548828125, -20.166259765625, -19.07763671875, -17.989013671875, -16.900390625, -15.811767578125, -14.72314453125, -13.634521484375, -12.5458984375, -11.457275390625, -10.36865234375, -9.280029296875, -8.19140625, -7.102783203125, -6.01416015625, -4.925537109375, -3.8369140625, -2.748291015625, -1.65966796875, -0.571044921875, 0.517578125, 1.606201171875, 2.69482421875, 3.783447265625, 4.8720703125, 5.960693359375, 7.04931640625, 8.137939453125, 9.2265625, 10.315185546875, 11.40380859375, 12.492431640625, 13.5810546875, 14.669677734375, 15.75830078125, 16.846923828125, 17.935546875, 19.024169921875, 20.11279296875, 21.201416015625, 22.2900390625, 23.378662109375, 24.46728515625, 25.555908203125, 26.64453125, 27.733154296875, 28.82177734375, 29.910400390625, 30.9990234375, 32.087646484375, 33.17626953125, 34.264892578125, 35.353515625, 36.442138671875, 37.53076171875, 38.619384765625, 39.7080078125, 40.796630859375, 41.88525390625, 42.973876953125, 44.0625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 7.0, 7.0, 15.0, 33.0, 56.0, 81.0, 134.0, 153.0, 140.0, 125.0, 106.0, 59.0, 39.0, 27.0, 14.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-217.85951232910156, -213.31866455078125, -208.77783203125, -204.23699951171875, -199.69615173339844, -195.15530395507812, -190.61447143554688, -186.07363891601562, -181.5327911376953, -176.991943359375, -172.45111083984375, -167.9102783203125, -163.3694305419922, -158.82858276367188, -154.28775024414062, -149.74691772460938, -145.20606994628906, -140.66522216796875, -136.1243896484375, -131.58355712890625, -127.04270935058594, -122.50186920166016, -117.96102905273438, -113.4201889038086, -108.87934875488281, -104.33850860595703, -99.79766845703125, -95.25682830810547, -90.71598815917969, -86.1751480102539, -81.63430786132812, -77.09346771240234, -72.5526351928711, -68.01179504394531, -63.47095489501953, -58.93011474609375, -54.38927459716797, -49.84843444824219, -45.307594299316406, -40.766754150390625, -36.225914001464844, -31.685073852539062, -27.14423370361328, -22.6033935546875, -18.06255340576172, -13.521713256835938, -8.980873107910156, -4.440032958984375, 0.10080718994140625, 4.6416473388671875, 9.182487487792969, 13.72332763671875, 18.26416778564453, 22.805007934570312, 27.345848083496094, 31.886688232421875, 36.427528381347656, 40.96836853027344, 45.50920867919922, 50.050048828125, 54.59088897705078, 59.13172912597656, 63.672569274902344, 68.21340942382812, 72.7542495727539]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 3.0, 6.0, 6.0, 4.0, 8.0, 8.0, 11.0, 10.0, 5.0, 18.0, 18.0, 26.0, 23.0, 33.0, 43.0, 28.0, 36.0, 30.0, 32.0, 43.0, 47.0, 52.0, 41.0, 49.0, 33.0, 44.0, 40.0, 46.0, 30.0, 29.0, 24.0, 31.0, 26.0, 30.0, 18.0, 18.0, 9.0, 4.0, 5.0, 5.0, 9.0, 4.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.053070068359375, -59.09006881713867, -57.1270637512207, -55.1640625, -53.2010612487793, -51.238059997558594, -49.275054931640625, -47.31205368041992, -45.34905242919922, -43.386051177978516, -41.42304611206055, -39.460044860839844, -37.49704360961914, -35.53404235839844, -33.57103729248047, -31.608036041259766, -29.645030975341797, -27.68202781677246, -25.719026565551758, -23.756023406982422, -21.79302215576172, -19.830018997192383, -17.867015838623047, -15.904013633728027, -13.941011428833008, -11.978009223937988, -10.015007019042969, -8.052003860473633, -6.089001655578613, -4.125999450683594, -2.162996292114258, -0.19999408721923828, 1.7630081176757812, 3.72601056098938, 5.6890130043029785, 7.652015686035156, 9.615017890930176, 11.578020095825195, 13.541023254394531, 15.50402545928955, 17.46702766418457, 19.430030822753906, 21.39303207397461, 23.356035232543945, 25.31903839111328, 27.282039642333984, 29.24504280090332, 31.208045959472656, 33.17104721069336, 35.13404846191406, 37.09705352783203, 39.060054779052734, 41.02305603027344, 42.986061096191406, 44.94906234741211, 46.91206359863281, 48.87506866455078, 50.838069915771484, 52.80107498168945, 54.764076232910156, 56.72707748413086, 58.69007873535156, 60.65308380126953, 62.616085052490234, 64.57908630371094]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 2.0, 5.0, 13.0, 9.0, 13.0, 13.0, 12.0, 13.0, 13.0, 22.0, 24.0, 27.0, 20.0, 32.0, 41.0, 46.0, 33.0, 50.0, 38.0, 43.0, 42.0, 46.0, 45.0, 38.0, 36.0, 47.0, 34.0, 24.0, 34.0, 18.0, 23.0, 22.0, 23.0, 15.0, 12.0, 9.0, 10.0, 10.0, 12.0, 8.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.58203125, -7.3623046875, -7.142578125, -6.9228515625, -6.703125, -6.4833984375, -6.263671875, -6.0439453125, -5.82421875, -5.6044921875, -5.384765625, -5.1650390625, -4.9453125, -4.7255859375, -4.505859375, -4.2861328125, -4.06640625, -3.8466796875, -3.626953125, -3.4072265625, -3.1875, -2.9677734375, -2.748046875, -2.5283203125, -2.30859375, -2.0888671875, -1.869140625, -1.6494140625, -1.4296875, -1.2099609375, -0.990234375, -0.7705078125, -0.55078125, -0.3310546875, -0.111328125, 0.1083984375, 0.328125, 0.5478515625, 0.767578125, 0.9873046875, 1.20703125, 1.4267578125, 1.646484375, 1.8662109375, 2.0859375, 2.3056640625, 2.525390625, 2.7451171875, 2.96484375, 3.1845703125, 3.404296875, 3.6240234375, 3.84375, 4.0634765625, 4.283203125, 4.5029296875, 4.72265625, 4.9423828125, 5.162109375, 5.3818359375, 5.6015625, 5.8212890625, 6.041015625, 6.2607421875, 6.48046875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 12.0, 15.0, 14.0, 20.0, 31.0, 49.0, 56.0, 94.0, 171.0, 241.0, 399.0, 546.0, 781.0, 1236.0, 1884.0, 2863.0, 4438.0, 6846.0, 11219.0, 17956.0, 30096.0, 51186.0, 88877.0, 154248.0, 228397.0, 183555.0, 108196.0, 61781.0, 35810.0, 21497.0, 12890.0, 8174.0, 5276.0, 3301.0, 2198.0, 1427.0, 941.0, 614.0, 405.0, 232.0, 190.0, 117.0, 76.0, 72.0, 39.0, 31.0, 25.0, 13.0, 10.0, 6.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0771484375, -1.039581298828125, -1.00201416015625, -0.964447021484375, -0.9268798828125, -0.889312744140625, -0.85174560546875, -0.814178466796875, -0.776611328125, -0.739044189453125, -0.70147705078125, -0.663909912109375, -0.6263427734375, -0.588775634765625, -0.55120849609375, -0.513641357421875, -0.47607421875, -0.438507080078125, -0.40093994140625, -0.363372802734375, -0.3258056640625, -0.288238525390625, -0.25067138671875, -0.213104248046875, -0.175537109375, -0.137969970703125, -0.10040283203125, -0.062835693359375, -0.0252685546875, 0.012298583984375, 0.04986572265625, 0.087432861328125, 0.125, 0.162567138671875, 0.20013427734375, 0.237701416015625, 0.2752685546875, 0.312835693359375, 0.35040283203125, 0.387969970703125, 0.425537109375, 0.463104248046875, 0.50067138671875, 0.538238525390625, 0.5758056640625, 0.613372802734375, 0.65093994140625, 0.688507080078125, 0.72607421875, 0.763641357421875, 0.80120849609375, 0.838775634765625, 0.8763427734375, 0.913909912109375, 0.95147705078125, 0.989044189453125, 1.026611328125, 1.064178466796875, 1.10174560546875, 1.139312744140625, 1.1768798828125, 1.214447021484375, 1.25201416015625, 1.289581298828125, 1.3271484375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 11.0, 12.0, 10.0, 16.0, 10.0, 17.0, 17.0, 16.0, 8.0, 33.0, 19.0, 22.0, 34.0, 21.0, 33.0, 43.0, 31.0, 36.0, 32.0, 36.0, 1054.0, 37.0, 42.0, 40.0, 41.0, 33.0, 34.0, 26.0, 24.0, 28.0, 27.0, 13.0, 25.0, 22.0, 23.0, 14.0, 14.0, 12.0, 10.0, 6.0, 7.0, 7.0, 4.0, 2.0, 1.0, 7.0, 6.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.96484375, -3.84027099609375, -3.7156982421875, -3.59112548828125, -3.466552734375, -3.34197998046875, -3.2174072265625, -3.09283447265625, -2.96826171875, -2.84368896484375, -2.7191162109375, -2.59454345703125, -2.469970703125, -2.34539794921875, -2.2208251953125, -2.09625244140625, -1.9716796875, -1.84710693359375, -1.7225341796875, -1.59796142578125, -1.473388671875, -1.34881591796875, -1.2242431640625, -1.09967041015625, -0.97509765625, -0.85052490234375, -0.7259521484375, -0.60137939453125, -0.476806640625, -0.35223388671875, -0.2276611328125, -0.10308837890625, 0.021484375, 0.14605712890625, 0.2706298828125, 0.39520263671875, 0.519775390625, 0.64434814453125, 0.7689208984375, 0.89349365234375, 1.01806640625, 1.14263916015625, 1.2672119140625, 1.39178466796875, 1.516357421875, 1.64093017578125, 1.7655029296875, 1.89007568359375, 2.0146484375, 2.13922119140625, 2.2637939453125, 2.38836669921875, 2.512939453125, 2.63751220703125, 2.7620849609375, 2.88665771484375, 3.01123046875, 3.13580322265625, 3.2603759765625, 3.38494873046875, 3.509521484375, 3.63409423828125, 3.7586669921875, 3.88323974609375, 4.0078125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 0.0, 6.0, 2.0, 7.0, 10.0, 11.0, 12.0, 27.0, 30.0, 38.0, 49.0, 69.0, 104.0, 155.0, 210.0, 368.0, 485.0, 898.0, 1341.0, 2217.0, 3532.0, 5974.0, 9991.0, 17262.0, 30365.0, 52681.0, 94966.0, 177568.0, 1206583.0, 229081.0, 114111.0, 62854.0, 35713.0, 20280.0, 12031.0, 7038.0, 4168.0, 2565.0, 1545.0, 949.0, 590.0, 418.0, 270.0, 156.0, 123.0, 90.0, 56.0, 37.0, 30.0, 22.0, 20.0, 13.0, 8.0, 5.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.482421875, -0.4676475524902344, -0.45287322998046875, -0.4380989074707031, -0.4233245849609375, -0.4085502624511719, -0.39377593994140625, -0.3790016174316406, -0.364227294921875, -0.3494529724121094, -0.33467864990234375, -0.3199043273925781, -0.3051300048828125, -0.2903556823730469, -0.27558135986328125, -0.2608070373535156, -0.24603271484375, -0.23125839233398438, -0.21648406982421875, -0.20170974731445312, -0.1869354248046875, -0.17216110229492188, -0.15738677978515625, -0.14261245727539062, -0.127838134765625, -0.11306381225585938, -0.09828948974609375, -0.08351516723632812, -0.0687408447265625, -0.053966522216796875, -0.03919219970703125, -0.024417877197265625, -0.0096435546875, 0.005130767822265625, 0.01990509033203125, 0.034679412841796875, 0.0494537353515625, 0.06422805786132812, 0.07900238037109375, 0.09377670288085938, 0.108551025390625, 0.12332534790039062, 0.13809967041015625, 0.15287399291992188, 0.1676483154296875, 0.18242263793945312, 0.19719696044921875, 0.21197128295898438, 0.22674560546875, 0.24151992797851562, 0.25629425048828125, 0.2710685729980469, 0.2858428955078125, 0.3006172180175781, 0.31539154052734375, 0.3301658630371094, 0.344940185546875, 0.3597145080566406, 0.37448883056640625, 0.3892631530761719, 0.4040374755859375, 0.4188117980957031, 0.43358612060546875, 0.4483604431152344, 0.463134765625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 6.0, 6.0, 5.0, 7.0, 13.0, 12.0, 17.0, 14.0, 14.0, 35.0, 62.0, 127.0, 187.0, 191.0, 94.0, 41.0, 30.0, 14.0, 12.0, 17.0, 20.0, 8.0, 8.0, 10.0, 4.0, 7.0, 7.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.19091796875, -0.18510818481445312, -0.17929840087890625, -0.17348861694335938, -0.1676788330078125, -0.16186904907226562, -0.15605926513671875, -0.15024948120117188, -0.144439697265625, -0.13862991333007812, -0.13282012939453125, -0.12701034545898438, -0.1212005615234375, -0.11539077758789062, -0.10958099365234375, -0.10377120971679688, -0.09796142578125, -0.09215164184570312, -0.08634185791015625, -0.08053207397460938, -0.0747222900390625, -0.06891250610351562, -0.06310272216796875, -0.057292938232421875, -0.051483154296875, -0.045673370361328125, -0.03986358642578125, -0.034053802490234375, -0.0282440185546875, -0.022434234619140625, -0.01662445068359375, -0.010814666748046875, -0.0050048828125, 0.000804901123046875, 0.00661468505859375, 0.012424468994140625, 0.0182342529296875, 0.024044036865234375, 0.02985382080078125, 0.035663604736328125, 0.041473388671875, 0.047283172607421875, 0.05309295654296875, 0.058902740478515625, 0.0647125244140625, 0.07052230834960938, 0.07633209228515625, 0.08214187622070312, 0.08795166015625, 0.09376144409179688, 0.09957122802734375, 0.10538101196289062, 0.1111907958984375, 0.11700057983398438, 0.12281036376953125, 0.12862014770507812, 0.134429931640625, 0.14023971557617188, 0.14604949951171875, 0.15185928344726562, 0.1576690673828125, 0.16347885131835938, 0.16928863525390625, 0.17509841918945312, 0.180908203125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 8.0, 8.0, 4.0, 7.0, 7.0, 14.0, 23.0, 27.0, 35.0, 42.0, 119.0, 245.0, 1097.0, 84639.0, 959275.0, 2312.0, 329.0, 152.0, 56.0, 37.0, 26.0, 17.0, 13.0, 11.0, 6.0, 4.0, 8.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.80859375, -3.68621826171875, -3.5638427734375, -3.44146728515625, -3.319091796875, -3.19671630859375, -3.0743408203125, -2.95196533203125, -2.82958984375, -2.70721435546875, -2.5848388671875, -2.46246337890625, -2.340087890625, -2.21771240234375, -2.0953369140625, -1.97296142578125, -1.8505859375, -1.72821044921875, -1.6058349609375, -1.48345947265625, -1.361083984375, -1.23870849609375, -1.1163330078125, -0.99395751953125, -0.87158203125, -0.74920654296875, -0.6268310546875, -0.50445556640625, -0.382080078125, -0.25970458984375, -0.1373291015625, -0.01495361328125, 0.107421875, 0.22979736328125, 0.3521728515625, 0.47454833984375, 0.596923828125, 0.71929931640625, 0.8416748046875, 0.96405029296875, 1.08642578125, 1.20880126953125, 1.3311767578125, 1.45355224609375, 1.575927734375, 1.69830322265625, 1.8206787109375, 1.94305419921875, 2.0654296875, 2.18780517578125, 2.3101806640625, 2.43255615234375, 2.554931640625, 2.67730712890625, 2.7996826171875, 2.92205810546875, 3.04443359375, 3.16680908203125, 3.2891845703125, 3.41156005859375, 3.533935546875, 3.65631103515625, 3.7786865234375, 3.90106201171875, 4.0234375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 5.0, 3.0, 5.0, 15.0, 15.0, 13.0, 26.0, 47.0, 70.0, 106.0, 207.0, 222.0, 88.0, 63.0, 35.0, 29.0, 16.0, 12.0, 9.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.309217631816864, -0.2910042703151703, -0.2727908790111542, -0.25457751750946045, -0.23636414110660553, -0.2181507647037506, -0.19993740320205688, -0.18172402679920197, -0.16351065039634705, -0.14529727399349213, -0.1270838975906372, -0.10887053608894348, -0.09065715968608856, -0.07244378328323364, -0.05423041433095932, -0.036017045378685, -0.017803668975830078, 0.00040970370173454285, 0.018623076379299164, 0.036836449056863785, 0.055049821734428406, 0.07326319813728333, 0.09147656708955765, 0.10968993604183197, 0.1279033124446869, 0.1461166888475418, 0.16433006525039673, 0.18254342675209045, 0.20075680315494537, 0.2189701795578003, 0.23718354105949402, 0.25539690256118774, 0.2736102342605591, 0.2918235957622528, 0.3100369870662689, 0.32825034856796265, 0.34646373987197876, 0.3646771013736725, 0.3828904628753662, 0.4011038541793823, 0.41931721568107605, 0.4375305771827698, 0.4557439684867859, 0.4739573299884796, 0.49217069149017334, 0.5103840827941895, 0.5285974740982056, 0.5468108057975769, 0.565024197101593, 0.5832375884056091, 0.6014509201049805, 0.6196643114089966, 0.6378777027130127, 0.6560910940170288, 0.6743044257164001, 0.6925178170204163, 0.7107311487197876, 0.7289445400238037, 0.747157871723175, 0.7653712630271912, 0.7835846543312073, 0.8017979860305786, 0.8200113773345947, 0.8382247686386108, 0.856438159942627]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 7.0, 4.0, 9.0, 3.0, 12.0, 17.0, 13.0, 23.0, 18.0, 16.0, 19.0, 27.0, 21.0, 32.0, 38.0, 40.0, 29.0, 33.0, 38.0, 26.0, 43.0, 42.0, 37.0, 36.0, 33.0, 40.0, 34.0, 38.0, 37.0, 26.0, 31.0, 22.0, 10.0, 25.0, 24.0, 20.0, 14.0, 6.0, 6.0, 6.0, 12.0, 6.0, 4.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.41460734605789185, -0.4021484851837158, -0.3896896243095398, -0.37723076343536377, -0.36477190256118774, -0.3523130416870117, -0.3398541808128357, -0.32739534974098206, -0.31493648886680603, -0.30247762799263, -0.290018767118454, -0.27755990624427795, -0.26510104537010193, -0.2526422142982483, -0.24018333852291107, -0.22772449254989624, -0.21526561677455902, -0.202806755900383, -0.19034789502620697, -0.17788904905319214, -0.1654301881790161, -0.1529713273048401, -0.14051246643066406, -0.12805360555648804, -0.11559475213289261, -0.10313589125871658, -0.09067703783512115, -0.07821817696094513, -0.0657593160867691, -0.053300462663173676, -0.04084160178899765, -0.02838274836540222, -0.015923887491226196, -0.0034650294110178947, 0.008993828669190407, 0.021452687680721283, 0.03391154482960701, 0.04637040197849274, 0.05882926285266876, 0.07128811627626419, 0.08374697715044022, 0.09620583802461624, 0.10866469144821167, 0.1211235523223877, 0.13358241319656372, 0.14604127407073975, 0.15850013494491577, 0.1709589809179306, 0.18341784179210663, 0.19587670266628265, 0.20833556354045868, 0.2207944095134735, 0.23325327038764954, 0.24571213126182556, 0.2581709921360016, 0.2706298530101776, 0.28308871388435364, 0.29554757475852966, 0.3080064356327057, 0.3204652965068817, 0.33292415738105774, 0.3453829884529114, 0.3578418493270874, 0.3703007102012634, 0.38275957107543945]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 3.0, 3.0, 13.0, 9.0, 13.0, 14.0, 12.0, 13.0, 13.0, 22.0, 23.0, 27.0, 21.0, 32.0, 41.0, 44.0, 30.0, 54.0, 37.0, 41.0, 40.0, 50.0, 48.0, 37.0, 38.0, 42.0, 38.0, 23.0, 35.0, 18.0, 23.0, 21.0, 24.0, 15.0, 11.0, 9.0, 10.0, 10.0, 13.0, 7.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.59765625, -7.377685546875, -7.15771484375, -6.937744140625, -6.7177734375, -6.497802734375, -6.27783203125, -6.057861328125, -5.837890625, -5.617919921875, -5.39794921875, -5.177978515625, -4.9580078125, -4.738037109375, -4.51806640625, -4.298095703125, -4.078125, -3.858154296875, -3.63818359375, -3.418212890625, -3.1982421875, -2.978271484375, -2.75830078125, -2.538330078125, -2.318359375, -2.098388671875, -1.87841796875, -1.658447265625, -1.4384765625, -1.218505859375, -0.99853515625, -0.778564453125, -0.55859375, -0.338623046875, -0.11865234375, 0.101318359375, 0.3212890625, 0.541259765625, 0.76123046875, 0.981201171875, 1.201171875, 1.421142578125, 1.64111328125, 1.861083984375, 2.0810546875, 2.301025390625, 2.52099609375, 2.740966796875, 2.9609375, 3.180908203125, 3.40087890625, 3.620849609375, 3.8408203125, 4.060791015625, 4.28076171875, 4.500732421875, 4.720703125, 4.940673828125, 5.16064453125, 5.380615234375, 5.6005859375, 5.820556640625, 6.04052734375, 6.260498046875, 6.48046875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 11.0, 16.0, 17.0, 38.0, 38.0, 44.0, 52.0, 88.0, 137.0, 186.0, 278.0, 388.0, 488.0, 706.0, 1047.0, 1489.0, 2294.0, 3782.0, 7061.0, 16079.0, 46873.0, 156922.0, 398491.0, 274851.0, 86319.0, 26576.0, 10252.0, 4996.0, 2929.0, 1905.0, 1235.0, 873.0, 600.0, 415.0, 320.0, 222.0, 152.0, 109.0, 90.0, 42.0, 53.0, 29.0, 14.0, 13.0, 12.0, 8.0, 11.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.46875, -8.2020263671875, -7.935302734375, -7.6685791015625, -7.40185546875, -7.1351318359375, -6.868408203125, -6.6016845703125, -6.3349609375, -6.0682373046875, -5.801513671875, -5.5347900390625, -5.26806640625, -5.0013427734375, -4.734619140625, -4.4678955078125, -4.201171875, -3.9344482421875, -3.667724609375, -3.4010009765625, -3.13427734375, -2.8675537109375, -2.600830078125, -2.3341064453125, -2.0673828125, -1.8006591796875, -1.533935546875, -1.2672119140625, -1.00048828125, -0.7337646484375, -0.467041015625, -0.2003173828125, 0.06640625, 0.3331298828125, 0.599853515625, 0.8665771484375, 1.13330078125, 1.4000244140625, 1.666748046875, 1.9334716796875, 2.2001953125, 2.4669189453125, 2.733642578125, 3.0003662109375, 3.26708984375, 3.5338134765625, 3.800537109375, 4.0672607421875, 4.333984375, 4.6007080078125, 4.867431640625, 5.1341552734375, 5.40087890625, 5.6676025390625, 5.934326171875, 6.2010498046875, 6.4677734375, 6.7344970703125, 7.001220703125, 7.2679443359375, 7.53466796875, 7.8013916015625, 8.068115234375, 8.3348388671875, 8.6015625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 5.0, 10.0, 3.0, 8.0, 10.0, 10.0, 15.0, 16.0, 18.0, 22.0, 27.0, 32.0, 36.0, 30.0, 49.0, 50.0, 60.0, 57.0, 114.0, 227.0, 1397.0, 277.0, 125.0, 81.0, 55.0, 49.0, 27.0, 34.0, 41.0, 28.0, 14.0, 16.0, 25.0, 16.0, 15.0, 16.0, 11.0, 7.0, 6.0, 2.0, 6.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.265625, -24.533447265625, -23.80126953125, -23.069091796875, -22.3369140625, -21.604736328125, -20.87255859375, -20.140380859375, -19.408203125, -18.676025390625, -17.94384765625, -17.211669921875, -16.4794921875, -15.747314453125, -15.01513671875, -14.282958984375, -13.55078125, -12.818603515625, -12.08642578125, -11.354248046875, -10.6220703125, -9.889892578125, -9.15771484375, -8.425537109375, -7.693359375, -6.961181640625, -6.22900390625, -5.496826171875, -4.7646484375, -4.032470703125, -3.30029296875, -2.568115234375, -1.8359375, -1.103759765625, -0.37158203125, 0.360595703125, 1.0927734375, 1.824951171875, 2.55712890625, 3.289306640625, 4.021484375, 4.753662109375, 5.48583984375, 6.218017578125, 6.9501953125, 7.682373046875, 8.41455078125, 9.146728515625, 9.87890625, 10.611083984375, 11.34326171875, 12.075439453125, 12.8076171875, 13.539794921875, 14.27197265625, 15.004150390625, 15.736328125, 16.468505859375, 17.20068359375, 17.932861328125, 18.6650390625, 19.397216796875, 20.12939453125, 20.861572265625, 21.59375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 5.0, 3.0, 2.0, 9.0, 9.0, 15.0, 12.0, 25.0, 21.0, 27.0, 36.0, 51.0, 71.0, 97.0, 123.0, 169.0, 334.0, 548.0, 1414.0, 5924.0, 98861.0, 2969061.0, 61222.0, 4952.0, 1197.0, 525.0, 292.0, 182.0, 133.0, 97.0, 66.0, 49.0, 47.0, 26.0, 27.0, 17.0, 15.0, 10.0, 6.0, 8.0, 10.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.5, -39.076171875, -37.65234375, -36.228515625, -34.8046875, -33.380859375, -31.95703125, -30.533203125, -29.109375, -27.685546875, -26.26171875, -24.837890625, -23.4140625, -21.990234375, -20.56640625, -19.142578125, -17.71875, -16.294921875, -14.87109375, -13.447265625, -12.0234375, -10.599609375, -9.17578125, -7.751953125, -6.328125, -4.904296875, -3.48046875, -2.056640625, -0.6328125, 0.791015625, 2.21484375, 3.638671875, 5.0625, 6.486328125, 7.91015625, 9.333984375, 10.7578125, 12.181640625, 13.60546875, 15.029296875, 16.453125, 17.876953125, 19.30078125, 20.724609375, 22.1484375, 23.572265625, 24.99609375, 26.419921875, 27.84375, 29.267578125, 30.69140625, 32.115234375, 33.5390625, 34.962890625, 36.38671875, 37.810546875, 39.234375, 40.658203125, 42.08203125, 43.505859375, 44.9296875, 46.353515625, 47.77734375, 49.201171875, 50.625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 10.0, 91.0, 423.0, 394.0, 94.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.11189270019531, -85.93836212158203, -79.76482391357422, -73.59129333496094, -67.41775512695312, -61.244224548339844, -55.07069396972656, -48.897159576416016, -42.72362518310547, -36.55009078979492, -30.376558303833008, -24.203025817871094, -18.029491424560547, -11.85595703125, -5.682426452636719, 0.4911079406738281, 6.664642333984375, 12.838175773620605, 19.011709213256836, 25.18524169921875, 31.358776092529297, 37.532310485839844, 43.705841064453125, 49.87937545776367, 56.05290985107422, 62.226444244384766, 68.39997863769531, 74.5735092163086, 80.74703979492188, 86.92057800292969, 93.09410858154297, 99.26763916015625, 105.441162109375, 111.61469268798828, 117.7882308959961, 123.96176147460938, 130.1352996826172, 136.308837890625, 142.48236083984375, 148.65589904785156, 154.82943725585938, 161.0029754638672, 167.17649841308594, 173.35003662109375, 179.52357482910156, 185.69711303710938, 191.87063598632812, 198.04417419433594, 204.2176971435547, 210.3912353515625, 216.56475830078125, 222.73829650878906, 228.91183471679688, 235.08535766601562, 241.25889587402344, 247.43243408203125, 253.60595703125, 259.77947998046875, 265.9530334472656, 272.1265563964844, 278.3000793457031, 284.4736328125, 290.64715576171875, 296.8206787109375, 302.9942321777344]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 9.0, 4.0, 7.0, 13.0, 15.0, 19.0, 19.0, 23.0, 24.0, 22.0, 35.0, 31.0, 39.0, 36.0, 34.0, 41.0, 40.0, 39.0, 38.0, 45.0, 41.0, 41.0, 32.0, 36.0, 31.0, 32.0, 28.0, 29.0, 23.0, 23.0, 22.0, 13.0, 17.0, 19.0, 15.0, 11.0, 8.0, 11.0, 5.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-61.509971618652344, -59.73705291748047, -57.96413040161133, -56.19121170043945, -54.41828918457031, -52.64537048339844, -50.8724479675293, -49.09952926635742, -47.32660675048828, -45.553688049316406, -43.780765533447266, -42.00784683227539, -40.23492431640625, -38.462005615234375, -36.689083099365234, -34.91616439819336, -33.14324188232422, -31.37032127380371, -29.597400665283203, -27.824480056762695, -26.051559448242188, -24.278640747070312, -22.505718231201172, -20.732799530029297, -18.959880828857422, -17.186960220336914, -15.414039611816406, -13.641119003295898, -11.86819839477539, -10.0952787399292, -8.322358131408691, -6.549437522888184, -4.776515960693359, -3.0035953521728516, -1.2306749820709229, 0.5422453880310059, 2.3151659965515137, 4.088086128234863, 5.861006736755371, 7.633927345275879, 9.406847953796387, 11.179768562316895, 12.952689170837402, 14.725608825683594, 16.4985294342041, 18.27145004272461, 20.044370651245117, 21.817291259765625, 23.590211868286133, 25.36313247680664, 27.13605308532715, 28.908973693847656, 30.681894302368164, 32.45481491088867, 34.22773361206055, 36.00065612792969, 37.77357482910156, 39.54649353027344, 41.31941604614258, 43.09233474731445, 44.865257263183594, 46.63817596435547, 48.41109848022461, 50.184017181396484, 51.956939697265625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 3.0, 7.0, 5.0, 10.0, 13.0, 10.0, 13.0, 11.0, 10.0, 9.0, 15.0, 28.0, 28.0, 20.0, 27.0, 29.0, 44.0, 36.0, 45.0, 35.0, 42.0, 42.0, 38.0, 52.0, 28.0, 37.0, 40.0, 41.0, 35.0, 29.0, 25.0, 20.0, 17.0, 25.0, 28.0, 17.0, 10.0, 9.0, 7.0, 10.0, 14.0, 9.0, 9.0, 3.0, 6.0, 4.0, 6.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-7.2421875, -7.02587890625, -6.8095703125, -6.59326171875, -6.376953125, -6.16064453125, -5.9443359375, -5.72802734375, -5.51171875, -5.29541015625, -5.0791015625, -4.86279296875, -4.646484375, -4.43017578125, -4.2138671875, -3.99755859375, -3.78125, -3.56494140625, -3.3486328125, -3.13232421875, -2.916015625, -2.69970703125, -2.4833984375, -2.26708984375, -2.05078125, -1.83447265625, -1.6181640625, -1.40185546875, -1.185546875, -0.96923828125, -0.7529296875, -0.53662109375, -0.3203125, -0.10400390625, 0.1123046875, 0.32861328125, 0.544921875, 0.76123046875, 0.9775390625, 1.19384765625, 1.41015625, 1.62646484375, 1.8427734375, 2.05908203125, 2.275390625, 2.49169921875, 2.7080078125, 2.92431640625, 3.140625, 3.35693359375, 3.5732421875, 3.78955078125, 4.005859375, 4.22216796875, 4.4384765625, 4.65478515625, 4.87109375, 5.08740234375, 5.3037109375, 5.52001953125, 5.736328125, 5.95263671875, 6.1689453125, 6.38525390625, 6.6015625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 7.0, 17.0, 8.0, 32.0, 29.0, 48.0, 78.0, 99.0, 155.0, 236.0, 342.0, 642.0, 1207.0, 2279.0, 4523.0, 9610.0, 22935.0, 68472.0, 438612.0, 2777615.0, 727444.0, 89927.0, 27803.0, 11234.0, 5040.0, 2636.0, 1293.0, 755.0, 421.0, 256.0, 171.0, 113.0, 73.0, 48.0, 36.0, 19.0, 15.0, 13.0, 14.0, 6.0, 5.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.5625, -20.880126953125, -20.19775390625, -19.515380859375, -18.8330078125, -18.150634765625, -17.46826171875, -16.785888671875, -16.103515625, -15.421142578125, -14.73876953125, -14.056396484375, -13.3740234375, -12.691650390625, -12.00927734375, -11.326904296875, -10.64453125, -9.962158203125, -9.27978515625, -8.597412109375, -7.9150390625, -7.232666015625, -6.55029296875, -5.867919921875, -5.185546875, -4.503173828125, -3.82080078125, -3.138427734375, -2.4560546875, -1.773681640625, -1.09130859375, -0.408935546875, 0.2734375, 0.955810546875, 1.63818359375, 2.320556640625, 3.0029296875, 3.685302734375, 4.36767578125, 5.050048828125, 5.732421875, 6.414794921875, 7.09716796875, 7.779541015625, 8.4619140625, 9.144287109375, 9.82666015625, 10.509033203125, 11.19140625, 11.873779296875, 12.55615234375, 13.238525390625, 13.9208984375, 14.603271484375, 15.28564453125, 15.968017578125, 16.650390625, 17.332763671875, 18.01513671875, 18.697509765625, 19.3798828125, 20.062255859375, 20.74462890625, 21.427001953125, 22.109375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 7.0, 10.0, 9.0, 13.0, 11.0, 22.0, 34.0, 41.0, 60.0, 94.0, 134.0, 179.0, 243.0, 397.0, 575.0, 637.0, 500.0, 347.0, 237.0, 160.0, 117.0, 69.0, 43.0, 34.0, 26.0, 23.0, 20.0, 8.0, 6.0, 11.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.46875, -17.8173828125, -17.166015625, -16.5146484375, -15.86328125, -15.2119140625, -14.560546875, -13.9091796875, -13.2578125, -12.6064453125, -11.955078125, -11.3037109375, -10.65234375, -10.0009765625, -9.349609375, -8.6982421875, -8.046875, -7.3955078125, -6.744140625, -6.0927734375, -5.44140625, -4.7900390625, -4.138671875, -3.4873046875, -2.8359375, -2.1845703125, -1.533203125, -0.8818359375, -0.23046875, 0.4208984375, 1.072265625, 1.7236328125, 2.375, 3.0263671875, 3.677734375, 4.3291015625, 4.98046875, 5.6318359375, 6.283203125, 6.9345703125, 7.5859375, 8.2373046875, 8.888671875, 9.5400390625, 10.19140625, 10.8427734375, 11.494140625, 12.1455078125, 12.796875, 13.4482421875, 14.099609375, 14.7509765625, 15.40234375, 16.0537109375, 16.705078125, 17.3564453125, 18.0078125, 18.6591796875, 19.310546875, 19.9619140625, 20.61328125, 21.2646484375, 21.916015625, 22.5673828125, 23.21875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 5.0, 12.0, 24.0, 26.0, 48.0, 61.0, 78.0, 160.0, 318.0, 559.0, 1431.0, 3533.0, 10622.0, 38168.0, 199695.0, 2555355.0, 1235229.0, 111353.0, 25193.0, 7496.0, 2682.0, 1101.0, 491.0, 260.0, 128.0, 88.0, 53.0, 28.0, 22.0, 15.0, 12.0, 7.0, 9.0, 9.0, 3.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-43.03125, -41.894287109375, -40.75732421875, -39.620361328125, -38.4833984375, -37.346435546875, -36.20947265625, -35.072509765625, -33.935546875, -32.798583984375, -31.66162109375, -30.524658203125, -29.3876953125, -28.250732421875, -27.11376953125, -25.976806640625, -24.83984375, -23.702880859375, -22.56591796875, -21.428955078125, -20.2919921875, -19.155029296875, -18.01806640625, -16.881103515625, -15.744140625, -14.607177734375, -13.47021484375, -12.333251953125, -11.1962890625, -10.059326171875, -8.92236328125, -7.785400390625, -6.6484375, -5.511474609375, -4.37451171875, -3.237548828125, -2.1005859375, -0.963623046875, 0.17333984375, 1.310302734375, 2.447265625, 3.584228515625, 4.72119140625, 5.858154296875, 6.9951171875, 8.132080078125, 9.26904296875, 10.406005859375, 11.54296875, 12.679931640625, 13.81689453125, 14.953857421875, 16.0908203125, 17.227783203125, 18.36474609375, 19.501708984375, 20.638671875, 21.775634765625, 22.91259765625, 24.049560546875, 25.1865234375, 26.323486328125, 27.46044921875, 28.597412109375, 29.734375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 16.0, 20.0, 60.0, 117.0, 186.0, 218.0, 185.0, 119.0, 50.0, 27.0, 12.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-350.3811950683594, -343.4544372558594, -336.5276794433594, -329.6009216308594, -322.6741638183594, -315.7474060058594, -308.8206481933594, -301.8938903808594, -294.9671325683594, -288.0403747558594, -281.1136169433594, -274.1868591308594, -267.2601013183594, -260.3333435058594, -253.40658569335938, -246.47982788085938, -239.55307006835938, -232.62631225585938, -225.69955444335938, -218.77279663085938, -211.84603881835938, -204.91928100585938, -197.99252319335938, -191.06576538085938, -184.13900756835938, -177.21224975585938, -170.28549194335938, -163.35873413085938, -156.43197631835938, -149.50521850585938, -142.57846069335938, -135.65170288085938, -128.7249298095703, -121.79817199707031, -114.87141418457031, -107.94465637207031, -101.01789855957031, -94.09114074707031, -87.16438293457031, -80.23762512207031, -73.31086730957031, -66.38410949707031, -59.45735168457031, -52.53059387207031, -45.60383605957031, -38.67707824707031, -31.750320434570312, -24.823562622070312, -17.896804809570312, -10.970046997070312, -4.0432891845703125, 2.8834686279296875, 9.810226440429688, 16.736984252929688, 23.663742065429688, 30.590499877929688, 37.51725769042969, 44.44401550292969, 51.37077331542969, 58.29753112792969, 65.22428894042969, 72.15104675292969, 79.07780456542969, 86.00456237792969, 92.93132019042969]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 7.0, 13.0, 11.0, 11.0, 14.0, 12.0, 16.0, 16.0, 19.0, 22.0, 18.0, 33.0, 27.0, 36.0, 23.0, 34.0, 43.0, 31.0, 35.0, 40.0, 34.0, 37.0, 24.0, 27.0, 37.0, 42.0, 35.0, 32.0, 25.0, 30.0, 25.0, 18.0, 15.0, 16.0, 26.0, 19.0, 15.0, 15.0, 5.0, 12.0, 6.0, 2.0, 8.0, 4.0, 4.0, 5.0, 2.0, 0.0, 0.0, 5.0, 0.0, 2.0], "bins": [-49.65329360961914, -48.12528991699219, -46.597286224365234, -45.06928253173828, -43.541282653808594, -42.01327896118164, -40.48527526855469, -38.957271575927734, -37.42926788330078, -35.90126419067383, -34.373260498046875, -32.84526062011719, -31.3172550201416, -29.78925323486328, -28.261249542236328, -26.733245849609375, -25.205244064331055, -23.6772403717041, -22.14923858642578, -20.621234893798828, -19.093231201171875, -17.565227508544922, -16.0372257232666, -14.509222030639648, -12.981219291687012, -11.453216552734375, -9.925212860107422, -8.397210121154785, -6.86920690536499, -5.341203689575195, -3.8132009506225586, -2.2851972579956055, -0.7571945190429688, 0.7708085775375366, 2.298811674118042, 3.826814651489258, 5.354817867279053, 6.882821083068848, 8.410823822021484, 9.938827514648438, 11.466830253601074, 12.994832992553711, 14.522836685180664, 16.050838470458984, 17.578842163085938, 19.10684585571289, 20.634849548339844, 22.162853240966797, 23.690855026245117, 25.21885871887207, 26.74686050415039, 28.274864196777344, 29.802867889404297, 31.33087158203125, 32.85887145996094, 34.386878967285156, 35.914878845214844, 37.4428825378418, 38.97088623046875, 40.49888610839844, 42.02688980102539, 43.554893493652344, 45.0828971862793, 46.61090087890625, 48.1389045715332]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 6.0, 5.0, 4.0, 4.0, 3.0, 11.0, 10.0, 9.0, 10.0, 18.0, 16.0, 14.0, 27.0, 24.0, 19.0, 32.0, 25.0, 30.0, 25.0, 41.0, 32.0, 46.0, 38.0, 39.0, 58.0, 47.0, 35.0, 38.0, 29.0, 36.0, 41.0, 26.0, 25.0, 21.0, 22.0, 15.0, 23.0, 17.0, 13.0, 12.0, 13.0, 16.0, 4.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.88671875, -6.6641845703125, -6.441650390625, -6.2191162109375, -5.99658203125, -5.7740478515625, -5.551513671875, -5.3289794921875, -5.1064453125, -4.8839111328125, -4.661376953125, -4.4388427734375, -4.21630859375, -3.9937744140625, -3.771240234375, -3.5487060546875, -3.326171875, -3.1036376953125, -2.881103515625, -2.6585693359375, -2.43603515625, -2.2135009765625, -1.990966796875, -1.7684326171875, -1.5458984375, -1.3233642578125, -1.100830078125, -0.8782958984375, -0.65576171875, -0.4332275390625, -0.210693359375, 0.0118408203125, 0.234375, 0.4569091796875, 0.679443359375, 0.9019775390625, 1.12451171875, 1.3470458984375, 1.569580078125, 1.7921142578125, 2.0146484375, 2.2371826171875, 2.459716796875, 2.6822509765625, 2.90478515625, 3.1273193359375, 3.349853515625, 3.5723876953125, 3.794921875, 4.0174560546875, 4.239990234375, 4.4625244140625, 4.68505859375, 4.9075927734375, 5.130126953125, 5.3526611328125, 5.5751953125, 5.7977294921875, 6.020263671875, 6.2427978515625, 6.46533203125, 6.6878662109375, 6.910400390625, 7.1329345703125, 7.35546875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 11.0, 23.0, 14.0, 21.0, 43.0, 72.0, 113.0, 161.0, 260.0, 360.0, 562.0, 916.0, 1364.0, 2303.0, 3601.0, 5923.0, 10226.0, 16669.0, 29045.0, 51262.0, 89632.0, 156698.0, 233470.0, 186755.0, 110098.0, 62189.0, 35241.0, 20475.0, 12158.0, 7138.0, 4367.0, 2708.0, 1739.0, 1061.0, 622.0, 430.0, 301.0, 180.0, 116.0, 67.0, 45.0, 42.0, 23.0, 20.0, 13.0, 5.0, 7.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.2939453125, -1.2543487548828125, -1.214752197265625, -1.1751556396484375, -1.13555908203125, -1.0959625244140625, -1.056365966796875, -1.0167694091796875, -0.9771728515625, -0.9375762939453125, -0.897979736328125, -0.8583831787109375, -0.81878662109375, -0.7791900634765625, -0.739593505859375, -0.6999969482421875, -0.660400390625, -0.6208038330078125, -0.581207275390625, -0.5416107177734375, -0.50201416015625, -0.4624176025390625, -0.422821044921875, -0.3832244873046875, -0.3436279296875, -0.3040313720703125, -0.264434814453125, -0.2248382568359375, -0.18524169921875, -0.1456451416015625, -0.106048583984375, -0.0664520263671875, -0.02685546875, 0.0127410888671875, 0.052337646484375, 0.0919342041015625, 0.13153076171875, 0.1711273193359375, 0.210723876953125, 0.2503204345703125, 0.2899169921875, 0.3295135498046875, 0.369110107421875, 0.4087066650390625, 0.44830322265625, 0.4878997802734375, 0.527496337890625, 0.5670928955078125, 0.606689453125, 0.6462860107421875, 0.685882568359375, 0.7254791259765625, 0.76507568359375, 0.8046722412109375, 0.844268798828125, 0.8838653564453125, 0.9234619140625, 0.9630584716796875, 1.002655029296875, 1.0422515869140625, 1.08184814453125, 1.1214447021484375, 1.161041259765625, 1.2006378173828125, 1.240234375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 5.0, 8.0, 12.0, 13.0, 18.0, 18.0, 8.0, 24.0, 26.0, 24.0, 25.0, 27.0, 43.0, 33.0, 46.0, 39.0, 38.0, 41.0, 40.0, 1079.0, 55.0, 41.0, 38.0, 35.0, 29.0, 26.0, 24.0, 30.0, 23.0, 23.0, 31.0, 27.0, 20.0, 11.0, 12.0, 7.0, 9.0, 3.0, 3.0, 9.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.35546875, -5.18988037109375, -5.0242919921875, -4.85870361328125, -4.693115234375, -4.52752685546875, -4.3619384765625, -4.19635009765625, -4.03076171875, -3.86517333984375, -3.6995849609375, -3.53399658203125, -3.368408203125, -3.20281982421875, -3.0372314453125, -2.87164306640625, -2.7060546875, -2.54046630859375, -2.3748779296875, -2.20928955078125, -2.043701171875, -1.87811279296875, -1.7125244140625, -1.54693603515625, -1.38134765625, -1.21575927734375, -1.0501708984375, -0.88458251953125, -0.718994140625, -0.55340576171875, -0.3878173828125, -0.22222900390625, -0.056640625, 0.10894775390625, 0.2745361328125, 0.44012451171875, 0.605712890625, 0.77130126953125, 0.9368896484375, 1.10247802734375, 1.26806640625, 1.43365478515625, 1.5992431640625, 1.76483154296875, 1.930419921875, 2.09600830078125, 2.2615966796875, 2.42718505859375, 2.5927734375, 2.75836181640625, 2.9239501953125, 3.08953857421875, 3.255126953125, 3.42071533203125, 3.5863037109375, 3.75189208984375, 3.91748046875, 4.08306884765625, 4.2486572265625, 4.41424560546875, 4.579833984375, 4.74542236328125, 4.9110107421875, 5.07659912109375, 5.2421875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 10.0, 13.0, 18.0, 31.0, 58.0, 105.0, 131.0, 214.0, 312.0, 453.0, 769.0, 1224.0, 1943.0, 3241.0, 5067.0, 8537.0, 13896.0, 23334.0, 40332.0, 71627.0, 130888.0, 330645.0, 1102407.0, 158964.0, 85426.0, 47757.0, 27622.0, 16357.0, 9869.0, 5990.0, 3633.0, 2218.0, 1515.0, 916.0, 541.0, 357.0, 232.0, 159.0, 118.0, 64.0, 43.0, 33.0, 16.0, 10.0, 11.0, 9.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.46142578125, -0.4466133117675781, -0.43180084228515625, -0.4169883728027344, -0.4021759033203125, -0.3873634338378906, -0.37255096435546875, -0.3577384948730469, -0.342926025390625, -0.3281135559082031, -0.31330108642578125, -0.2984886169433594, -0.2836761474609375, -0.2688636779785156, -0.25405120849609375, -0.23923873901367188, -0.22442626953125, -0.20961380004882812, -0.19480133056640625, -0.17998886108398438, -0.1651763916015625, -0.15036392211914062, -0.13555145263671875, -0.12073898315429688, -0.105926513671875, -0.09111404418945312, -0.07630157470703125, -0.061489105224609375, -0.0466766357421875, -0.031864166259765625, -0.01705169677734375, -0.002239227294921875, 0.0125732421875, 0.027385711669921875, 0.04219818115234375, 0.057010650634765625, 0.0718231201171875, 0.08663558959960938, 0.10144805908203125, 0.11626052856445312, 0.131072998046875, 0.14588546752929688, 0.16069793701171875, 0.17551040649414062, 0.1903228759765625, 0.20513534545898438, 0.21994781494140625, 0.23476028442382812, 0.24957275390625, 0.2643852233886719, 0.27919769287109375, 0.2940101623535156, 0.3088226318359375, 0.3236351013183594, 0.33844757080078125, 0.3532600402832031, 0.368072509765625, 0.3828849792480469, 0.39769744873046875, 0.4125099182128906, 0.4273223876953125, 0.4421348571777344, 0.45694732666015625, 0.4717597961425781, 0.486572265625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 6.0, 4.0, 8.0, 10.0, 4.0, 12.0, 12.0, 25.0, 39.0, 95.0, 202.0, 250.0, 144.0, 65.0, 32.0, 17.0, 19.0, 10.0, 8.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32958984375, -0.3190498352050781, -0.30850982666015625, -0.2979698181152344, -0.2874298095703125, -0.2768898010253906, -0.26634979248046875, -0.2558097839355469, -0.245269775390625, -0.23472976684570312, -0.22418975830078125, -0.21364974975585938, -0.2031097412109375, -0.19256973266601562, -0.18202972412109375, -0.17148971557617188, -0.16094970703125, -0.15040969848632812, -0.13986968994140625, -0.12932968139648438, -0.1187896728515625, -0.10824966430664062, -0.09770965576171875, -0.08716964721679688, -0.076629638671875, -0.06608963012695312, -0.05554962158203125, -0.045009613037109375, -0.0344696044921875, -0.023929595947265625, -0.01338958740234375, -0.002849578857421875, 0.0076904296875, 0.018230438232421875, 0.02877044677734375, 0.039310455322265625, 0.0498504638671875, 0.060390472412109375, 0.07093048095703125, 0.08147048950195312, 0.092010498046875, 0.10255050659179688, 0.11309051513671875, 0.12363052368164062, 0.1341705322265625, 0.14471054077148438, 0.15525054931640625, 0.16579055786132812, 0.17633056640625, 0.18687057495117188, 0.19741058349609375, 0.20795059204101562, 0.2184906005859375, 0.22903060913085938, 0.23957061767578125, 0.2501106262207031, 0.260650634765625, 0.2711906433105469, 0.28173065185546875, 0.2922706604003906, 0.3028106689453125, 0.3133506774902344, 0.32389068603515625, 0.3344306945800781, 0.344970703125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 4.0, 4.0, 4.0, 8.0, 8.0, 25.0, 38.0, 52.0, 113.0, 293.0, 3302.0, 1019622.0, 24090.0, 634.0, 161.0, 75.0, 32.0, 22.0, 9.0, 16.0, 8.0, 5.0, 5.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.953125, -6.74066162109375, -6.5281982421875, -6.31573486328125, -6.103271484375, -5.89080810546875, -5.6783447265625, -5.46588134765625, -5.25341796875, -5.04095458984375, -4.8284912109375, -4.61602783203125, -4.403564453125, -4.19110107421875, -3.9786376953125, -3.76617431640625, -3.5537109375, -3.34124755859375, -3.1287841796875, -2.91632080078125, -2.703857421875, -2.49139404296875, -2.2789306640625, -2.06646728515625, -1.85400390625, -1.64154052734375, -1.4290771484375, -1.21661376953125, -1.004150390625, -0.79168701171875, -0.5792236328125, -0.36676025390625, -0.154296875, 0.05816650390625, 0.2706298828125, 0.48309326171875, 0.695556640625, 0.90802001953125, 1.1204833984375, 1.33294677734375, 1.54541015625, 1.75787353515625, 1.9703369140625, 2.18280029296875, 2.395263671875, 2.60772705078125, 2.8201904296875, 3.03265380859375, 3.2451171875, 3.45758056640625, 3.6700439453125, 3.88250732421875, 4.094970703125, 4.30743408203125, 4.5198974609375, 4.73236083984375, 4.94482421875, 5.15728759765625, 5.3697509765625, 5.58221435546875, 5.794677734375, 6.00714111328125, 6.2196044921875, 6.43206787109375, 6.64453125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 10.0, 3.0, 12.0, 18.0, 23.0, 43.0, 51.0, 94.0, 153.0, 261.0, 133.0, 67.0, 50.0, 25.0, 19.0, 16.0, 3.0, 10.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46889767050743103, -0.44180095195770264, -0.41470426321029663, -0.38760754466056824, -0.36051082611083984, -0.33341413736343384, -0.30631741881370544, -0.27922070026397705, -0.25212401151657104, -0.22502730786800385, -0.19793058931827545, -0.17083388566970825, -0.14373716711997986, -0.11664046347141266, -0.08954375982284546, -0.062447041273117065, -0.03535032272338867, -0.008253613486886024, 0.018843095749616623, 0.04593980312347412, 0.07303651422262192, 0.10013322532176971, 0.12722992897033691, 0.1543266475200653, 0.1814233511686325, 0.2085200548171997, 0.2356167733669281, 0.2627134919166565, 0.2898101806640625, 0.3169068992137909, 0.3440036177635193, 0.3711003065109253, 0.3981969952583313, 0.4252937138080597, 0.4523904025554657, 0.4794871211051941, 0.5065838098526001, 0.5336805582046509, 0.5607772469520569, 0.5878739356994629, 0.6149706840515137, 0.6420673727989197, 0.6691641211509705, 0.6962608098983765, 0.7233574986457825, 0.7504542469978333, 0.7775509357452393, 0.80464768409729, 0.8317443132400513, 0.8588410019874573, 0.8859377503395081, 0.9130344390869141, 0.9401311278343201, 0.9672278761863708, 0.9943245649337769, 1.0214213132858276, 1.0485180616378784, 1.0756148099899292, 1.1027114391326904, 1.1298081874847412, 1.156904935836792, 1.1840015649795532, 1.211098313331604, 1.2381950616836548, 1.265291690826416]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 6.0, 4.0, 8.0, 3.0, 5.0, 13.0, 12.0, 22.0, 16.0, 24.0, 20.0, 20.0, 27.0, 28.0, 26.0, 37.0, 33.0, 31.0, 36.0, 33.0, 42.0, 28.0, 47.0, 38.0, 32.0, 30.0, 35.0, 36.0, 36.0, 29.0, 38.0, 30.0, 25.0, 22.0, 17.0, 26.0, 16.0, 17.0, 10.0, 11.0, 2.0, 7.0, 10.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.49825114011764526, -0.482431024312973, -0.4666109085083008, -0.45079079270362854, -0.4349706768989563, -0.41915053129196167, -0.40333041548728943, -0.3875102996826172, -0.37169018387794495, -0.3558700680732727, -0.34004995226860046, -0.3242298364639282, -0.3084096908569336, -0.29258960485458374, -0.2767694592475891, -0.26094934344291687, -0.24512922763824463, -0.2293091118335724, -0.21348899602890015, -0.1976688653230667, -0.18184874951839447, -0.16602863371372223, -0.1502085030078888, -0.13438838720321655, -0.11856827139854431, -0.10274815559387207, -0.08692803233861923, -0.0711079090833664, -0.05528779327869415, -0.03946767747402191, -0.023647554218769073, -0.007827430963516235, 0.00799262523651123, 0.02381274476647377, 0.03963286429643631, 0.05545298382639885, 0.07127310335636139, 0.08709321916103363, 0.10291334241628647, 0.1187334656715393, 0.13455358147621155, 0.1503736972808838, 0.16619381308555603, 0.18201394379138947, 0.1978340595960617, 0.21365417540073395, 0.22947430610656738, 0.24529442191123962, 0.26111453771591187, 0.2769346535205841, 0.29275476932525635, 0.3085748851299286, 0.32439500093460083, 0.34021514654159546, 0.3560352623462677, 0.37185537815093994, 0.3876754939556122, 0.4034956097602844, 0.41931572556495667, 0.4351358413696289, 0.45095598697662354, 0.4667760729789734, 0.482596218585968, 0.49841633439064026, 0.5142364501953125]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 0.0, 1.0, 2.0, 6.0, 6.0, 3.0, 4.0, 3.0, 10.0, 11.0, 9.0, 11.0, 18.0, 17.0, 13.0, 26.0, 22.0, 20.0, 35.0, 24.0, 30.0, 25.0, 43.0, 30.0, 45.0, 39.0, 38.0, 60.0, 46.0, 36.0, 37.0, 27.0, 40.0, 36.0, 29.0, 25.0, 22.0, 19.0, 17.0, 24.0, 14.0, 16.0, 12.0, 12.0, 13.0, 6.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.8828125, -6.66033935546875, -6.4378662109375, -6.21539306640625, -5.992919921875, -5.77044677734375, -5.5479736328125, -5.32550048828125, -5.10302734375, -4.88055419921875, -4.6580810546875, -4.43560791015625, -4.213134765625, -3.99066162109375, -3.7681884765625, -3.54571533203125, -3.3232421875, -3.10076904296875, -2.8782958984375, -2.65582275390625, -2.433349609375, -2.21087646484375, -1.9884033203125, -1.76593017578125, -1.54345703125, -1.32098388671875, -1.0985107421875, -0.87603759765625, -0.653564453125, -0.43109130859375, -0.2086181640625, 0.01385498046875, 0.236328125, 0.45880126953125, 0.6812744140625, 0.90374755859375, 1.126220703125, 1.34869384765625, 1.5711669921875, 1.79364013671875, 2.01611328125, 2.23858642578125, 2.4610595703125, 2.68353271484375, 2.906005859375, 3.12847900390625, 3.3509521484375, 3.57342529296875, 3.7958984375, 4.01837158203125, 4.2408447265625, 4.46331787109375, 4.685791015625, 4.90826416015625, 5.1307373046875, 5.35321044921875, 5.57568359375, 5.79815673828125, 6.0206298828125, 6.24310302734375, 6.465576171875, 6.68804931640625, 6.9105224609375, 7.13299560546875, 7.35546875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 6.0, 18.0, 16.0, 25.0, 22.0, 46.0, 58.0, 73.0, 65.0, 125.0, 192.0, 278.0, 452.0, 792.0, 1186.0, 2073.0, 4030.0, 8511.0, 21281.0, 60377.0, 211630.0, 491411.0, 163690.0, 48788.0, 17533.0, 7357.0, 3586.0, 1852.0, 1088.0, 672.0, 423.0, 260.0, 177.0, 120.0, 94.0, 66.0, 48.0, 36.0, 24.0, 13.0, 16.0, 13.0, 10.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.5, -12.1142578125, -11.728515625, -11.3427734375, -10.95703125, -10.5712890625, -10.185546875, -9.7998046875, -9.4140625, -9.0283203125, -8.642578125, -8.2568359375, -7.87109375, -7.4853515625, -7.099609375, -6.7138671875, -6.328125, -5.9423828125, -5.556640625, -5.1708984375, -4.78515625, -4.3994140625, -4.013671875, -3.6279296875, -3.2421875, -2.8564453125, -2.470703125, -2.0849609375, -1.69921875, -1.3134765625, -0.927734375, -0.5419921875, -0.15625, 0.2294921875, 0.615234375, 1.0009765625, 1.38671875, 1.7724609375, 2.158203125, 2.5439453125, 2.9296875, 3.3154296875, 3.701171875, 4.0869140625, 4.47265625, 4.8583984375, 5.244140625, 5.6298828125, 6.015625, 6.4013671875, 6.787109375, 7.1728515625, 7.55859375, 7.9443359375, 8.330078125, 8.7158203125, 9.1015625, 9.4873046875, 9.873046875, 10.2587890625, 10.64453125, 11.0302734375, 11.416015625, 11.8017578125, 12.1875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 6.0, 13.0, 6.0, 9.0, 20.0, 14.0, 23.0, 24.0, 22.0, 30.0, 37.0, 37.0, 32.0, 49.0, 66.0, 91.0, 112.0, 252.0, 1458.0, 193.0, 110.0, 72.0, 49.0, 47.0, 38.0, 32.0, 31.0, 31.0, 24.0, 20.0, 14.0, 18.0, 7.0, 5.0, 15.0, 6.0, 3.0, 9.0, 6.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.0625, -21.3369140625, -20.611328125, -19.8857421875, -19.16015625, -18.4345703125, -17.708984375, -16.9833984375, -16.2578125, -15.5322265625, -14.806640625, -14.0810546875, -13.35546875, -12.6298828125, -11.904296875, -11.1787109375, -10.453125, -9.7275390625, -9.001953125, -8.2763671875, -7.55078125, -6.8251953125, -6.099609375, -5.3740234375, -4.6484375, -3.9228515625, -3.197265625, -2.4716796875, -1.74609375, -1.0205078125, -0.294921875, 0.4306640625, 1.15625, 1.8818359375, 2.607421875, 3.3330078125, 4.05859375, 4.7841796875, 5.509765625, 6.2353515625, 6.9609375, 7.6865234375, 8.412109375, 9.1376953125, 9.86328125, 10.5888671875, 11.314453125, 12.0400390625, 12.765625, 13.4912109375, 14.216796875, 14.9423828125, 15.66796875, 16.3935546875, 17.119140625, 17.8447265625, 18.5703125, 19.2958984375, 20.021484375, 20.7470703125, 21.47265625, 22.1982421875, 22.923828125, 23.6494140625, 24.375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 8.0, 5.0, 11.0, 12.0, 8.0, 10.0, 22.0, 21.0, 25.0, 47.0, 67.0, 86.0, 97.0, 133.0, 244.0, 371.0, 865.0, 3165.0, 31580.0, 2427450.0, 661957.0, 15676.0, 2129.0, 649.0, 326.0, 192.0, 126.0, 104.0, 84.0, 43.0, 45.0, 42.0, 26.0, 19.0, 12.0, 14.0, 9.0, 9.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-49.1875, -47.7353515625, -46.283203125, -44.8310546875, -43.37890625, -41.9267578125, -40.474609375, -39.0224609375, -37.5703125, -36.1181640625, -34.666015625, -33.2138671875, -31.76171875, -30.3095703125, -28.857421875, -27.4052734375, -25.953125, -24.5009765625, -23.048828125, -21.5966796875, -20.14453125, -18.6923828125, -17.240234375, -15.7880859375, -14.3359375, -12.8837890625, -11.431640625, -9.9794921875, -8.52734375, -7.0751953125, -5.623046875, -4.1708984375, -2.71875, -1.2666015625, 0.185546875, 1.6376953125, 3.08984375, 4.5419921875, 5.994140625, 7.4462890625, 8.8984375, 10.3505859375, 11.802734375, 13.2548828125, 14.70703125, 16.1591796875, 17.611328125, 19.0634765625, 20.515625, 21.9677734375, 23.419921875, 24.8720703125, 26.32421875, 27.7763671875, 29.228515625, 30.6806640625, 32.1328125, 33.5849609375, 35.037109375, 36.4892578125, 37.94140625, 39.3935546875, 40.845703125, 42.2978515625, 43.75]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 8.0, 174.0, 607.0, 211.0, 18.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.11866760253906, -30.5842342376709, -22.049800872802734, -13.51536750793457, -4.980934143066406, 3.553497314453125, 12.087932586669922, 20.62236785888672, 29.15679931640625, 37.69123077392578, 46.22566604614258, 54.760101318359375, 63.294532775878906, 71.82896423339844, 80.3634033203125, 88.89783477783203, 97.43226623535156, 105.9666976928711, 114.50112915039062, 123.03556823730469, 131.57000732421875, 140.10443115234375, 148.6388702392578, 157.17330932617188, 165.70773315429688, 174.24217224121094, 182.77659606933594, 191.31103515625, 199.845458984375, 208.37989807128906, 216.91433715820312, 225.44876098632812, 233.98318481445312, 242.5176239013672, 251.0520477294922, 259.58648681640625, 268.12091064453125, 276.65533447265625, 285.1897888183594, 293.7242126464844, 302.2586669921875, 310.7930908203125, 319.3275451660156, 327.8619689941406, 336.3963928222656, 344.93084716796875, 353.46527099609375, 361.99969482421875, 370.53411865234375, 379.06854248046875, 387.6029968261719, 396.1374206542969, 404.6718444824219, 413.206298828125, 421.74072265625, 430.275146484375, 438.8095703125, 447.343994140625, 455.8784484863281, 464.4128723144531, 472.9472961425781, 481.48175048828125, 490.01617431640625, 498.55059814453125, 507.0850524902344]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 12.0, 4.0, 10.0, 17.0, 9.0, 11.0, 15.0, 23.0, 33.0, 15.0, 33.0, 45.0, 33.0, 53.0, 48.0, 63.0, 46.0, 34.0, 63.0, 48.0, 49.0, 34.0, 35.0, 34.0, 37.0, 26.0, 24.0, 26.0, 31.0, 18.0, 9.0, 12.0, 14.0, 7.0, 6.0, 3.0, 8.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-70.59678649902344, -68.30347442626953, -66.01016235351562, -63.71685028076172, -61.42353820800781, -59.130226135253906, -56.8369140625, -54.543601989746094, -52.25028991699219, -49.95697784423828, -47.663665771484375, -45.37035369873047, -43.07704162597656, -40.783729553222656, -38.49041748046875, -36.197105407714844, -33.90379333496094, -31.61048126220703, -29.317169189453125, -27.02385711669922, -24.730545043945312, -22.437232971191406, -20.1439208984375, -17.850608825683594, -15.557296752929688, -13.263984680175781, -10.970672607421875, -8.677360534667969, -6.3840484619140625, -4.090736389160156, -1.79742431640625, 0.49588775634765625, 2.7891998291015625, 5.082511901855469, 7.375823974609375, 9.669136047363281, 11.962448120117188, 14.255760192871094, 16.549072265625, 18.842384338378906, 21.135696411132812, 23.42900848388672, 25.722320556640625, 28.01563262939453, 30.308944702148438, 32.602256774902344, 34.89556884765625, 37.188880920410156, 39.48219299316406, 41.77550506591797, 44.068817138671875, 46.36212921142578, 48.65544128417969, 50.948753356933594, 53.2420654296875, 55.535377502441406, 57.82868957519531, 60.12200164794922, 62.415313720703125, 64.70862579345703, 67.00193786621094, 69.29524993896484, 71.58856201171875, 73.88187408447266, 76.17518615722656]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 3.0, 2.0, 4.0, 7.0, 7.0, 7.0, 11.0, 13.0, 14.0, 19.0, 15.0, 18.0, 19.0, 25.0, 28.0, 26.0, 31.0, 40.0, 26.0, 34.0, 37.0, 49.0, 34.0, 32.0, 42.0, 34.0, 52.0, 34.0, 47.0, 37.0, 36.0, 25.0, 28.0, 17.0, 27.0, 20.0, 19.0, 10.0, 16.0, 11.0, 6.0, 8.0, 9.0, 3.0, 9.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.16796875, -6.93243408203125, -6.6968994140625, -6.46136474609375, -6.225830078125, -5.99029541015625, -5.7547607421875, -5.51922607421875, -5.28369140625, -5.04815673828125, -4.8126220703125, -4.57708740234375, -4.341552734375, -4.10601806640625, -3.8704833984375, -3.63494873046875, -3.3994140625, -3.16387939453125, -2.9283447265625, -2.69281005859375, -2.457275390625, -2.22174072265625, -1.9862060546875, -1.75067138671875, -1.51513671875, -1.27960205078125, -1.0440673828125, -0.80853271484375, -0.572998046875, -0.33746337890625, -0.1019287109375, 0.13360595703125, 0.369140625, 0.60467529296875, 0.8402099609375, 1.07574462890625, 1.311279296875, 1.54681396484375, 1.7823486328125, 2.01788330078125, 2.25341796875, 2.48895263671875, 2.7244873046875, 2.96002197265625, 3.195556640625, 3.43109130859375, 3.6666259765625, 3.90216064453125, 4.1376953125, 4.37322998046875, 4.6087646484375, 4.84429931640625, 5.079833984375, 5.31536865234375, 5.5509033203125, 5.78643798828125, 6.02197265625, 6.25750732421875, 6.4930419921875, 6.72857666015625, 6.964111328125, 7.19964599609375, 7.4351806640625, 7.67071533203125, 7.90625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 5.0, 2.0, 6.0, 11.0, 18.0, 25.0, 28.0, 22.0, 44.0, 53.0, 85.0, 129.0, 143.0, 227.0, 369.0, 688.0, 1365.0, 2728.0, 6163.0, 15734.0, 50149.0, 334028.0, 2812325.0, 849183.0, 83306.0, 22224.0, 7920.0, 3452.0, 1621.0, 850.0, 457.0, 273.0, 197.0, 115.0, 96.0, 58.0, 40.0, 38.0, 29.0, 19.0, 19.0, 10.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-25.15625, -24.38623046875, -23.6162109375, -22.84619140625, -22.076171875, -21.30615234375, -20.5361328125, -19.76611328125, -18.99609375, -18.22607421875, -17.4560546875, -16.68603515625, -15.916015625, -15.14599609375, -14.3759765625, -13.60595703125, -12.8359375, -12.06591796875, -11.2958984375, -10.52587890625, -9.755859375, -8.98583984375, -8.2158203125, -7.44580078125, -6.67578125, -5.90576171875, -5.1357421875, -4.36572265625, -3.595703125, -2.82568359375, -2.0556640625, -1.28564453125, -0.515625, 0.25439453125, 1.0244140625, 1.79443359375, 2.564453125, 3.33447265625, 4.1044921875, 4.87451171875, 5.64453125, 6.41455078125, 7.1845703125, 7.95458984375, 8.724609375, 9.49462890625, 10.2646484375, 11.03466796875, 11.8046875, 12.57470703125, 13.3447265625, 14.11474609375, 14.884765625, 15.65478515625, 16.4248046875, 17.19482421875, 17.96484375, 18.73486328125, 19.5048828125, 20.27490234375, 21.044921875, 21.81494140625, 22.5849609375, 23.35498046875, 24.125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 0.0, 2.0, 5.0, 6.0, 4.0, 2.0, 8.0, 12.0, 23.0, 13.0, 33.0, 33.0, 35.0, 42.0, 68.0, 97.0, 130.0, 164.0, 220.0, 298.0, 360.0, 449.0, 479.0, 372.0, 311.0, 233.0, 157.0, 119.0, 82.0, 72.0, 66.0, 44.0, 36.0, 18.0, 9.0, 20.0, 18.0, 4.0, 4.0, 3.0, 6.0, 1.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.7109375, -15.2215576171875, -14.732177734375, -14.2427978515625, -13.75341796875, -13.2640380859375, -12.774658203125, -12.2852783203125, -11.7958984375, -11.3065185546875, -10.817138671875, -10.3277587890625, -9.83837890625, -9.3489990234375, -8.859619140625, -8.3702392578125, -7.880859375, -7.3914794921875, -6.902099609375, -6.4127197265625, -5.92333984375, -5.4339599609375, -4.944580078125, -4.4552001953125, -3.9658203125, -3.4764404296875, -2.987060546875, -2.4976806640625, -2.00830078125, -1.5189208984375, -1.029541015625, -0.5401611328125, -0.05078125, 0.4385986328125, 0.927978515625, 1.4173583984375, 1.90673828125, 2.3961181640625, 2.885498046875, 3.3748779296875, 3.8642578125, 4.3536376953125, 4.843017578125, 5.3323974609375, 5.82177734375, 6.3111572265625, 6.800537109375, 7.2899169921875, 7.779296875, 8.2686767578125, 8.758056640625, 9.2474365234375, 9.73681640625, 10.2261962890625, 10.715576171875, 11.2049560546875, 11.6943359375, 12.1837158203125, 12.673095703125, 13.1624755859375, 13.65185546875, 14.1412353515625, 14.630615234375, 15.1199951171875, 15.609375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 7.0, 0.0, 8.0, 7.0, 10.0, 16.0, 19.0, 32.0, 31.0, 43.0, 79.0, 125.0, 201.0, 388.0, 1114.0, 3262.0, 12975.0, 74027.0, 1460138.0, 2510265.0, 108209.0, 16825.0, 3966.0, 1343.0, 510.0, 247.0, 128.0, 85.0, 60.0, 43.0, 28.0, 24.0, 22.0, 14.0, 8.0, 8.0, 1.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.46875, -42.99072265625, -41.5126953125, -40.03466796875, -38.556640625, -37.07861328125, -35.6005859375, -34.12255859375, -32.64453125, -31.16650390625, -29.6884765625, -28.21044921875, -26.732421875, -25.25439453125, -23.7763671875, -22.29833984375, -20.8203125, -19.34228515625, -17.8642578125, -16.38623046875, -14.908203125, -13.43017578125, -11.9521484375, -10.47412109375, -8.99609375, -7.51806640625, -6.0400390625, -4.56201171875, -3.083984375, -1.60595703125, -0.1279296875, 1.35009765625, 2.828125, 4.30615234375, 5.7841796875, 7.26220703125, 8.740234375, 10.21826171875, 11.6962890625, 13.17431640625, 14.65234375, 16.13037109375, 17.6083984375, 19.08642578125, 20.564453125, 22.04248046875, 23.5205078125, 24.99853515625, 26.4765625, 27.95458984375, 29.4326171875, 30.91064453125, 32.388671875, 33.86669921875, 35.3447265625, 36.82275390625, 38.30078125, 39.77880859375, 41.2568359375, 42.73486328125, 44.212890625, 45.69091796875, 47.1689453125, 48.64697265625, 50.125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 8.0, 32.0, 43.0, 97.0, 165.0, 235.0, 181.0, 136.0, 60.0, 31.0, 13.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.46383666992188, -134.3179473876953, -128.1720733642578, -122.02618408203125, -115.88031005859375, -109.73442077636719, -103.58853912353516, -97.44265747070312, -91.2967758178711, -85.15089416503906, -79.00501251220703, -72.859130859375, -66.71324157714844, -60.56736373901367, -54.421478271484375, -48.275596618652344, -42.12971496582031, -35.98383331298828, -29.837949752807617, -23.692066192626953, -17.546184539794922, -11.40030288696289, -5.254417419433594, 0.8914642333984375, 7.037345886230469, 13.183228492736816, 19.329111099243164, 25.474994659423828, 31.62087631225586, 37.76675796508789, 43.91264343261719, 50.05852508544922, 56.20440673828125, 62.35028839111328, 68.49617004394531, 74.64205932617188, 80.78793334960938, 86.93382263183594, 93.07970428466797, 99.2255859375, 105.37146759033203, 111.51734924316406, 117.6632308959961, 123.80911254882812, 129.9550018310547, 136.1008758544922, 142.24676513671875, 148.39263916015625, 154.5385284423828, 160.68441772460938, 166.83029174804688, 172.97618103027344, 179.12205505371094, 185.2679443359375, 191.413818359375, 197.55970764160156, 203.70559692382812, 209.8514862060547, 215.9973602294922, 222.14324951171875, 228.28912353515625, 234.4350128173828, 240.58090209960938, 246.72677612304688, 252.87265014648438]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 10.0, 9.0, 7.0, 11.0, 9.0, 15.0, 21.0, 16.0, 23.0, 25.0, 16.0, 32.0, 31.0, 31.0, 34.0, 46.0, 45.0, 44.0, 39.0, 36.0, 41.0, 31.0, 37.0, 46.0, 44.0, 39.0, 33.0, 34.0, 34.0, 27.0, 22.0, 20.0, 13.0, 20.0, 12.0, 11.0, 11.0, 3.0, 12.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.09138870239258, -53.208168029785156, -51.324951171875, -49.44173049926758, -47.558509826660156, -45.67529296875, -43.79207229614258, -41.908851623535156, -40.025634765625, -38.14241409301758, -36.25919723510742, -34.3759765625, -32.492759704589844, -30.609539031982422, -28.726318359375, -26.84309959411621, -24.959880828857422, -23.076662063598633, -21.193443298339844, -19.310222625732422, -17.427003860473633, -15.543785095214844, -13.660565376281738, -11.777345657348633, -9.894126892089844, -8.010908126831055, -6.127688407897949, -4.244469165802002, -2.3612499237060547, -0.4780311584472656, 1.4051885604858398, 3.2884082794189453, 5.171630859375, 7.054850101470947, 8.938069343566895, 10.8212890625, 12.704507827758789, 14.587726593017578, 16.470947265625, 18.35416603088379, 20.237384796142578, 22.120603561401367, 24.003822326660156, 25.887042999267578, 27.770261764526367, 29.653480529785156, 31.536701202392578, 33.419921875, 35.303138732910156, 37.18635940551758, 39.069576263427734, 40.952796936035156, 42.83601379394531, 44.719234466552734, 46.602455139160156, 48.48567199707031, 50.368892669677734, 52.252113342285156, 54.13533020019531, 56.018550872802734, 57.901771545410156, 59.78498840332031, 61.668209075927734, 63.551429748535156, 65.43464660644531]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 8.0, 2.0, 4.0, 8.0, 4.0, 10.0, 14.0, 12.0, 18.0, 21.0, 20.0, 25.0, 21.0, 33.0, 46.0, 33.0, 41.0, 42.0, 29.0, 47.0, 39.0, 43.0, 32.0, 50.0, 41.0, 41.0, 47.0, 37.0, 27.0, 19.0, 25.0, 22.0, 23.0, 25.0, 12.0, 17.0, 12.0, 11.0, 7.0, 5.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.80859375, -7.56024169921875, -7.3118896484375, -7.06353759765625, -6.815185546875, -6.56683349609375, -6.3184814453125, -6.07012939453125, -5.82177734375, -5.57342529296875, -5.3250732421875, -5.07672119140625, -4.828369140625, -4.58001708984375, -4.3316650390625, -4.08331298828125, -3.8349609375, -3.58660888671875, -3.3382568359375, -3.08990478515625, -2.841552734375, -2.59320068359375, -2.3448486328125, -2.09649658203125, -1.84814453125, -1.59979248046875, -1.3514404296875, -1.10308837890625, -0.854736328125, -0.60638427734375, -0.3580322265625, -0.10968017578125, 0.138671875, 0.38702392578125, 0.6353759765625, 0.88372802734375, 1.132080078125, 1.38043212890625, 1.6287841796875, 1.87713623046875, 2.12548828125, 2.37384033203125, 2.6221923828125, 2.87054443359375, 3.118896484375, 3.36724853515625, 3.6156005859375, 3.86395263671875, 4.1123046875, 4.36065673828125, 4.6090087890625, 4.85736083984375, 5.105712890625, 5.35406494140625, 5.6024169921875, 5.85076904296875, 6.09912109375, 6.34747314453125, 6.5958251953125, 6.84417724609375, 7.092529296875, 7.34088134765625, 7.5892333984375, 7.83758544921875, 8.0859375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 6.0, 16.0, 20.0, 17.0, 34.0, 40.0, 65.0, 78.0, 101.0, 150.0, 257.0, 389.0, 517.0, 826.0, 1211.0, 1954.0, 3114.0, 5175.0, 8936.0, 15673.0, 28551.0, 53169.0, 103358.0, 203164.0, 277766.0, 162869.0, 82427.0, 43086.0, 23057.0, 12986.0, 7425.0, 4373.0, 2768.0, 1709.0, 1050.0, 708.0, 465.0, 291.0, 239.0, 142.0, 125.0, 68.0, 55.0, 36.0, 22.0, 21.0, 14.0, 8.0, 9.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6708984375, -1.615814208984375, -1.56072998046875, -1.505645751953125, -1.4505615234375, -1.395477294921875, -1.34039306640625, -1.285308837890625, -1.230224609375, -1.175140380859375, -1.12005615234375, -1.064971923828125, -1.0098876953125, -0.954803466796875, -0.89971923828125, -0.844635009765625, -0.78955078125, -0.734466552734375, -0.67938232421875, -0.624298095703125, -0.5692138671875, -0.514129638671875, -0.45904541015625, -0.403961181640625, -0.348876953125, -0.293792724609375, -0.23870849609375, -0.183624267578125, -0.1285400390625, -0.073455810546875, -0.01837158203125, 0.036712646484375, 0.091796875, 0.146881103515625, 0.20196533203125, 0.257049560546875, 0.3121337890625, 0.367218017578125, 0.42230224609375, 0.477386474609375, 0.532470703125, 0.587554931640625, 0.64263916015625, 0.697723388671875, 0.7528076171875, 0.807891845703125, 0.86297607421875, 0.918060302734375, 0.97314453125, 1.028228759765625, 1.08331298828125, 1.138397216796875, 1.1934814453125, 1.248565673828125, 1.30364990234375, 1.358734130859375, 1.413818359375, 1.468902587890625, 1.52398681640625, 1.579071044921875, 1.6341552734375, 1.689239501953125, 1.74432373046875, 1.799407958984375, 1.8544921875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 7.0, 10.0, 6.0, 5.0, 7.0, 9.0, 7.0, 10.0, 21.0, 23.0, 30.0, 22.0, 23.0, 26.0, 29.0, 35.0, 33.0, 34.0, 36.0, 32.0, 37.0, 37.0, 1072.0, 46.0, 46.0, 45.0, 40.0, 26.0, 38.0, 30.0, 33.0, 22.0, 31.0, 25.0, 16.0, 12.0, 10.0, 11.0, 5.0, 11.0, 6.0, 5.0, 6.0, 2.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.29296875, -5.12322998046875, -4.9534912109375, -4.78375244140625, -4.614013671875, -4.44427490234375, -4.2745361328125, -4.10479736328125, -3.93505859375, -3.76531982421875, -3.5955810546875, -3.42584228515625, -3.256103515625, -3.08636474609375, -2.9166259765625, -2.74688720703125, -2.5771484375, -2.40740966796875, -2.2376708984375, -2.06793212890625, -1.898193359375, -1.72845458984375, -1.5587158203125, -1.38897705078125, -1.21923828125, -1.04949951171875, -0.8797607421875, -0.71002197265625, -0.540283203125, -0.37054443359375, -0.2008056640625, -0.03106689453125, 0.138671875, 0.30841064453125, 0.4781494140625, 0.64788818359375, 0.817626953125, 0.98736572265625, 1.1571044921875, 1.32684326171875, 1.49658203125, 1.66632080078125, 1.8360595703125, 2.00579833984375, 2.175537109375, 2.34527587890625, 2.5150146484375, 2.68475341796875, 2.8544921875, 3.02423095703125, 3.1939697265625, 3.36370849609375, 3.533447265625, 3.70318603515625, 3.8729248046875, 4.04266357421875, 4.21240234375, 4.38214111328125, 4.5518798828125, 4.72161865234375, 4.891357421875, 5.06109619140625, 5.2308349609375, 5.40057373046875, 5.5703125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 7.0, 11.0, 16.0, 12.0, 22.0, 35.0, 44.0, 55.0, 100.0, 130.0, 168.0, 273.0, 453.0, 711.0, 1291.0, 2264.0, 4302.0, 8222.0, 17175.0, 36059.0, 82595.0, 209549.0, 1301861.0, 254898.0, 95655.0, 41717.0, 19165.0, 9419.0, 4679.0, 2567.0, 1415.0, 837.0, 481.0, 318.0, 205.0, 115.0, 97.0, 58.0, 40.0, 34.0, 17.0, 18.0, 16.0, 9.0, 9.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7744140625, -0.7482376098632812, -0.7220611572265625, -0.6958847045898438, -0.669708251953125, -0.6435317993164062, -0.6173553466796875, -0.5911788940429688, -0.56500244140625, -0.5388259887695312, -0.5126495361328125, -0.48647308349609375, -0.460296630859375, -0.43412017822265625, -0.4079437255859375, -0.38176727294921875, -0.3555908203125, -0.32941436767578125, -0.3032379150390625, -0.27706146240234375, -0.250885009765625, -0.22470855712890625, -0.1985321044921875, -0.17235565185546875, -0.14617919921875, -0.12000274658203125, -0.0938262939453125, -0.06764984130859375, -0.041473388671875, -0.01529693603515625, 0.0108795166015625, 0.03705596923828125, 0.063232421875, 0.08940887451171875, 0.1155853271484375, 0.14176177978515625, 0.167938232421875, 0.19411468505859375, 0.2202911376953125, 0.24646759033203125, 0.27264404296875, 0.29882049560546875, 0.3249969482421875, 0.35117340087890625, 0.377349853515625, 0.40352630615234375, 0.4297027587890625, 0.45587921142578125, 0.4820556640625, 0.5082321166992188, 0.5344085693359375, 0.5605850219726562, 0.586761474609375, 0.6129379272460938, 0.6391143798828125, 0.6652908325195312, 0.69146728515625, 0.7176437377929688, 0.7438201904296875, 0.7699966430664062, 0.796173095703125, 0.8223495483398438, 0.8485260009765625, 0.8747024536132812, 0.90087890625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 6.0, 4.0, 3.0, 8.0, 5.0, 13.0, 15.0, 12.0, 14.0, 25.0, 34.0, 43.0, 42.0, 47.0, 49.0, 69.0, 69.0, 60.0, 65.0, 73.0, 51.0, 43.0, 39.0, 37.0, 35.0, 24.0, 22.0, 13.0, 13.0, 14.0, 14.0, 11.0, 6.0, 7.0, 3.0, 1.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.285400390625, -0.27634429931640625, -0.2672882080078125, -0.25823211669921875, -0.249176025390625, -0.24011993408203125, -0.2310638427734375, -0.22200775146484375, -0.21295166015625, -0.20389556884765625, -0.1948394775390625, -0.18578338623046875, -0.176727294921875, -0.16767120361328125, -0.1586151123046875, -0.14955902099609375, -0.1405029296875, -0.13144683837890625, -0.1223907470703125, -0.11333465576171875, -0.104278564453125, -0.09522247314453125, -0.0861663818359375, -0.07711029052734375, -0.06805419921875, -0.05899810791015625, -0.0499420166015625, -0.04088592529296875, -0.031829833984375, -0.02277374267578125, -0.0137176513671875, -0.00466156005859375, 0.00439453125, 0.01345062255859375, 0.0225067138671875, 0.03156280517578125, 0.040618896484375, 0.04967498779296875, 0.0587310791015625, 0.06778717041015625, 0.07684326171875, 0.08589935302734375, 0.0949554443359375, 0.10401153564453125, 0.113067626953125, 0.12212371826171875, 0.1311798095703125, 0.14023590087890625, 0.1492919921875, 0.15834808349609375, 0.1674041748046875, 0.17646026611328125, 0.185516357421875, 0.19457244873046875, 0.2036285400390625, 0.21268463134765625, 0.22174072265625, 0.23079681396484375, 0.2398529052734375, 0.24890899658203125, 0.257965087890625, 0.26702117919921875, 0.2760772705078125, 0.28513336181640625, 0.294189453125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 7.0, 3.0, 13.0, 8.0, 12.0, 13.0, 14.0, 18.0, 26.0, 26.0, 40.0, 49.0, 58.0, 145.0, 222.0, 718.0, 12454.0, 1023245.0, 10162.0, 674.0, 244.0, 95.0, 88.0, 58.0, 32.0, 30.0, 16.0, 13.0, 17.0, 9.0, 9.0, 6.0, 5.0, 4.0, 7.0, 0.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.22265625, -6.03106689453125, -5.8394775390625, -5.64788818359375, -5.456298828125, -5.26470947265625, -5.0731201171875, -4.88153076171875, -4.68994140625, -4.49835205078125, -4.3067626953125, -4.11517333984375, -3.923583984375, -3.73199462890625, -3.5404052734375, -3.34881591796875, -3.1572265625, -2.96563720703125, -2.7740478515625, -2.58245849609375, -2.390869140625, -2.19927978515625, -2.0076904296875, -1.81610107421875, -1.62451171875, -1.43292236328125, -1.2413330078125, -1.04974365234375, -0.858154296875, -0.66656494140625, -0.4749755859375, -0.28338623046875, -0.091796875, 0.09979248046875, 0.2913818359375, 0.48297119140625, 0.674560546875, 0.86614990234375, 1.0577392578125, 1.24932861328125, 1.44091796875, 1.63250732421875, 1.8240966796875, 2.01568603515625, 2.207275390625, 2.39886474609375, 2.5904541015625, 2.78204345703125, 2.9736328125, 3.16522216796875, 3.3568115234375, 3.54840087890625, 3.739990234375, 3.93157958984375, 4.1231689453125, 4.31475830078125, 4.50634765625, 4.69793701171875, 4.8895263671875, 5.08111572265625, 5.272705078125, 5.46429443359375, 5.6558837890625, 5.84747314453125, 6.0390625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 10.0, 13.0, 14.0, 21.0, 41.0, 64.0, 107.0, 318.0, 202.0, 89.0, 54.0, 29.0, 18.0, 11.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.952785313129425, -0.9020622968673706, -0.8513392806053162, -0.8006162643432617, -0.7498931884765625, -0.6991701722145081, -0.6484471559524536, -0.5977240800857544, -0.5470011234283447, -0.4962781071662903, -0.44555506110191345, -0.394832044839859, -0.3441089987754822, -0.29338598251342773, -0.2426629662513733, -0.19193992018699646, -0.14121687412261963, -0.09049384295940399, -0.03977081924676895, 0.010952204465866089, 0.061675235629081726, 0.11239826679229736, 0.1631212830543518, 0.21384432911872864, 0.2645673453807831, 0.3152903616428375, 0.36601340770721436, 0.4167364239692688, 0.46745944023132324, 0.5181825160980225, 0.5689054727554321, 0.6196285486221313, 0.6703516244888306, 0.721074640750885, 0.7717976570129395, 0.8225207328796387, 0.8732437491416931, 0.9239667654037476, 0.974689781665802, 1.0254127979278564, 1.0761358737945557, 1.1268589496612549, 1.1775819063186646, 1.2283049821853638, 1.2790279388427734, 1.3297510147094727, 1.3804740905761719, 1.4311970472335815, 1.4819200038909912, 1.5326430797576904, 1.5833660364151, 1.6340891122817993, 1.684812068939209, 1.7355351448059082, 1.7862582206726074, 1.836981177330017, 1.8877042531967163, 1.9384273290634155, 1.9891502857208252, 2.0398733615875244, 2.0905964374542236, 2.1413192749023438, 2.192042350769043, 2.242765426635742, 2.2934885025024414]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 1.0, 4.0, 4.0, 3.0, 4.0, 10.0, 9.0, 12.0, 13.0, 16.0, 17.0, 21.0, 19.0, 24.0, 33.0, 36.0, 20.0, 26.0, 43.0, 30.0, 32.0, 52.0, 45.0, 43.0, 36.0, 32.0, 33.0, 44.0, 42.0, 28.0, 21.0, 31.0, 25.0, 34.0, 26.0, 24.0, 17.0, 15.0, 12.0, 16.0, 10.0, 6.0, 5.0, 9.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.0562572479248047, -1.022892713546753, -0.9895281791687012, -0.9561636447906494, -0.9227991104125977, -0.8894345760345459, -0.8560700416564941, -0.8227055072784424, -0.7893409729003906, -0.7559764385223389, -0.7226119041442871, -0.6892473697662354, -0.6558828353881836, -0.6225183010101318, -0.5891537666320801, -0.5557892322540283, -0.5224246978759766, -0.4890601634979248, -0.45569562911987305, -0.4223310947418213, -0.38896656036376953, -0.3556020259857178, -0.322237491607666, -0.28887295722961426, -0.2555084228515625, -0.22214388847351074, -0.18877935409545898, -0.15541481971740723, -0.12205028533935547, -0.08868575096130371, -0.05532121658325195, -0.021956682205200195, 0.011407971382141113, 0.04477250576019287, 0.07813704013824463, 0.11150157451629639, 0.14486610889434814, 0.1782306432723999, 0.21159517765045166, 0.24495971202850342, 0.2783242464065552, 0.31168878078460693, 0.3450533151626587, 0.37841784954071045, 0.4117823839187622, 0.44514691829681396, 0.4785114526748657, 0.5118759870529175, 0.5452405214309692, 0.578605055809021, 0.6119695901870728, 0.6453341245651245, 0.6786986589431763, 0.712063193321228, 0.7454277276992798, 0.7787922620773315, 0.8121567964553833, 0.8455213308334351, 0.8788858652114868, 0.9122503995895386, 0.9456149339675903, 0.9789794683456421, 1.0123440027236938, 1.0457085371017456, 1.0790730714797974]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 7.0, 2.0, 4.0, 7.0, 4.0, 12.0, 14.0, 13.0, 15.0, 20.0, 19.0, 24.0, 24.0, 38.0, 46.0, 29.0, 40.0, 42.0, 32.0, 45.0, 41.0, 39.0, 36.0, 50.0, 34.0, 49.0, 45.0, 34.0, 28.0, 20.0, 24.0, 23.0, 22.0, 28.0, 11.0, 17.0, 14.0, 9.0, 7.0, 4.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.81640625, -7.56781005859375, -7.3192138671875, -7.07061767578125, -6.822021484375, -6.57342529296875, -6.3248291015625, -6.07623291015625, -5.82763671875, -5.57904052734375, -5.3304443359375, -5.08184814453125, -4.833251953125, -4.58465576171875, -4.3360595703125, -4.08746337890625, -3.8388671875, -3.59027099609375, -3.3416748046875, -3.09307861328125, -2.844482421875, -2.59588623046875, -2.3472900390625, -2.09869384765625, -1.85009765625, -1.60150146484375, -1.3529052734375, -1.10430908203125, -0.855712890625, -0.60711669921875, -0.3585205078125, -0.10992431640625, 0.138671875, 0.38726806640625, 0.6358642578125, 0.88446044921875, 1.133056640625, 1.38165283203125, 1.6302490234375, 1.87884521484375, 2.12744140625, 2.37603759765625, 2.6246337890625, 2.87322998046875, 3.121826171875, 3.37042236328125, 3.6190185546875, 3.86761474609375, 4.1162109375, 4.36480712890625, 4.6134033203125, 4.86199951171875, 5.110595703125, 5.35919189453125, 5.6077880859375, 5.85638427734375, 6.10498046875, 6.35357666015625, 6.6021728515625, 6.85076904296875, 7.099365234375, 7.34796142578125, 7.5965576171875, 7.84515380859375, 8.09375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 2.0, 6.0, 10.0, 13.0, 19.0, 28.0, 19.0, 35.0, 65.0, 106.0, 120.0, 193.0, 274.0, 414.0, 628.0, 917.0, 1368.0, 1967.0, 3028.0, 4728.0, 7569.0, 14324.0, 34908.0, 113320.0, 409832.0, 313302.0, 82763.0, 27094.0, 12121.0, 6802.0, 4211.0, 2748.0, 1746.0, 1222.0, 824.0, 541.0, 355.0, 320.0, 203.0, 140.0, 86.0, 54.0, 35.0, 33.0, 22.0, 9.0, 8.0, 8.0, 4.0, 3.0, 5.0, 1.0, 4.0, 3.0], "bins": [-12.734375, -12.3692626953125, -12.004150390625, -11.6390380859375, -11.27392578125, -10.9088134765625, -10.543701171875, -10.1785888671875, -9.8134765625, -9.4483642578125, -9.083251953125, -8.7181396484375, -8.35302734375, -7.9879150390625, -7.622802734375, -7.2576904296875, -6.892578125, -6.5274658203125, -6.162353515625, -5.7972412109375, -5.43212890625, -5.0670166015625, -4.701904296875, -4.3367919921875, -3.9716796875, -3.6065673828125, -3.241455078125, -2.8763427734375, -2.51123046875, -2.1461181640625, -1.781005859375, -1.4158935546875, -1.05078125, -0.6856689453125, -0.320556640625, 0.0445556640625, 0.40966796875, 0.7747802734375, 1.139892578125, 1.5050048828125, 1.8701171875, 2.2352294921875, 2.600341796875, 2.9654541015625, 3.33056640625, 3.6956787109375, 4.060791015625, 4.4259033203125, 4.791015625, 5.1561279296875, 5.521240234375, 5.8863525390625, 6.25146484375, 6.6165771484375, 6.981689453125, 7.3468017578125, 7.7119140625, 8.0770263671875, 8.442138671875, 8.8072509765625, 9.17236328125, 9.5374755859375, 9.902587890625, 10.2677001953125, 10.6328125]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 8.0, 6.0, 8.0, 8.0, 6.0, 9.0, 20.0, 19.0, 13.0, 26.0, 30.0, 28.0, 37.0, 34.0, 46.0, 48.0, 44.0, 75.0, 118.0, 268.0, 1455.0, 202.0, 119.0, 62.0, 49.0, 44.0, 27.0, 33.0, 28.0, 37.0, 18.0, 17.0, 26.0, 20.0, 11.0, 16.0, 10.0, 9.0, 4.0, 6.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.40625, -19.66064453125, -18.9150390625, -18.16943359375, -17.423828125, -16.67822265625, -15.9326171875, -15.18701171875, -14.44140625, -13.69580078125, -12.9501953125, -12.20458984375, -11.458984375, -10.71337890625, -9.9677734375, -9.22216796875, -8.4765625, -7.73095703125, -6.9853515625, -6.23974609375, -5.494140625, -4.74853515625, -4.0029296875, -3.25732421875, -2.51171875, -1.76611328125, -1.0205078125, -0.27490234375, 0.470703125, 1.21630859375, 1.9619140625, 2.70751953125, 3.453125, 4.19873046875, 4.9443359375, 5.68994140625, 6.435546875, 7.18115234375, 7.9267578125, 8.67236328125, 9.41796875, 10.16357421875, 10.9091796875, 11.65478515625, 12.400390625, 13.14599609375, 13.8916015625, 14.63720703125, 15.3828125, 16.12841796875, 16.8740234375, 17.61962890625, 18.365234375, 19.11083984375, 19.8564453125, 20.60205078125, 21.34765625, 22.09326171875, 22.8388671875, 23.58447265625, 24.330078125, 25.07568359375, 25.8212890625, 26.56689453125, 27.3125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 7.0, 12.0, 18.0, 19.0, 18.0, 23.0, 39.0, 39.0, 51.0, 53.0, 90.0, 77.0, 125.0, 177.0, 290.0, 584.0, 1315.0, 4007.0, 15841.0, 239784.0, 2805786.0, 63055.0, 9270.0, 2602.0, 941.0, 437.0, 292.0, 155.0, 125.0, 93.0, 80.0, 65.0, 45.0, 38.0, 37.0, 19.0, 14.0, 12.0, 12.0, 14.0, 7.0, 9.0, 1.0, 8.0, 4.0, 1.0, 1.0, 1.0, 5.0], "bins": [-46.15625, -44.849609375, -43.54296875, -42.236328125, -40.9296875, -39.623046875, -38.31640625, -37.009765625, -35.703125, -34.396484375, -33.08984375, -31.783203125, -30.4765625, -29.169921875, -27.86328125, -26.556640625, -25.25, -23.943359375, -22.63671875, -21.330078125, -20.0234375, -18.716796875, -17.41015625, -16.103515625, -14.796875, -13.490234375, -12.18359375, -10.876953125, -9.5703125, -8.263671875, -6.95703125, -5.650390625, -4.34375, -3.037109375, -1.73046875, -0.423828125, 0.8828125, 2.189453125, 3.49609375, 4.802734375, 6.109375, 7.416015625, 8.72265625, 10.029296875, 11.3359375, 12.642578125, 13.94921875, 15.255859375, 16.5625, 17.869140625, 19.17578125, 20.482421875, 21.7890625, 23.095703125, 24.40234375, 25.708984375, 27.015625, 28.322265625, 29.62890625, 30.935546875, 32.2421875, 33.548828125, 34.85546875, 36.162109375, 37.46875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 16.0, 53.0, 114.0, 211.0, 286.0, 195.0, 79.0, 32.0, 11.0, 9.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.54403686523438, -80.15449523925781, -75.76495361328125, -71.37541961669922, -66.98587799072266, -62.596336364746094, -58.2067985534668, -53.8172607421875, -49.42771911621094, -45.038177490234375, -40.64863967895508, -36.25910186767578, -31.86956024169922, -27.48002052307129, -23.09048080444336, -18.70094108581543, -14.3114013671875, -9.92186164855957, -5.532321929931641, -1.142782211303711, 3.2467575073242188, 7.636297225952148, 12.025836944580078, 16.415376663208008, 20.804916381835938, 25.194456100463867, 29.583995819091797, 33.973533630371094, 38.363075256347656, 42.75261688232422, 47.142154693603516, 51.53169250488281, 55.92121887207031, 60.310760498046875, 64.70030212402344, 69.08983612060547, 73.47937774658203, 77.8689193725586, 82.25845336914062, 86.64799499511719, 91.03753662109375, 95.42707824707031, 99.81661987304688, 104.2061538696289, 108.59569549560547, 112.98523712158203, 117.37477111816406, 121.76431274414062, 126.15385437011719, 130.54339599609375, 134.9329376220703, 139.32247924804688, 143.71200561523438, 148.10154724121094, 152.4910888671875, 156.88063049316406, 161.27017211914062, 165.6597137451172, 170.04925537109375, 174.4387969970703, 178.82833862304688, 183.21786499023438, 187.60740661621094, 191.9969482421875, 196.38648986816406]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 10.0, 7.0, 18.0, 10.0, 15.0, 17.0, 13.0, 22.0, 33.0, 29.0, 36.0, 28.0, 26.0, 37.0, 34.0, 36.0, 48.0, 49.0, 41.0, 42.0, 43.0, 42.0, 33.0, 31.0, 21.0, 38.0, 20.0, 27.0, 30.0, 16.0, 23.0, 17.0, 17.0, 11.0, 10.0, 17.0, 10.0, 4.0, 10.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0], "bins": [-60.20482635498047, -58.35892105102539, -56.51301956176758, -54.6671142578125, -52.82121276855469, -50.97530746459961, -49.12940216064453, -47.28350067138672, -45.437599182128906, -43.59169387817383, -41.745792388916016, -39.89988708496094, -38.053985595703125, -36.20808029174805, -34.36217498779297, -32.516273498535156, -30.670368194580078, -28.824464797973633, -26.978561401367188, -25.13265609741211, -23.286754608154297, -21.44084930419922, -19.594945907592773, -17.749042510986328, -15.903139114379883, -14.057235717773438, -12.211332321166992, -10.36542797088623, -8.519524574279785, -6.67362117767334, -4.827716827392578, -2.981813430786133, -1.1359062194824219, 0.7099974155426025, 2.555901050567627, 4.4018049240112305, 6.247708320617676, 8.093611717224121, 9.939516067504883, 11.785419464111328, 13.631322860717773, 15.477226257324219, 17.323129653930664, 19.16903305053711, 21.014938354492188, 22.86083984375, 24.706745147705078, 26.552648544311523, 28.39855194091797, 30.244455337524414, 32.09035873413086, 33.93626403808594, 35.78216552734375, 37.62807083129883, 39.473976135253906, 41.31987762451172, 43.16577911376953, 45.01168441772461, 46.85758590698242, 48.7034912109375, 50.54939270019531, 52.39529800415039, 54.24120330810547, 56.08710479736328, 57.93301010131836]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 0.0, 5.0, 4.0, 5.0, 12.0, 13.0, 17.0, 19.0, 19.0, 19.0, 29.0, 29.0, 31.0, 26.0, 31.0, 45.0, 30.0, 45.0, 41.0, 50.0, 50.0, 39.0, 46.0, 37.0, 41.0, 37.0, 39.0, 29.0, 26.0, 29.0, 29.0, 12.0, 26.0, 13.0, 12.0, 13.0, 14.0, 6.0, 6.0, 8.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.859375, -7.5936279296875, -7.327880859375, -7.0621337890625, -6.79638671875, -6.5306396484375, -6.264892578125, -5.9991455078125, -5.7333984375, -5.4676513671875, -5.201904296875, -4.9361572265625, -4.67041015625, -4.4046630859375, -4.138916015625, -3.8731689453125, -3.607421875, -3.3416748046875, -3.075927734375, -2.8101806640625, -2.54443359375, -2.2786865234375, -2.012939453125, -1.7471923828125, -1.4814453125, -1.2156982421875, -0.949951171875, -0.6842041015625, -0.41845703125, -0.1527099609375, 0.113037109375, 0.3787841796875, 0.64453125, 0.9102783203125, 1.176025390625, 1.4417724609375, 1.70751953125, 1.9732666015625, 2.239013671875, 2.5047607421875, 2.7705078125, 3.0362548828125, 3.302001953125, 3.5677490234375, 3.83349609375, 4.0992431640625, 4.364990234375, 4.6307373046875, 4.896484375, 5.1622314453125, 5.427978515625, 5.6937255859375, 5.95947265625, 6.2252197265625, 6.490966796875, 6.7567138671875, 7.0224609375, 7.2882080078125, 7.553955078125, 7.8197021484375, 8.08544921875, 8.3511962890625, 8.616943359375, 8.8826904296875, 9.1484375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 0.0, 4.0, 11.0, 11.0, 10.0, 14.0, 20.0, 26.0, 44.0, 69.0, 102.0, 174.0, 279.0, 408.0, 696.0, 1143.0, 1938.0, 3376.0, 6796.0, 13694.0, 34530.0, 142730.0, 1195093.0, 2348130.0, 347264.0, 58401.0, 19882.0, 8825.0, 4589.0, 2362.0, 1327.0, 829.0, 499.0, 323.0, 221.0, 149.0, 120.0, 55.0, 34.0, 27.0, 25.0, 13.0, 16.0, 6.0, 4.0, 2.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-21.6875, -21.03466796875, -20.3818359375, -19.72900390625, -19.076171875, -18.42333984375, -17.7705078125, -17.11767578125, -16.46484375, -15.81201171875, -15.1591796875, -14.50634765625, -13.853515625, -13.20068359375, -12.5478515625, -11.89501953125, -11.2421875, -10.58935546875, -9.9365234375, -9.28369140625, -8.630859375, -7.97802734375, -7.3251953125, -6.67236328125, -6.01953125, -5.36669921875, -4.7138671875, -4.06103515625, -3.408203125, -2.75537109375, -2.1025390625, -1.44970703125, -0.796875, -0.14404296875, 0.5087890625, 1.16162109375, 1.814453125, 2.46728515625, 3.1201171875, 3.77294921875, 4.42578125, 5.07861328125, 5.7314453125, 6.38427734375, 7.037109375, 7.68994140625, 8.3427734375, 8.99560546875, 9.6484375, 10.30126953125, 10.9541015625, 11.60693359375, 12.259765625, 12.91259765625, 13.5654296875, 14.21826171875, 14.87109375, 15.52392578125, 16.1767578125, 16.82958984375, 17.482421875, 18.13525390625, 18.7880859375, 19.44091796875, 20.09375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 6.0, 16.0, 17.0, 27.0, 41.0, 35.0, 67.0, 106.0, 141.0, 200.0, 338.0, 436.0, 595.0, 568.0, 459.0, 301.0, 207.0, 125.0, 107.0, 67.0, 71.0, 35.0, 24.0, 19.0, 19.0, 12.0, 6.0, 8.0, 3.0, 4.0, 6.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.09375, -19.467529296875, -18.84130859375, -18.215087890625, -17.5888671875, -16.962646484375, -16.33642578125, -15.710205078125, -15.083984375, -14.457763671875, -13.83154296875, -13.205322265625, -12.5791015625, -11.952880859375, -11.32666015625, -10.700439453125, -10.07421875, -9.447998046875, -8.82177734375, -8.195556640625, -7.5693359375, -6.943115234375, -6.31689453125, -5.690673828125, -5.064453125, -4.438232421875, -3.81201171875, -3.185791015625, -2.5595703125, -1.933349609375, -1.30712890625, -0.680908203125, -0.0546875, 0.571533203125, 1.19775390625, 1.823974609375, 2.4501953125, 3.076416015625, 3.70263671875, 4.328857421875, 4.955078125, 5.581298828125, 6.20751953125, 6.833740234375, 7.4599609375, 8.086181640625, 8.71240234375, 9.338623046875, 9.96484375, 10.591064453125, 11.21728515625, 11.843505859375, 12.4697265625, 13.095947265625, 13.72216796875, 14.348388671875, 14.974609375, 15.600830078125, 16.22705078125, 16.853271484375, 17.4794921875, 18.105712890625, 18.73193359375, 19.358154296875, 19.984375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 7.0, 8.0, 8.0, 8.0, 14.0, 22.0, 28.0, 42.0, 55.0, 87.0, 132.0, 201.0, 414.0, 948.0, 2947.0, 13223.0, 95301.0, 2655049.0, 1352741.0, 59433.0, 9533.0, 2429.0, 842.0, 347.0, 172.0, 84.0, 66.0, 49.0, 35.0, 19.0, 17.0, 6.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.6875, -47.05908203125, -45.4306640625, -43.80224609375, -42.173828125, -40.54541015625, -38.9169921875, -37.28857421875, -35.66015625, -34.03173828125, -32.4033203125, -30.77490234375, -29.146484375, -27.51806640625, -25.8896484375, -24.26123046875, -22.6328125, -21.00439453125, -19.3759765625, -17.74755859375, -16.119140625, -14.49072265625, -12.8623046875, -11.23388671875, -9.60546875, -7.97705078125, -6.3486328125, -4.72021484375, -3.091796875, -1.46337890625, 0.1650390625, 1.79345703125, 3.421875, 5.05029296875, 6.6787109375, 8.30712890625, 9.935546875, 11.56396484375, 13.1923828125, 14.82080078125, 16.44921875, 18.07763671875, 19.7060546875, 21.33447265625, 22.962890625, 24.59130859375, 26.2197265625, 27.84814453125, 29.4765625, 31.10498046875, 32.7333984375, 34.36181640625, 35.990234375, 37.61865234375, 39.2470703125, 40.87548828125, 42.50390625, 44.13232421875, 45.7607421875, 47.38916015625, 49.017578125, 50.64599609375, 52.2744140625, 53.90283203125, 55.53125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 5.0, 14.0, 21.0, 23.0, 41.0, 63.0, 69.0, 88.0, 101.0, 120.0, 109.0, 87.0, 76.0, 61.0, 47.0, 30.0, 25.0, 9.0, 3.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-153.76983642578125, -150.536376953125, -147.3029022216797, -144.06944274902344, -140.8359832763672, -137.60250854492188, -134.36904907226562, -131.13558959960938, -127.9021224975586, -124.66865539550781, -121.43519592285156, -118.20172882080078, -114.96826171875, -111.73480224609375, -108.50133514404297, -105.26786804199219, -102.03440856933594, -98.80094146728516, -95.5674819946289, -92.33401489257812, -89.10054779052734, -85.8670883178711, -82.63362121582031, -79.40016174316406, -76.16668701171875, -72.93321990966797, -69.69976043701172, -66.46629333496094, -63.23283004760742, -59.999366760253906, -56.765899658203125, -53.53243637084961, -50.29896926879883, -47.06550598144531, -43.83203887939453, -40.598575592041016, -37.3651123046875, -34.13164520263672, -30.898181915283203, -27.664718627929688, -24.43125343322754, -21.19778823852539, -17.964324951171875, -14.730859756469727, -11.497395515441895, -8.263931274414062, -5.030466079711914, -1.7970027923583984, 1.43646240234375, 4.669926643371582, 7.903391361236572, 11.136856079101562, 14.370320320129395, 17.603784561157227, 20.837249755859375, 24.07071304321289, 27.30417823791504, 30.537643432617188, 33.7711067199707, 37.00457000732422, 40.238037109375, 43.471500396728516, 46.70496368408203, 49.93843078613281, 53.17189407348633]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 5.0, 5.0, 6.0, 9.0, 12.0, 12.0, 13.0, 8.0, 24.0, 27.0, 29.0, 30.0, 24.0, 41.0, 50.0, 36.0, 42.0, 36.0, 45.0, 53.0, 41.0, 46.0, 39.0, 38.0, 53.0, 33.0, 29.0, 44.0, 23.0, 20.0, 19.0, 20.0, 15.0, 9.0, 13.0, 11.0, 11.0, 8.0, 7.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.703155517578125, -57.82478332519531, -55.9464111328125, -54.06803894042969, -52.18966293334961, -50.3112907409668, -48.432918548583984, -46.55454635620117, -44.676170349121094, -42.79779815673828, -40.91942596435547, -39.041053771972656, -37.16267776489258, -35.284305572509766, -33.40593338012695, -31.52756118774414, -29.649188995361328, -27.770816802978516, -25.89244270324707, -24.014070510864258, -22.135696411132812, -20.25732421875, -18.378952026367188, -16.500579833984375, -14.62220573425293, -12.7438325881958, -10.865459442138672, -8.98708724975586, -7.1087141036987305, -5.230340957641602, -3.351968765258789, -1.4735956192016602, 0.40477752685546875, 2.2831504344940186, 4.161523342132568, 6.039896011352539, 7.918269157409668, 9.796642303466797, 11.67501449584961, 13.553387641906738, 15.431760787963867, 17.31013298034668, 19.188507080078125, 21.066879272460938, 22.94525146484375, 24.823625564575195, 26.701997756958008, 28.580371856689453, 30.458744049072266, 32.33711624145508, 34.21548843383789, 36.09386444091797, 37.97223663330078, 39.850608825683594, 41.728981018066406, 43.60735321044922, 45.48572540283203, 47.364097595214844, 49.242469787597656, 51.12084197998047, 52.99921798706055, 54.87759017944336, 56.75596237182617, 58.634334564208984, 60.51271057128906]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 3.0, 5.0, 8.0, 6.0, 13.0, 18.0, 21.0, 26.0, 25.0, 28.0, 33.0, 37.0, 44.0, 45.0, 50.0, 48.0, 56.0, 44.0, 65.0, 43.0, 46.0, 43.0, 45.0, 43.0, 25.0, 39.0, 26.0, 21.0, 22.0, 13.0, 17.0, 8.0, 11.0, 6.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.4375, -10.127685546875, -9.81787109375, -9.508056640625, -9.1982421875, -8.888427734375, -8.57861328125, -8.268798828125, -7.958984375, -7.649169921875, -7.33935546875, -7.029541015625, -6.7197265625, -6.409912109375, -6.10009765625, -5.790283203125, -5.48046875, -5.170654296875, -4.86083984375, -4.551025390625, -4.2412109375, -3.931396484375, -3.62158203125, -3.311767578125, -3.001953125, -2.692138671875, -2.38232421875, -2.072509765625, -1.7626953125, -1.452880859375, -1.14306640625, -0.833251953125, -0.5234375, -0.213623046875, 0.09619140625, 0.406005859375, 0.7158203125, 1.025634765625, 1.33544921875, 1.645263671875, 1.955078125, 2.264892578125, 2.57470703125, 2.884521484375, 3.1943359375, 3.504150390625, 3.81396484375, 4.123779296875, 4.43359375, 4.743408203125, 5.05322265625, 5.363037109375, 5.6728515625, 5.982666015625, 6.29248046875, 6.602294921875, 6.912109375, 7.221923828125, 7.53173828125, 7.841552734375, 8.1513671875, 8.461181640625, 8.77099609375, 9.080810546875, 9.390625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 8.0, 11.0, 12.0, 23.0, 28.0, 22.0, 65.0, 80.0, 131.0, 185.0, 266.0, 384.0, 591.0, 904.0, 1342.0, 2119.0, 3272.0, 5164.0, 8351.0, 13747.0, 23096.0, 39105.0, 69868.0, 129304.0, 227152.0, 225959.0, 128819.0, 69782.0, 39316.0, 22710.0, 13970.0, 8137.0, 5352.0, 3119.0, 2085.0, 1380.0, 871.0, 594.0, 401.0, 297.0, 167.0, 112.0, 75.0, 66.0, 46.0, 18.0, 15.0, 11.0, 9.0, 9.0, 2.0, 3.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5390625, -1.489410400390625, -1.43975830078125, -1.390106201171875, -1.3404541015625, -1.290802001953125, -1.24114990234375, -1.191497802734375, -1.141845703125, -1.092193603515625, -1.04254150390625, -0.992889404296875, -0.9432373046875, -0.893585205078125, -0.84393310546875, -0.794281005859375, -0.74462890625, -0.694976806640625, -0.64532470703125, -0.595672607421875, -0.5460205078125, -0.496368408203125, -0.44671630859375, -0.397064208984375, -0.347412109375, -0.297760009765625, -0.24810791015625, -0.198455810546875, -0.1488037109375, -0.099151611328125, -0.04949951171875, 0.000152587890625, 0.0498046875, 0.099456787109375, 0.14910888671875, 0.198760986328125, 0.2484130859375, 0.298065185546875, 0.34771728515625, 0.397369384765625, 0.447021484375, 0.496673583984375, 0.54632568359375, 0.595977783203125, 0.6456298828125, 0.695281982421875, 0.74493408203125, 0.794586181640625, 0.84423828125, 0.893890380859375, 0.94354248046875, 0.993194580078125, 1.0428466796875, 1.092498779296875, 1.14215087890625, 1.191802978515625, 1.241455078125, 1.291107177734375, 1.34075927734375, 1.390411376953125, 1.4400634765625, 1.489715576171875, 1.53936767578125, 1.589019775390625, 1.638671875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 1.0, 4.0, 5.0, 6.0, 5.0, 9.0, 8.0, 7.0, 13.0, 17.0, 13.0, 18.0, 23.0, 19.0, 29.0, 22.0, 29.0, 28.0, 19.0, 34.0, 29.0, 26.0, 42.0, 34.0, 32.0, 1066.0, 31.0, 34.0, 40.0, 29.0, 40.0, 33.0, 35.0, 20.0, 27.0, 19.0, 19.0, 21.0, 24.0, 22.0, 12.0, 14.0, 10.0, 7.0, 15.0, 9.0, 4.0, 1.0, 7.0, 8.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.94921875, -4.7955322265625, -4.641845703125, -4.4881591796875, -4.33447265625, -4.1807861328125, -4.027099609375, -3.8734130859375, -3.7197265625, -3.5660400390625, -3.412353515625, -3.2586669921875, -3.10498046875, -2.9512939453125, -2.797607421875, -2.6439208984375, -2.490234375, -2.3365478515625, -2.182861328125, -2.0291748046875, -1.87548828125, -1.7218017578125, -1.568115234375, -1.4144287109375, -1.2607421875, -1.1070556640625, -0.953369140625, -0.7996826171875, -0.64599609375, -0.4923095703125, -0.338623046875, -0.1849365234375, -0.03125, 0.1224365234375, 0.276123046875, 0.4298095703125, 0.58349609375, 0.7371826171875, 0.890869140625, 1.0445556640625, 1.1982421875, 1.3519287109375, 1.505615234375, 1.6593017578125, 1.81298828125, 1.9666748046875, 2.120361328125, 2.2740478515625, 2.427734375, 2.5814208984375, 2.735107421875, 2.8887939453125, 3.04248046875, 3.1961669921875, 3.349853515625, 3.5035400390625, 3.6572265625, 3.8109130859375, 3.964599609375, 4.1182861328125, 4.27197265625, 4.4256591796875, 4.579345703125, 4.7330322265625, 4.88671875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 6.0, 13.0, 12.0, 25.0, 28.0, 35.0, 58.0, 80.0, 94.0, 162.0, 215.0, 359.0, 538.0, 796.0, 1253.0, 2115.0, 3586.0, 5862.0, 10379.0, 18242.0, 31921.0, 59784.0, 115272.0, 282390.0, 1203654.0, 173383.0, 83964.0, 44630.0, 24330.0, 13676.0, 7933.0, 4759.0, 2837.0, 1667.0, 1076.0, 653.0, 410.0, 282.0, 176.0, 138.0, 97.0, 75.0, 46.0, 31.0, 31.0, 20.0, 14.0, 10.0, 3.0, 5.0, 4.0, 2.0, 1.0], "bins": [-0.7724609375, -0.7505569458007812, -0.7286529541015625, -0.7067489624023438, -0.684844970703125, -0.6629409790039062, -0.6410369873046875, -0.6191329956054688, -0.59722900390625, -0.5753250122070312, -0.5534210205078125, -0.5315170288085938, -0.509613037109375, -0.48770904541015625, -0.4658050537109375, -0.44390106201171875, -0.4219970703125, -0.40009307861328125, -0.3781890869140625, -0.35628509521484375, -0.334381103515625, -0.31247711181640625, -0.2905731201171875, -0.26866912841796875, -0.24676513671875, -0.22486114501953125, -0.2029571533203125, -0.18105316162109375, -0.159149169921875, -0.13724517822265625, -0.1153411865234375, -0.09343719482421875, -0.071533203125, -0.04962921142578125, -0.0277252197265625, -0.00582122802734375, 0.016082763671875, 0.03798675537109375, 0.0598907470703125, 0.08179473876953125, 0.10369873046875, 0.12560272216796875, 0.1475067138671875, 0.16941070556640625, 0.191314697265625, 0.21321868896484375, 0.2351226806640625, 0.25702667236328125, 0.2789306640625, 0.30083465576171875, 0.3227386474609375, 0.34464263916015625, 0.366546630859375, 0.38845062255859375, 0.4103546142578125, 0.43225860595703125, 0.45416259765625, 0.47606658935546875, 0.4979705810546875, 0.5198745727539062, 0.541778564453125, 0.5636825561523438, 0.5855865478515625, 0.6074905395507812, 0.62939453125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 5.0, 6.0, 1.0, 9.0, 6.0, 6.0, 1.0, 7.0, 8.0, 7.0, 4.0, 9.0, 8.0, 13.0, 19.0, 20.0, 15.0, 25.0, 27.0, 43.0, 60.0, 87.0, 125.0, 112.0, 83.0, 68.0, 53.0, 23.0, 21.0, 15.0, 15.0, 15.0, 8.0, 7.0, 9.0, 8.0, 6.0, 6.0, 9.0, 6.0, 7.0, 5.0, 3.0, 4.0, 7.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.314453125, -0.3046417236328125, -0.294830322265625, -0.2850189208984375, -0.27520751953125, -0.2653961181640625, -0.255584716796875, -0.2457733154296875, -0.2359619140625, -0.2261505126953125, -0.216339111328125, -0.2065277099609375, -0.19671630859375, -0.1869049072265625, -0.177093505859375, -0.1672821044921875, -0.157470703125, -0.1476593017578125, -0.137847900390625, -0.1280364990234375, -0.11822509765625, -0.1084136962890625, -0.098602294921875, -0.0887908935546875, -0.0789794921875, -0.0691680908203125, -0.059356689453125, -0.0495452880859375, -0.03973388671875, -0.0299224853515625, -0.020111083984375, -0.0102996826171875, -0.00048828125, 0.0093231201171875, 0.019134521484375, 0.0289459228515625, 0.03875732421875, 0.0485687255859375, 0.058380126953125, 0.0681915283203125, 0.0780029296875, 0.0878143310546875, 0.097625732421875, 0.1074371337890625, 0.11724853515625, 0.1270599365234375, 0.136871337890625, 0.1466827392578125, 0.156494140625, 0.1663055419921875, 0.176116943359375, 0.1859283447265625, 0.19573974609375, 0.2055511474609375, 0.215362548828125, 0.2251739501953125, 0.2349853515625, 0.2447967529296875, 0.254608154296875, 0.2644195556640625, 0.27423095703125, 0.2840423583984375, 0.293853759765625, 0.3036651611328125, 0.3134765625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 3.0, 3.0, 7.0, 6.0, 6.0, 11.0, 4.0, 10.0, 9.0, 9.0, 7.0, 20.0, 20.0, 31.0, 42.0, 77.0, 159.0, 355.0, 1369.0, 59918.0, 979217.0, 6137.0, 549.0, 221.0, 105.0, 49.0, 43.0, 35.0, 22.0, 15.0, 10.0, 11.0, 5.0, 6.0, 8.0, 7.0, 3.0, 4.0, 6.0, 6.0, 5.0, 5.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.87109375, -6.6578369140625, -6.444580078125, -6.2313232421875, -6.01806640625, -5.8048095703125, -5.591552734375, -5.3782958984375, -5.1650390625, -4.9517822265625, -4.738525390625, -4.5252685546875, -4.31201171875, -4.0987548828125, -3.885498046875, -3.6722412109375, -3.458984375, -3.2457275390625, -3.032470703125, -2.8192138671875, -2.60595703125, -2.3927001953125, -2.179443359375, -1.9661865234375, -1.7529296875, -1.5396728515625, -1.326416015625, -1.1131591796875, -0.89990234375, -0.6866455078125, -0.473388671875, -0.2601318359375, -0.046875, 0.1663818359375, 0.379638671875, 0.5928955078125, 0.80615234375, 1.0194091796875, 1.232666015625, 1.4459228515625, 1.6591796875, 1.8724365234375, 2.085693359375, 2.2989501953125, 2.51220703125, 2.7254638671875, 2.938720703125, 3.1519775390625, 3.365234375, 3.5784912109375, 3.791748046875, 4.0050048828125, 4.21826171875, 4.4315185546875, 4.644775390625, 4.8580322265625, 5.0712890625, 5.2845458984375, 5.497802734375, 5.7110595703125, 5.92431640625, 6.1375732421875, 6.350830078125, 6.5640869140625, 6.77734375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 5.0, 17.0, 29.0, 39.0, 67.0, 110.0, 323.0, 202.0, 85.0, 46.0, 39.0, 12.0, 10.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5964094400405884, -1.5320537090301514, -1.4676979780197144, -1.4033422470092773, -1.3389865159988403, -1.2746307849884033, -1.2102750539779663, -1.1459193229675293, -1.0815635919570923, -1.0172078609466553, -0.9528521299362183, -0.8884963989257812, -0.8241406679153442, -0.7597849369049072, -0.6954292058944702, -0.6310734748840332, -0.5667177438735962, -0.5023620128631592, -0.43800628185272217, -0.37365055084228516, -0.30929481983184814, -0.24493908882141113, -0.18058335781097412, -0.11622762680053711, -0.0518718957901001, 0.012483835220336914, 0.07683956623077393, 0.14119529724121094, 0.20555102825164795, 0.26990675926208496, 0.334262490272522, 0.398618221282959, 0.46297383308410645, 0.5273295640945435, 0.5916852951049805, 0.6560410261154175, 0.7203967571258545, 0.7847524881362915, 0.8491082191467285, 0.9134639501571655, 0.9778196811676025, 1.0421754121780396, 1.1065311431884766, 1.1708868741989136, 1.2352426052093506, 1.2995983362197876, 1.3639540672302246, 1.4283097982406616, 1.4926655292510986, 1.5570212602615356, 1.6213769912719727, 1.6857327222824097, 1.7500884532928467, 1.8144441843032837, 1.8787999153137207, 1.9431556463241577, 2.0075113773345947, 2.071866989135742, 2.1362228393554688, 2.2005786895751953, 2.2649343013763428, 2.3292899131774902, 2.393645763397217, 2.4580016136169434, 2.522357225418091]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 3.0, 5.0, 9.0, 6.0, 11.0, 17.0, 16.0, 18.0, 10.0, 26.0, 17.0, 27.0, 24.0, 30.0, 28.0, 35.0, 32.0, 29.0, 45.0, 36.0, 48.0, 34.0, 38.0, 35.0, 30.0, 37.0, 36.0, 39.0, 23.0, 40.0, 33.0, 31.0, 17.0, 22.0, 14.0, 22.0, 20.0, 5.0, 6.0, 5.0, 10.0, 2.0, 5.0, 4.0, 5.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.2055637836456299, -1.1697578430175781, -1.1339519023895264, -1.0981459617614746, -1.0623400211334229, -1.026534080505371, -0.9907281398773193, -0.9549221992492676, -0.9191162586212158, -0.8833103179931641, -0.8475043773651123, -0.8116984367370605, -0.7758924961090088, -0.740086555480957, -0.7042806148529053, -0.6684746742248535, -0.6326687335968018, -0.59686279296875, -0.5610568523406982, -0.5252509117126465, -0.4894449710845947, -0.45363903045654297, -0.4178330898284912, -0.38202714920043945, -0.3462212085723877, -0.31041526794433594, -0.2746093273162842, -0.23880338668823242, -0.20299744606018066, -0.1671915054321289, -0.13138556480407715, -0.09557962417602539, -0.05977368354797363, -0.023967742919921875, 0.011838197708129883, 0.04764413833618164, 0.0834500789642334, 0.11925601959228516, 0.15506196022033691, 0.19086790084838867, 0.22667384147644043, 0.2624797821044922, 0.29828572273254395, 0.3340916633605957, 0.36989760398864746, 0.4057035446166992, 0.441509485244751, 0.47731542587280273, 0.5131213665008545, 0.5489273071289062, 0.584733247756958, 0.6205391883850098, 0.6563451290130615, 0.6921510696411133, 0.727957010269165, 0.7637629508972168, 0.7995688915252686, 0.8353748321533203, 0.8711807727813721, 0.9069867134094238, 0.9427926540374756, 0.9785985946655273, 1.014404535293579, 1.0502104759216309, 1.0860164165496826]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 3.0, 6.0, 9.0, 6.0, 12.0, 19.0, 20.0, 27.0, 24.0, 26.0, 36.0, 41.0, 42.0, 46.0, 48.0, 48.0, 56.0, 47.0, 62.0, 44.0, 44.0, 47.0, 43.0, 40.0, 27.0, 39.0, 22.0, 28.0, 17.0, 15.0, 13.0, 11.0, 10.0, 5.0, 3.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.421875, -10.1119384765625, -9.802001953125, -9.4920654296875, -9.18212890625, -8.8721923828125, -8.562255859375, -8.2523193359375, -7.9423828125, -7.6324462890625, -7.322509765625, -7.0125732421875, -6.70263671875, -6.3927001953125, -6.082763671875, -5.7728271484375, -5.462890625, -5.1529541015625, -4.843017578125, -4.5330810546875, -4.22314453125, -3.9132080078125, -3.603271484375, -3.2933349609375, -2.9833984375, -2.6734619140625, -2.363525390625, -2.0535888671875, -1.74365234375, -1.4337158203125, -1.123779296875, -0.8138427734375, -0.50390625, -0.1939697265625, 0.115966796875, 0.4259033203125, 0.73583984375, 1.0457763671875, 1.355712890625, 1.6656494140625, 1.9755859375, 2.2855224609375, 2.595458984375, 2.9053955078125, 3.21533203125, 3.5252685546875, 3.835205078125, 4.1451416015625, 4.455078125, 4.7650146484375, 5.074951171875, 5.3848876953125, 5.69482421875, 6.0047607421875, 6.314697265625, 6.6246337890625, 6.9345703125, 7.2445068359375, 7.554443359375, 7.8643798828125, 8.17431640625, 8.4842529296875, 8.794189453125, 9.1041259765625, 9.4140625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 16.0, 20.0, 28.0, 49.0, 53.0, 119.0, 159.0, 274.0, 344.0, 579.0, 934.0, 1347.0, 2104.0, 3500.0, 5631.0, 10759.0, 32324.0, 197758.0, 611376.0, 133764.0, 24471.0, 9265.0, 5036.0, 3065.0, 1996.0, 1244.0, 822.0, 532.0, 364.0, 214.0, 140.0, 90.0, 69.0, 34.0, 29.0, 20.0, 5.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.625, -15.093505859375, -14.56201171875, -14.030517578125, -13.4990234375, -12.967529296875, -12.43603515625, -11.904541015625, -11.373046875, -10.841552734375, -10.31005859375, -9.778564453125, -9.2470703125, -8.715576171875, -8.18408203125, -7.652587890625, -7.12109375, -6.589599609375, -6.05810546875, -5.526611328125, -4.9951171875, -4.463623046875, -3.93212890625, -3.400634765625, -2.869140625, -2.337646484375, -1.80615234375, -1.274658203125, -0.7431640625, -0.211669921875, 0.31982421875, 0.851318359375, 1.3828125, 1.914306640625, 2.44580078125, 2.977294921875, 3.5087890625, 4.040283203125, 4.57177734375, 5.103271484375, 5.634765625, 6.166259765625, 6.69775390625, 7.229248046875, 7.7607421875, 8.292236328125, 8.82373046875, 9.355224609375, 9.88671875, 10.418212890625, 10.94970703125, 11.481201171875, 12.0126953125, 12.544189453125, 13.07568359375, 13.607177734375, 14.138671875, 14.670166015625, 15.20166015625, 15.733154296875, 16.2646484375, 16.796142578125, 17.32763671875, 17.859130859375, 18.390625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 8.0, 8.0, 16.0, 16.0, 17.0, 13.0, 32.0, 26.0, 29.0, 48.0, 35.0, 50.0, 46.0, 108.0, 161.0, 1406.0, 371.0, 154.0, 97.0, 65.0, 45.0, 41.0, 39.0, 38.0, 36.0, 21.0, 20.0, 18.0, 18.0, 8.0, 9.0, 14.0, 3.0, 8.0, 9.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.296875, -25.447265625, -24.59765625, -23.748046875, -22.8984375, -22.048828125, -21.19921875, -20.349609375, -19.5, -18.650390625, -17.80078125, -16.951171875, -16.1015625, -15.251953125, -14.40234375, -13.552734375, -12.703125, -11.853515625, -11.00390625, -10.154296875, -9.3046875, -8.455078125, -7.60546875, -6.755859375, -5.90625, -5.056640625, -4.20703125, -3.357421875, -2.5078125, -1.658203125, -0.80859375, 0.041015625, 0.890625, 1.740234375, 2.58984375, 3.439453125, 4.2890625, 5.138671875, 5.98828125, 6.837890625, 7.6875, 8.537109375, 9.38671875, 10.236328125, 11.0859375, 11.935546875, 12.78515625, 13.634765625, 14.484375, 15.333984375, 16.18359375, 17.033203125, 17.8828125, 18.732421875, 19.58203125, 20.431640625, 21.28125, 22.130859375, 22.98046875, 23.830078125, 24.6796875, 25.529296875, 26.37890625, 27.228515625, 28.078125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 9.0, 10.0, 11.0, 12.0, 20.0, 22.0, 22.0, 31.0, 42.0, 59.0, 92.0, 142.0, 239.0, 402.0, 763.0, 2594.0, 13121.0, 956657.0, 2148713.0, 17683.0, 3074.0, 881.0, 400.0, 236.0, 157.0, 89.0, 56.0, 35.0, 30.0, 21.0, 29.0, 8.0, 8.0, 8.0, 10.0, 5.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.0, -53.2294921875, -51.458984375, -49.6884765625, -47.91796875, -46.1474609375, -44.376953125, -42.6064453125, -40.8359375, -39.0654296875, -37.294921875, -35.5244140625, -33.75390625, -31.9833984375, -30.212890625, -28.4423828125, -26.671875, -24.9013671875, -23.130859375, -21.3603515625, -19.58984375, -17.8193359375, -16.048828125, -14.2783203125, -12.5078125, -10.7373046875, -8.966796875, -7.1962890625, -5.42578125, -3.6552734375, -1.884765625, -0.1142578125, 1.65625, 3.4267578125, 5.197265625, 6.9677734375, 8.73828125, 10.5087890625, 12.279296875, 14.0498046875, 15.8203125, 17.5908203125, 19.361328125, 21.1318359375, 22.90234375, 24.6728515625, 26.443359375, 28.2138671875, 29.984375, 31.7548828125, 33.525390625, 35.2958984375, 37.06640625, 38.8369140625, 40.607421875, 42.3779296875, 44.1484375, 45.9189453125, 47.689453125, 49.4599609375, 51.23046875, 53.0009765625, 54.771484375, 56.5419921875, 58.3125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 10.0, 147.0, 523.0, 305.0, 30.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.7033576965332, -31.894519805908203, -25.085683822631836, -18.27684783935547, -11.468009948730469, -4.659172058105469, 2.1496620178222656, 8.958499908447266, 15.767337799072266, 22.576175689697266, 29.385011672973633, 36.19384765625, 43.002685546875, 49.8115234375, 56.620357513427734, 63.429195404052734, 70.238037109375, 77.046875, 83.855712890625, 90.66455078125, 97.473388671875, 104.2822265625, 111.09105682373047, 117.89989471435547, 124.70872497558594, 131.51756286621094, 138.32640075683594, 145.13523864746094, 151.94407653808594, 158.75291442871094, 165.56173706054688, 172.37057495117188, 179.17941284179688, 185.98825073242188, 192.79708862304688, 199.60592651367188, 206.41476440429688, 213.22360229492188, 220.03244018554688, 226.84127807617188, 233.65011596679688, 240.45895385742188, 247.26779174804688, 254.07662963867188, 260.8854675292969, 267.6943054199219, 274.5031433105469, 281.3119812011719, 288.12078857421875, 294.92962646484375, 301.73846435546875, 308.54730224609375, 315.35614013671875, 322.16497802734375, 328.97381591796875, 335.78265380859375, 342.59149169921875, 349.40032958984375, 356.20916748046875, 363.01800537109375, 369.82684326171875, 376.63568115234375, 383.44451904296875, 390.25335693359375, 397.06219482421875]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 6.0, 3.0, 7.0, 8.0, 7.0, 14.0, 11.0, 15.0, 22.0, 20.0, 25.0, 21.0, 32.0, 22.0, 39.0, 38.0, 38.0, 39.0, 38.0, 39.0, 56.0, 47.0, 36.0, 39.0, 37.0, 39.0, 48.0, 26.0, 29.0, 27.0, 32.0, 20.0, 16.0, 24.0, 11.0, 12.0, 13.0, 11.0, 11.0, 9.0, 8.0, 3.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.15870666503906, -58.18632888793945, -56.213951110839844, -54.24156951904297, -52.26919174194336, -50.29681396484375, -48.32443618774414, -46.35205841064453, -44.379676818847656, -42.40729904174805, -40.43492126464844, -38.46253967285156, -36.49016189575195, -34.517784118652344, -32.545406341552734, -30.573028564453125, -28.600650787353516, -26.628273010253906, -24.655893325805664, -22.683515548706055, -20.711135864257812, -18.738758087158203, -16.766380310058594, -14.794001579284668, -12.821622848510742, -10.849244117736816, -8.87686538696289, -6.904487609863281, -4.9321088790893555, -2.9597301483154297, -0.9873523712158203, 0.9850263595581055, 2.9574050903320312, 4.929783821105957, 6.902162075042725, 8.874540328979492, 10.846919059753418, 12.819297790527344, 14.791675567626953, 16.764053344726562, 18.736433029174805, 20.708810806274414, 22.681190490722656, 24.653568267822266, 26.625946044921875, 28.598325729370117, 30.570703506469727, 32.54308319091797, 34.51546096801758, 36.48783874511719, 38.4602165222168, 40.432594299316406, 42.40497589111328, 44.37735366821289, 46.3497314453125, 48.32210922241211, 50.29448699951172, 52.26686477661133, 54.23924255371094, 56.21162414550781, 58.18400192260742, 60.15637969970703, 62.12875747680664, 64.10113525390625, 66.07351684570312]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 3.0, 9.0, 4.0, 8.0, 18.0, 20.0, 17.0, 18.0, 27.0, 28.0, 34.0, 42.0, 30.0, 58.0, 39.0, 59.0, 48.0, 45.0, 51.0, 36.0, 48.0, 56.0, 43.0, 37.0, 37.0, 25.0, 35.0, 22.0, 20.0, 11.0, 15.0, 11.0, 16.0, 6.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.8984375, -9.587646484375, -9.27685546875, -8.966064453125, -8.6552734375, -8.344482421875, -8.03369140625, -7.722900390625, -7.412109375, -7.101318359375, -6.79052734375, -6.479736328125, -6.1689453125, -5.858154296875, -5.54736328125, -5.236572265625, -4.92578125, -4.614990234375, -4.30419921875, -3.993408203125, -3.6826171875, -3.371826171875, -3.06103515625, -2.750244140625, -2.439453125, -2.128662109375, -1.81787109375, -1.507080078125, -1.1962890625, -0.885498046875, -0.57470703125, -0.263916015625, 0.046875, 0.357666015625, 0.66845703125, 0.979248046875, 1.2900390625, 1.600830078125, 1.91162109375, 2.222412109375, 2.533203125, 2.843994140625, 3.15478515625, 3.465576171875, 3.7763671875, 4.087158203125, 4.39794921875, 4.708740234375, 5.01953125, 5.330322265625, 5.64111328125, 5.951904296875, 6.2626953125, 6.573486328125, 6.88427734375, 7.195068359375, 7.505859375, 7.816650390625, 8.12744140625, 8.438232421875, 8.7490234375, 9.059814453125, 9.37060546875, 9.681396484375, 9.9921875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 4.0, 7.0, 12.0, 10.0, 18.0, 21.0, 32.0, 47.0, 65.0, 93.0, 152.0, 232.0, 339.0, 511.0, 901.0, 1487.0, 2802.0, 5272.0, 11846.0, 33051.0, 151969.0, 1341735.0, 2265004.0, 297868.0, 49732.0, 16099.0, 6781.0, 3340.0, 1885.0, 1012.0, 657.0, 426.0, 290.0, 179.0, 116.0, 81.0, 54.0, 44.0, 29.0, 22.0, 16.0, 9.0, 10.0, 9.0, 3.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.765625, -19.087890625, -18.41015625, -17.732421875, -17.0546875, -16.376953125, -15.69921875, -15.021484375, -14.34375, -13.666015625, -12.98828125, -12.310546875, -11.6328125, -10.955078125, -10.27734375, -9.599609375, -8.921875, -8.244140625, -7.56640625, -6.888671875, -6.2109375, -5.533203125, -4.85546875, -4.177734375, -3.5, -2.822265625, -2.14453125, -1.466796875, -0.7890625, -0.111328125, 0.56640625, 1.244140625, 1.921875, 2.599609375, 3.27734375, 3.955078125, 4.6328125, 5.310546875, 5.98828125, 6.666015625, 7.34375, 8.021484375, 8.69921875, 9.376953125, 10.0546875, 10.732421875, 11.41015625, 12.087890625, 12.765625, 13.443359375, 14.12109375, 14.798828125, 15.4765625, 16.154296875, 16.83203125, 17.509765625, 18.1875, 18.865234375, 19.54296875, 20.220703125, 20.8984375, 21.576171875, 22.25390625, 22.931640625, 23.609375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 10.0, 1.0, 7.0, 12.0, 14.0, 16.0, 24.0, 34.0, 40.0, 41.0, 65.0, 78.0, 115.0, 144.0, 223.0, 335.0, 433.0, 484.0, 493.0, 403.0, 289.0, 215.0, 153.0, 116.0, 75.0, 60.0, 43.0, 27.0, 31.0, 27.0, 14.0, 6.0, 15.0, 3.0, 4.0, 2.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5625, -15.04052734375, -14.5185546875, -13.99658203125, -13.474609375, -12.95263671875, -12.4306640625, -11.90869140625, -11.38671875, -10.86474609375, -10.3427734375, -9.82080078125, -9.298828125, -8.77685546875, -8.2548828125, -7.73291015625, -7.2109375, -6.68896484375, -6.1669921875, -5.64501953125, -5.123046875, -4.60107421875, -4.0791015625, -3.55712890625, -3.03515625, -2.51318359375, -1.9912109375, -1.46923828125, -0.947265625, -0.42529296875, 0.0966796875, 0.61865234375, 1.140625, 1.66259765625, 2.1845703125, 2.70654296875, 3.228515625, 3.75048828125, 4.2724609375, 4.79443359375, 5.31640625, 5.83837890625, 6.3603515625, 6.88232421875, 7.404296875, 7.92626953125, 8.4482421875, 8.97021484375, 9.4921875, 10.01416015625, 10.5361328125, 11.05810546875, 11.580078125, 12.10205078125, 12.6240234375, 13.14599609375, 13.66796875, 14.18994140625, 14.7119140625, 15.23388671875, 15.755859375, 16.27783203125, 16.7998046875, 17.32177734375, 17.84375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 6.0, 8.0, 13.0, 16.0, 16.0, 23.0, 33.0, 59.0, 87.0, 117.0, 191.0, 454.0, 1567.0, 9147.0, 147143.0, 3860130.0, 163106.0, 9610.0, 1540.0, 422.0, 193.0, 132.0, 74.0, 45.0, 40.0, 25.0, 22.0, 20.0, 14.0, 12.0, 8.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.3125, -74.9345703125, -72.556640625, -70.1787109375, -67.80078125, -65.4228515625, -63.044921875, -60.6669921875, -58.2890625, -55.9111328125, -53.533203125, -51.1552734375, -48.77734375, -46.3994140625, -44.021484375, -41.6435546875, -39.265625, -36.8876953125, -34.509765625, -32.1318359375, -29.75390625, -27.3759765625, -24.998046875, -22.6201171875, -20.2421875, -17.8642578125, -15.486328125, -13.1083984375, -10.73046875, -8.3525390625, -5.974609375, -3.5966796875, -1.21875, 1.1591796875, 3.537109375, 5.9150390625, 8.29296875, 10.6708984375, 13.048828125, 15.4267578125, 17.8046875, 20.1826171875, 22.560546875, 24.9384765625, 27.31640625, 29.6943359375, 32.072265625, 34.4501953125, 36.828125, 39.2060546875, 41.583984375, 43.9619140625, 46.33984375, 48.7177734375, 51.095703125, 53.4736328125, 55.8515625, 58.2294921875, 60.607421875, 62.9853515625, 65.36328125, 67.7412109375, 70.119140625, 72.4970703125, 74.875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 16.0, 25.0, 39.0, 53.0, 88.0, 123.0, 160.0, 135.0, 128.0, 101.0, 67.0, 38.0, 13.0, 10.0, 11.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.6884994506836, -81.61717224121094, -77.54585266113281, -73.47452545166016, -69.40320587158203, -65.33187866210938, -61.260555267333984, -57.189231872558594, -53.1179084777832, -49.04658508300781, -44.97526168823242, -40.90393829345703, -36.832611083984375, -32.76129150390625, -28.689964294433594, -24.618640899658203, -20.547317504882812, -16.475994110107422, -12.404669761657715, -8.333345413208008, -4.262022018432617, -0.19069862365722656, 3.880626678466797, 7.9519500732421875, 12.023273468017578, 16.09459686279297, 20.16592025756836, 24.237245559692383, 28.308568954467773, 32.37989044189453, 36.45121765136719, 40.52254104614258, 44.59385681152344, 48.66518020629883, 52.73650360107422, 56.807830810546875, 60.879150390625, 64.95047760009766, 69.02180480957031, 73.09312438964844, 77.16444396972656, 81.23577117919922, 85.30709075927734, 89.37841796875, 93.44973754882812, 97.52106475830078, 101.59239196777344, 105.66371154785156, 109.73503875732422, 113.80636596679688, 117.877685546875, 121.94901275634766, 126.02033233642578, 130.09165954589844, 134.16297912597656, 138.23431396484375, 142.30563354492188, 146.376953125, 150.4482879638672, 154.5196075439453, 158.59092712402344, 162.66224670410156, 166.73358154296875, 170.80490112304688, 174.876220703125]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 3.0, 4.0, 2.0, 6.0, 4.0, 8.0, 9.0, 12.0, 15.0, 24.0, 13.0, 13.0, 30.0, 28.0, 30.0, 31.0, 34.0, 38.0, 34.0, 38.0, 40.0, 38.0, 55.0, 45.0, 38.0, 48.0, 35.0, 38.0, 28.0, 29.0, 35.0, 17.0, 24.0, 36.0, 21.0, 16.0, 17.0, 13.0, 14.0, 11.0, 7.0, 5.0, 4.0, 1.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.67112731933594, -46.95042419433594, -45.22972106933594, -43.50901794433594, -41.78831481933594, -40.06761169433594, -38.34690856933594, -36.62620544433594, -34.90550231933594, -33.18479919433594, -31.464096069335938, -29.743392944335938, -28.022689819335938, -26.301986694335938, -24.581283569335938, -22.860580444335938, -21.139875411987305, -19.419172286987305, -17.698469161987305, -15.977766036987305, -14.257062911987305, -12.536358833312988, -10.815655708312988, -9.094952583312988, -7.374249458312988, -5.653546333312988, -3.932842969894409, -2.21213960647583, -0.4914364814758301, 1.2292671203613281, 2.949970245361328, 4.670673370361328, 6.391376495361328, 8.112079620361328, 9.832782745361328, 11.553485870361328, 13.274188995361328, 14.994893074035645, 16.715595245361328, 18.436298370361328, 20.157001495361328, 21.877704620361328, 23.598407745361328, 25.319110870361328, 27.039813995361328, 28.760517120361328, 30.481220245361328, 32.20192337036133, 33.922630310058594, 35.643333435058594, 37.364036560058594, 39.084739685058594, 40.805442810058594, 42.526145935058594, 44.246849060058594, 45.967552185058594, 47.688255310058594, 49.408958435058594, 51.129661560058594, 52.850364685058594, 54.571067810058594, 56.291770935058594, 58.012474060058594, 59.733177185058594, 61.453880310058594]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 4.0, 1.0, 12.0, 9.0, 12.0, 21.0, 26.0, 26.0, 27.0, 34.0, 42.0, 50.0, 40.0, 57.0, 54.0, 60.0, 41.0, 55.0, 45.0, 47.0, 53.0, 38.0, 42.0, 36.0, 33.0, 28.0, 26.0, 19.0, 13.0, 13.0, 12.0, 8.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.5546875, -11.2218017578125, -10.888916015625, -10.5560302734375, -10.22314453125, -9.8902587890625, -9.557373046875, -9.2244873046875, -8.8916015625, -8.5587158203125, -8.225830078125, -7.8929443359375, -7.56005859375, -7.2271728515625, -6.894287109375, -6.5614013671875, -6.228515625, -5.8956298828125, -5.562744140625, -5.2298583984375, -4.89697265625, -4.5640869140625, -4.231201171875, -3.8983154296875, -3.5654296875, -3.2325439453125, -2.899658203125, -2.5667724609375, -2.23388671875, -1.9010009765625, -1.568115234375, -1.2352294921875, -0.90234375, -0.5694580078125, -0.236572265625, 0.0963134765625, 0.42919921875, 0.7620849609375, 1.094970703125, 1.4278564453125, 1.7607421875, 2.0936279296875, 2.426513671875, 2.7593994140625, 3.09228515625, 3.4251708984375, 3.758056640625, 4.0909423828125, 4.423828125, 4.7567138671875, 5.089599609375, 5.4224853515625, 5.75537109375, 6.0882568359375, 6.421142578125, 6.7540283203125, 7.0869140625, 7.4197998046875, 7.752685546875, 8.0855712890625, 8.41845703125, 8.7513427734375, 9.084228515625, 9.4171142578125, 9.75]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 8.0, 13.0, 32.0, 34.0, 41.0, 62.0, 105.0, 168.0, 223.0, 399.0, 669.0, 1123.0, 1915.0, 3423.0, 6355.0, 11448.0, 21975.0, 43198.0, 91308.0, 194536.0, 300244.0, 192097.0, 89655.0, 42533.0, 21388.0, 11416.0, 6041.0, 3279.0, 1964.0, 1141.0, 638.0, 391.0, 260.0, 165.0, 95.0, 60.0, 43.0, 27.0, 24.0, 16.0, 15.0, 7.0, 3.0, 8.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6640625, -1.6094818115234375, -1.554901123046875, -1.5003204345703125, -1.44573974609375, -1.3911590576171875, -1.336578369140625, -1.2819976806640625, -1.2274169921875, -1.1728363037109375, -1.118255615234375, -1.0636749267578125, -1.00909423828125, -0.9545135498046875, -0.899932861328125, -0.8453521728515625, -0.790771484375, -0.7361907958984375, -0.681610107421875, -0.6270294189453125, -0.57244873046875, -0.5178680419921875, -0.463287353515625, -0.4087066650390625, -0.3541259765625, -0.2995452880859375, -0.244964599609375, -0.1903839111328125, -0.13580322265625, -0.0812225341796875, -0.026641845703125, 0.0279388427734375, 0.08251953125, 0.1371002197265625, 0.191680908203125, 0.2462615966796875, 0.30084228515625, 0.3554229736328125, 0.410003662109375, 0.4645843505859375, 0.5191650390625, 0.5737457275390625, 0.628326416015625, 0.6829071044921875, 0.73748779296875, 0.7920684814453125, 0.846649169921875, 0.9012298583984375, 0.955810546875, 1.0103912353515625, 1.064971923828125, 1.1195526123046875, 1.17413330078125, 1.2287139892578125, 1.283294677734375, 1.3378753662109375, 1.3924560546875, 1.4470367431640625, 1.501617431640625, 1.5561981201171875, 1.61077880859375, 1.6653594970703125, 1.719940185546875, 1.7745208740234375, 1.8291015625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 2.0, 6.0, 9.0, 12.0, 11.0, 14.0, 13.0, 14.0, 14.0, 18.0, 15.0, 20.0, 32.0, 32.0, 29.0, 41.0, 43.0, 50.0, 54.0, 55.0, 1066.0, 36.0, 35.0, 32.0, 19.0, 45.0, 30.0, 42.0, 27.0, 35.0, 26.0, 20.0, 14.0, 10.0, 26.0, 15.0, 14.0, 13.0, 8.0, 6.0, 6.0, 4.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0, -4.8206787109375, -4.641357421875, -4.4620361328125, -4.28271484375, -4.1033935546875, -3.924072265625, -3.7447509765625, -3.5654296875, -3.3861083984375, -3.206787109375, -3.0274658203125, -2.84814453125, -2.6688232421875, -2.489501953125, -2.3101806640625, -2.130859375, -1.9515380859375, -1.772216796875, -1.5928955078125, -1.41357421875, -1.2342529296875, -1.054931640625, -0.8756103515625, -0.6962890625, -0.5169677734375, -0.337646484375, -0.1583251953125, 0.02099609375, 0.2003173828125, 0.379638671875, 0.5589599609375, 0.73828125, 0.9176025390625, 1.096923828125, 1.2762451171875, 1.45556640625, 1.6348876953125, 1.814208984375, 1.9935302734375, 2.1728515625, 2.3521728515625, 2.531494140625, 2.7108154296875, 2.89013671875, 3.0694580078125, 3.248779296875, 3.4281005859375, 3.607421875, 3.7867431640625, 3.966064453125, 4.1453857421875, 4.32470703125, 4.5040283203125, 4.683349609375, 4.8626708984375, 5.0419921875, 5.2213134765625, 5.400634765625, 5.5799560546875, 5.75927734375, 5.9385986328125, 6.117919921875, 6.2972412109375, 6.4765625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 3.0, 7.0, 9.0, 18.0, 9.0, 26.0, 26.0, 32.0, 55.0, 59.0, 110.0, 140.0, 230.0, 368.0, 641.0, 1192.0, 2149.0, 3876.0, 7435.0, 14397.0, 29482.0, 60961.0, 131054.0, 676123.0, 912576.0, 133519.0, 61493.0, 29955.0, 14695.0, 7575.0, 3918.0, 2075.0, 1152.0, 631.0, 387.0, 225.0, 167.0, 90.0, 74.0, 60.0, 29.0, 27.0, 17.0, 11.0, 14.0, 9.0, 5.0, 7.0, 8.0, 6.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.77392578125, -0.7497482299804688, -0.7255706787109375, -0.7013931274414062, -0.677215576171875, -0.6530380249023438, -0.6288604736328125, -0.6046829223632812, -0.58050537109375, -0.5563278198242188, -0.5321502685546875, -0.5079727172851562, -0.483795166015625, -0.45961761474609375, -0.4354400634765625, -0.41126251220703125, -0.3870849609375, -0.36290740966796875, -0.3387298583984375, -0.31455230712890625, -0.290374755859375, -0.26619720458984375, -0.2420196533203125, -0.21784210205078125, -0.19366455078125, -0.16948699951171875, -0.1453094482421875, -0.12113189697265625, -0.096954345703125, -0.07277679443359375, -0.0485992431640625, -0.02442169189453125, -0.000244140625, 0.02393341064453125, 0.0481109619140625, 0.07228851318359375, 0.096466064453125, 0.12064361572265625, 0.1448211669921875, 0.16899871826171875, 0.19317626953125, 0.21735382080078125, 0.2415313720703125, 0.26570892333984375, 0.289886474609375, 0.31406402587890625, 0.3382415771484375, 0.36241912841796875, 0.3865966796875, 0.41077423095703125, 0.4349517822265625, 0.45912933349609375, 0.483306884765625, 0.5074844360351562, 0.5316619873046875, 0.5558395385742188, 0.58001708984375, 0.6041946411132812, 0.6283721923828125, 0.6525497436523438, 0.676727294921875, 0.7009048461914062, 0.7250823974609375, 0.7492599487304688, 0.7734375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 5.0, 5.0, 1.0, 3.0, 1.0, 5.0, 7.0, 11.0, 14.0, 14.0, 18.0, 11.0, 12.0, 16.0, 15.0, 23.0, 47.0, 76.0, 142.0, 214.0, 117.0, 52.0, 33.0, 32.0, 12.0, 16.0, 15.0, 16.0, 10.0, 3.0, 14.0, 8.0, 7.0, 7.0, 6.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 6.0, 0.0, 0.0, 1.0], "bins": [-0.23095703125, -0.22475433349609375, -0.2185516357421875, -0.21234893798828125, -0.206146240234375, -0.19994354248046875, -0.1937408447265625, -0.18753814697265625, -0.18133544921875, -0.17513275146484375, -0.1689300537109375, -0.16272735595703125, -0.156524658203125, -0.15032196044921875, -0.1441192626953125, -0.13791656494140625, -0.1317138671875, -0.12551116943359375, -0.1193084716796875, -0.11310577392578125, -0.106903076171875, -0.10070037841796875, -0.0944976806640625, -0.08829498291015625, -0.08209228515625, -0.07588958740234375, -0.0696868896484375, -0.06348419189453125, -0.057281494140625, -0.05107879638671875, -0.0448760986328125, -0.03867340087890625, -0.032470703125, -0.02626800537109375, -0.0200653076171875, -0.01386260986328125, -0.007659912109375, -0.00145721435546875, 0.0047454833984375, 0.01094818115234375, 0.01715087890625, 0.02335357666015625, 0.0295562744140625, 0.03575897216796875, 0.041961669921875, 0.04816436767578125, 0.0543670654296875, 0.06056976318359375, 0.0667724609375, 0.07297515869140625, 0.0791778564453125, 0.08538055419921875, 0.091583251953125, 0.09778594970703125, 0.1039886474609375, 0.11019134521484375, 0.11639404296875, 0.12259674072265625, 0.1287994384765625, 0.13500213623046875, 0.141204833984375, 0.14740753173828125, 0.1536102294921875, 0.15981292724609375, 0.166015625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 2.0, 5.0, 5.0, 7.0, 13.0, 8.0, 7.0, 8.0, 21.0, 22.0, 29.0, 30.0, 78.0, 117.0, 401.0, 4078.0, 1003663.0, 38594.0, 933.0, 227.0, 98.0, 45.0, 22.0, 19.0, 19.0, 18.0, 12.0, 19.0, 11.0, 9.0, 3.0, 4.0, 2.0, 1.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.619140625, -3.483917236328125, -3.34869384765625, -3.213470458984375, -3.0782470703125, -2.943023681640625, -2.80780029296875, -2.672576904296875, -2.537353515625, -2.402130126953125, -2.26690673828125, -2.131683349609375, -1.9964599609375, -1.861236572265625, -1.72601318359375, -1.590789794921875, -1.45556640625, -1.320343017578125, -1.18511962890625, -1.049896240234375, -0.9146728515625, -0.779449462890625, -0.64422607421875, -0.509002685546875, -0.373779296875, -0.238555908203125, -0.10333251953125, 0.031890869140625, 0.1671142578125, 0.302337646484375, 0.43756103515625, 0.572784423828125, 0.7080078125, 0.843231201171875, 0.97845458984375, 1.113677978515625, 1.2489013671875, 1.384124755859375, 1.51934814453125, 1.654571533203125, 1.789794921875, 1.925018310546875, 2.06024169921875, 2.195465087890625, 2.3306884765625, 2.465911865234375, 2.60113525390625, 2.736358642578125, 2.87158203125, 3.006805419921875, 3.14202880859375, 3.277252197265625, 3.4124755859375, 3.547698974609375, 3.68292236328125, 3.818145751953125, 3.953369140625, 4.088592529296875, 4.22381591796875, 4.359039306640625, 4.4942626953125, 4.629486083984375, 4.76470947265625, 4.899932861328125, 5.03515625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 7.0, 9.0, 10.0, 14.0, 26.0, 61.0, 90.0, 214.0, 323.0, 117.0, 56.0, 44.0, 16.0, 4.0, 6.0, 3.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38207873702049255, -0.3506269156932831, -0.3191750943660736, -0.28772324323654175, -0.2562714219093323, -0.224819615483284, -0.19336777925491333, -0.16191595792770386, -0.13046413660049438, -0.09901231527328491, -0.06756048649549484, -0.03610865771770477, -0.0046568363904953, 0.026794984936714172, 0.05824682116508484, 0.08969864249229431, 0.12115046381950378, 0.15260228514671326, 0.18405410647392273, 0.2155059427022934, 0.24695776402950287, 0.27840960025787354, 0.309861421585083, 0.3413132429122925, 0.37276506423950195, 0.4042168855667114, 0.4356687068939209, 0.46712052822113037, 0.49857234954833984, 0.5300241708755493, 0.5614759922027588, 0.5929278135299683, 0.6243796348571777, 0.6558314561843872, 0.6872832775115967, 0.7187350988388062, 0.7501869201660156, 0.7816387414932251, 0.8130905628204346, 0.844542384147644, 0.8759942054748535, 0.907446026802063, 0.9388978481292725, 0.9703496694564819, 1.0018014907836914, 1.0332533121109009, 1.0647051334381104, 1.0961569547653198, 1.1276087760925293, 1.1590605974197388, 1.1905124187469482, 1.2219642400741577, 1.2534160614013672, 1.2848678827285767, 1.3163197040557861, 1.3477715253829956, 1.3792234659194946, 1.410675287246704, 1.4421271085739136, 1.473578929901123, 1.5050307512283325, 1.536482572555542, 1.5679343938827515, 1.599386215209961, 1.6308380365371704]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 1.0, 7.0, 1.0, 7.0, 6.0, 8.0, 10.0, 12.0, 11.0, 12.0, 20.0, 21.0, 27.0, 29.0, 32.0, 36.0, 34.0, 33.0, 40.0, 32.0, 46.0, 51.0, 34.0, 34.0, 34.0, 32.0, 30.0, 33.0, 34.0, 41.0, 44.0, 40.0, 31.0, 14.0, 19.0, 20.0, 10.0, 11.0, 12.0, 12.0, 13.0, 6.0, 5.0, 4.0, 7.0, 2.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5377938747406006, -0.5203893780708313, -0.5029848217964172, -0.48558032512664795, -0.4681757986545563, -0.4507712721824646, -0.4333667755126953, -0.41596224904060364, -0.39855772256851196, -0.3811531960964203, -0.3637486696243286, -0.3463441729545593, -0.32893964648246765, -0.311535120010376, -0.2941306233406067, -0.276726096868515, -0.25932157039642334, -0.24191704392433167, -0.22451253235340118, -0.2071080207824707, -0.18970349431037903, -0.17229896783828735, -0.15489445626735687, -0.1374899446964264, -0.12008541822433472, -0.10268089920282364, -0.08527638018131256, -0.06787186115980148, -0.050467342138290405, -0.03306282311677933, -0.01565830409526825, 0.0017462149262428284, 0.019150733947753906, 0.036555252969264984, 0.05395977199077606, 0.07136429101228714, 0.08876881003379822, 0.1061733290553093, 0.12357784807682037, 0.14098235964775085, 0.15838688611984253, 0.1757914125919342, 0.19319592416286469, 0.21060043573379517, 0.22800496220588684, 0.24540948867797852, 0.2628139853477478, 0.2802185118198395, 0.29762303829193115, 0.3150275647640228, 0.3324320912361145, 0.3498365879058838, 0.36724111437797546, 0.38464564085006714, 0.4020501375198364, 0.4194546639919281, 0.4368591904640198, 0.45426371693611145, 0.4716682434082031, 0.4890727400779724, 0.5064772367477417, 0.5238817930221558, 0.541286289691925, 0.5586908459663391, 0.5760953426361084]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 4.0, 2.0, 12.0, 9.0, 11.0, 21.0, 24.0, 27.0, 28.0, 35.0, 42.0, 46.0, 43.0, 57.0, 51.0, 62.0, 39.0, 58.0, 43.0, 48.0, 51.0, 39.0, 45.0, 35.0, 32.0, 28.0, 26.0, 21.0, 12.0, 13.0, 10.0, 10.0, 5.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.546875, -11.21435546875, -10.8818359375, -10.54931640625, -10.216796875, -9.88427734375, -9.5517578125, -9.21923828125, -8.88671875, -8.55419921875, -8.2216796875, -7.88916015625, -7.556640625, -7.22412109375, -6.8916015625, -6.55908203125, -6.2265625, -5.89404296875, -5.5615234375, -5.22900390625, -4.896484375, -4.56396484375, -4.2314453125, -3.89892578125, -3.56640625, -3.23388671875, -2.9013671875, -2.56884765625, -2.236328125, -1.90380859375, -1.5712890625, -1.23876953125, -0.90625, -0.57373046875, -0.2412109375, 0.09130859375, 0.423828125, 0.75634765625, 1.0888671875, 1.42138671875, 1.75390625, 2.08642578125, 2.4189453125, 2.75146484375, 3.083984375, 3.41650390625, 3.7490234375, 4.08154296875, 4.4140625, 4.74658203125, 5.0791015625, 5.41162109375, 5.744140625, 6.07666015625, 6.4091796875, 6.74169921875, 7.07421875, 7.40673828125, 7.7392578125, 8.07177734375, 8.404296875, 8.73681640625, 9.0693359375, 9.40185546875, 9.734375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 4.0, 13.0, 12.0, 18.0, 39.0, 46.0, 96.0, 119.0, 229.0, 370.0, 563.0, 1080.0, 1833.0, 3613.0, 7360.0, 15586.0, 34396.0, 85416.0, 245198.0, 398085.0, 151816.0, 56172.0, 23726.0, 11118.0, 5434.0, 2700.0, 1473.0, 798.0, 433.0, 295.0, 187.0, 106.0, 72.0, 44.0, 36.0, 17.0, 13.0, 9.0, 13.0, 8.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.38671875, -7.10565185546875, -6.8245849609375, -6.54351806640625, -6.262451171875, -5.98138427734375, -5.7003173828125, -5.41925048828125, -5.13818359375, -4.85711669921875, -4.5760498046875, -4.29498291015625, -4.013916015625, -3.73284912109375, -3.4517822265625, -3.17071533203125, -2.8896484375, -2.60858154296875, -2.3275146484375, -2.04644775390625, -1.765380859375, -1.48431396484375, -1.2032470703125, -0.92218017578125, -0.64111328125, -0.36004638671875, -0.0789794921875, 0.20208740234375, 0.483154296875, 0.76422119140625, 1.0452880859375, 1.32635498046875, 1.607421875, 1.88848876953125, 2.1695556640625, 2.45062255859375, 2.731689453125, 3.01275634765625, 3.2938232421875, 3.57489013671875, 3.85595703125, 4.13702392578125, 4.4180908203125, 4.69915771484375, 4.980224609375, 5.26129150390625, 5.5423583984375, 5.82342529296875, 6.1044921875, 6.38555908203125, 6.6666259765625, 6.94769287109375, 7.228759765625, 7.50982666015625, 7.7908935546875, 8.07196044921875, 8.35302734375, 8.63409423828125, 8.9151611328125, 9.19622802734375, 9.477294921875, 9.75836181640625, 10.0394287109375, 10.32049560546875, 10.6015625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 3.0, 4.0, 8.0, 7.0, 7.0, 17.0, 18.0, 20.0, 19.0, 32.0, 29.0, 36.0, 29.0, 42.0, 37.0, 48.0, 61.0, 118.0, 289.0, 1513.0, 213.0, 80.0, 67.0, 46.0, 43.0, 34.0, 34.0, 23.0, 36.0, 26.0, 19.0, 16.0, 18.0, 13.0, 14.0, 9.0, 4.0, 6.0, 1.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-30.65625, -29.787109375, -28.91796875, -28.048828125, -27.1796875, -26.310546875, -25.44140625, -24.572265625, -23.703125, -22.833984375, -21.96484375, -21.095703125, -20.2265625, -19.357421875, -18.48828125, -17.619140625, -16.75, -15.880859375, -15.01171875, -14.142578125, -13.2734375, -12.404296875, -11.53515625, -10.666015625, -9.796875, -8.927734375, -8.05859375, -7.189453125, -6.3203125, -5.451171875, -4.58203125, -3.712890625, -2.84375, -1.974609375, -1.10546875, -0.236328125, 0.6328125, 1.501953125, 2.37109375, 3.240234375, 4.109375, 4.978515625, 5.84765625, 6.716796875, 7.5859375, 8.455078125, 9.32421875, 10.193359375, 11.0625, 11.931640625, 12.80078125, 13.669921875, 14.5390625, 15.408203125, 16.27734375, 17.146484375, 18.015625, 18.884765625, 19.75390625, 20.623046875, 21.4921875, 22.361328125, 23.23046875, 24.099609375, 24.96875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 5.0, 9.0, 11.0, 16.0, 24.0, 26.0, 26.0, 35.0, 48.0, 70.0, 82.0, 117.0, 160.0, 245.0, 426.0, 1491.0, 26562.0, 3017932.0, 94564.0, 2381.0, 484.0, 267.0, 190.0, 136.0, 88.0, 80.0, 56.0, 40.0, 26.0, 30.0, 21.0, 14.0, 8.0, 9.0, 5.0, 2.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.53125, -53.59130859375, -51.6513671875, -49.71142578125, -47.771484375, -45.83154296875, -43.8916015625, -41.95166015625, -40.01171875, -38.07177734375, -36.1318359375, -34.19189453125, -32.251953125, -30.31201171875, -28.3720703125, -26.43212890625, -24.4921875, -22.55224609375, -20.6123046875, -18.67236328125, -16.732421875, -14.79248046875, -12.8525390625, -10.91259765625, -8.97265625, -7.03271484375, -5.0927734375, -3.15283203125, -1.212890625, 0.72705078125, 2.6669921875, 4.60693359375, 6.546875, 8.48681640625, 10.4267578125, 12.36669921875, 14.306640625, 16.24658203125, 18.1865234375, 20.12646484375, 22.06640625, 24.00634765625, 25.9462890625, 27.88623046875, 29.826171875, 31.76611328125, 33.7060546875, 35.64599609375, 37.5859375, 39.52587890625, 41.4658203125, 43.40576171875, 45.345703125, 47.28564453125, 49.2255859375, 51.16552734375, 53.10546875, 55.04541015625, 56.9853515625, 58.92529296875, 60.865234375, 62.80517578125, 64.7451171875, 66.68505859375, 68.625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 6.0, 25.0, 95.0, 261.0, 265.0, 204.0, 105.0, 39.0, 9.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-120.59603881835938, -117.69630432128906, -114.79656982421875, -111.89683532714844, -108.99710845947266, -106.09737396240234, -103.19763946533203, -100.29790496826172, -97.39817810058594, -94.49844360351562, -91.59870910644531, -88.698974609375, -85.79924774169922, -82.8995132446289, -79.9997787475586, -77.10004425048828, -74.20030975341797, -71.30057525634766, -68.40084075927734, -65.50111389160156, -62.60137939453125, -59.70164489746094, -56.801910400390625, -53.90217590332031, -51.002445220947266, -48.10271072387695, -45.202980041503906, -42.303245544433594, -39.40351104736328, -36.503780364990234, -33.60404586791992, -30.704313278198242, -27.80457305908203, -24.90484046936035, -22.005107879638672, -19.10537338256836, -16.20564079284668, -13.305908203125, -10.406173706054688, -7.506441116333008, -4.606708526611328, -1.7069754600524902, 1.1927576065063477, 4.092491149902344, 6.992223739624023, 9.891956329345703, 12.791690826416016, 15.691423416137695, 18.591156005859375, 21.490888595581055, 24.390621185302734, 27.290355682373047, 30.190088272094727, 33.089820861816406, 35.98955535888672, 38.88928985595703, 41.78902053833008, 44.68875503540039, 47.58848571777344, 50.48822021484375, 53.38795471191406, 56.28768539428711, 59.18741989135742, 62.08715057373047, 64.98688507080078]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 6.0, 7.0, 7.0, 8.0, 11.0, 19.0, 19.0, 25.0, 22.0, 23.0, 27.0, 26.0, 25.0, 42.0, 42.0, 41.0, 39.0, 41.0, 41.0, 30.0, 37.0, 44.0, 42.0, 45.0, 37.0, 47.0, 34.0, 35.0, 20.0, 26.0, 22.0, 20.0, 21.0, 13.0, 12.0, 14.0, 5.0, 7.0, 2.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.1614761352539, -67.1134262084961, -65.06536865234375, -63.01731872558594, -60.969268798828125, -58.92121505737305, -56.87316131591797, -54.825111389160156, -52.77705764770508, -50.72900390625, -48.68095397949219, -46.63290023803711, -44.58484649658203, -42.53679656982422, -40.48874282836914, -38.44068908691406, -36.39263916015625, -34.34458541870117, -32.29653549194336, -30.24848175048828, -28.200429916381836, -26.15237808227539, -24.104324340820312, -22.056272506713867, -20.008220672607422, -17.960168838500977, -15.912116050720215, -13.864063262939453, -11.816011428833008, -9.767959594726562, -7.719906806945801, -5.671854019165039, -3.623798370361328, -1.5757460594177246, 0.4723062515258789, 2.5203585624694824, 4.568410873413086, 6.616462707519531, 8.664515495300293, 10.712568283081055, 12.7606201171875, 14.808671951293945, 16.85672378540039, 18.90477752685547, 20.952829360961914, 23.00088119506836, 25.048934936523438, 27.096986770629883, 29.145038604736328, 31.193090438842773, 33.24114227294922, 35.2891960144043, 37.337249755859375, 39.38529968261719, 41.433353424072266, 43.481407165527344, 45.529457092285156, 47.577510833740234, 49.62556076049805, 51.673614501953125, 53.72166442871094, 55.769718170166016, 57.817771911621094, 59.865821838378906, 61.913875579833984]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 5.0, 7.0, 8.0, 4.0, 24.0, 25.0, 27.0, 25.0, 26.0, 45.0, 45.0, 40.0, 46.0, 40.0, 61.0, 51.0, 62.0, 48.0, 49.0, 36.0, 49.0, 34.0, 52.0, 24.0, 28.0, 23.0, 20.0, 22.0, 18.0, 13.0, 11.0, 8.0, 6.0, 6.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.671875, -11.3409423828125, -11.010009765625, -10.6790771484375, -10.34814453125, -10.0172119140625, -9.686279296875, -9.3553466796875, -9.0244140625, -8.6934814453125, -8.362548828125, -8.0316162109375, -7.70068359375, -7.3697509765625, -7.038818359375, -6.7078857421875, -6.376953125, -6.0460205078125, -5.715087890625, -5.3841552734375, -5.05322265625, -4.7222900390625, -4.391357421875, -4.0604248046875, -3.7294921875, -3.3985595703125, -3.067626953125, -2.7366943359375, -2.40576171875, -2.0748291015625, -1.743896484375, -1.4129638671875, -1.08203125, -0.7510986328125, -0.420166015625, -0.0892333984375, 0.24169921875, 0.5726318359375, 0.903564453125, 1.2344970703125, 1.5654296875, 1.8963623046875, 2.227294921875, 2.5582275390625, 2.88916015625, 3.2200927734375, 3.551025390625, 3.8819580078125, 4.212890625, 4.5438232421875, 4.874755859375, 5.2056884765625, 5.53662109375, 5.8675537109375, 6.198486328125, 6.5294189453125, 6.8603515625, 7.1912841796875, 7.522216796875, 7.8531494140625, 8.18408203125, 8.5150146484375, 8.845947265625, 9.1768798828125, 9.5078125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 6.0, 9.0, 7.0, 4.0, 15.0, 22.0, 24.0, 40.0, 57.0, 64.0, 114.0, 139.0, 200.0, 289.0, 469.0, 776.0, 1359.0, 2605.0, 5552.0, 13926.0, 48245.0, 392573.0, 2905117.0, 721042.0, 69981.0, 17850.0, 6872.0, 3041.0, 1455.0, 886.0, 493.0, 328.0, 223.0, 144.0, 92.0, 83.0, 53.0, 34.0, 34.0, 18.0, 12.0, 9.0, 7.0, 6.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-28.5, -27.652099609375, -26.80419921875, -25.956298828125, -25.1083984375, -24.260498046875, -23.41259765625, -22.564697265625, -21.716796875, -20.868896484375, -20.02099609375, -19.173095703125, -18.3251953125, -17.477294921875, -16.62939453125, -15.781494140625, -14.93359375, -14.085693359375, -13.23779296875, -12.389892578125, -11.5419921875, -10.694091796875, -9.84619140625, -8.998291015625, -8.150390625, -7.302490234375, -6.45458984375, -5.606689453125, -4.7587890625, -3.910888671875, -3.06298828125, -2.215087890625, -1.3671875, -0.519287109375, 0.32861328125, 1.176513671875, 2.0244140625, 2.872314453125, 3.72021484375, 4.568115234375, 5.416015625, 6.263916015625, 7.11181640625, 7.959716796875, 8.8076171875, 9.655517578125, 10.50341796875, 11.351318359375, 12.19921875, 13.047119140625, 13.89501953125, 14.742919921875, 15.5908203125, 16.438720703125, 17.28662109375, 18.134521484375, 18.982421875, 19.830322265625, 20.67822265625, 21.526123046875, 22.3740234375, 23.221923828125, 24.06982421875, 24.917724609375, 25.765625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 10.0, 5.0, 3.0, 13.0, 9.0, 10.0, 15.0, 27.0, 22.0, 33.0, 40.0, 58.0, 98.0, 101.0, 159.0, 221.0, 329.0, 388.0, 507.0, 505.0, 403.0, 317.0, 217.0, 135.0, 122.0, 84.0, 68.0, 44.0, 43.0, 21.0, 19.0, 14.0, 10.0, 11.0, 5.0, 3.0, 1.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.8125, -18.2763671875, -17.740234375, -17.2041015625, -16.66796875, -16.1318359375, -15.595703125, -15.0595703125, -14.5234375, -13.9873046875, -13.451171875, -12.9150390625, -12.37890625, -11.8427734375, -11.306640625, -10.7705078125, -10.234375, -9.6982421875, -9.162109375, -8.6259765625, -8.08984375, -7.5537109375, -7.017578125, -6.4814453125, -5.9453125, -5.4091796875, -4.873046875, -4.3369140625, -3.80078125, -3.2646484375, -2.728515625, -2.1923828125, -1.65625, -1.1201171875, -0.583984375, -0.0478515625, 0.48828125, 1.0244140625, 1.560546875, 2.0966796875, 2.6328125, 3.1689453125, 3.705078125, 4.2412109375, 4.77734375, 5.3134765625, 5.849609375, 6.3857421875, 6.921875, 7.4580078125, 7.994140625, 8.5302734375, 9.06640625, 9.6025390625, 10.138671875, 10.6748046875, 11.2109375, 11.7470703125, 12.283203125, 12.8193359375, 13.35546875, 13.8916015625, 14.427734375, 14.9638671875, 15.5]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 11.0, 18.0, 16.0, 21.0, 22.0, 33.0, 68.0, 91.0, 142.0, 187.0, 403.0, 1015.0, 3514.0, 21385.0, 513497.0, 3556511.0, 85695.0, 8276.0, 1878.0, 657.0, 305.0, 154.0, 109.0, 74.0, 44.0, 28.0, 26.0, 20.0, 23.0, 14.0, 6.0, 8.0, 5.0, 10.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.0, -70.86962890625, -68.7392578125, -66.60888671875, -64.478515625, -62.34814453125, -60.2177734375, -58.08740234375, -55.95703125, -53.82666015625, -51.6962890625, -49.56591796875, -47.435546875, -45.30517578125, -43.1748046875, -41.04443359375, -38.9140625, -36.78369140625, -34.6533203125, -32.52294921875, -30.392578125, -28.26220703125, -26.1318359375, -24.00146484375, -21.87109375, -19.74072265625, -17.6103515625, -15.47998046875, -13.349609375, -11.21923828125, -9.0888671875, -6.95849609375, -4.828125, -2.69775390625, -0.5673828125, 1.56298828125, 3.693359375, 5.82373046875, 7.9541015625, 10.08447265625, 12.21484375, 14.34521484375, 16.4755859375, 18.60595703125, 20.736328125, 22.86669921875, 24.9970703125, 27.12744140625, 29.2578125, 31.38818359375, 33.5185546875, 35.64892578125, 37.779296875, 39.90966796875, 42.0400390625, 44.17041015625, 46.30078125, 48.43115234375, 50.5615234375, 52.69189453125, 54.822265625, 56.95263671875, 59.0830078125, 61.21337890625, 63.34375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 22.0, 73.0, 208.0, 340.0, 246.0, 89.0, 24.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.43296813964844, -130.91455078125, -121.39613342285156, -111.87772369384766, -102.35930633544922, -92.84088897705078, -83.32247924804688, -73.80406188964844, -64.28564453125, -54.76722717285156, -45.24881362915039, -35.73040008544922, -26.21198272705078, -16.693565368652344, -7.175151824951172, 2.34326171875, 11.861679077148438, 21.380094528198242, 30.898509979248047, 40.41692352294922, 49.935340881347656, 59.453758239746094, 68.97216796875, 78.49058532714844, 88.00900268554688, 97.52742004394531, 107.04583740234375, 116.56424713134766, 126.0826644897461, 135.60107421875, 145.11949157714844, 154.63790893554688, 164.15634155273438, 173.6747589111328, 183.19317626953125, 192.7115936279297, 202.23001098632812, 211.7484130859375, 221.26683044433594, 230.78524780273438, 240.3036651611328, 249.82208251953125, 259.3404846191406, 268.8589172363281, 278.3773193359375, 287.895751953125, 297.4141540527344, 306.93255615234375, 316.45098876953125, 325.9693908691406, 335.4878234863281, 345.0062255859375, 354.524658203125, 364.0430603027344, 373.5614929199219, 383.07989501953125, 392.59832763671875, 402.1167297363281, 411.6351623535156, 421.153564453125, 430.6719970703125, 440.1903991699219, 449.7088317871094, 459.22723388671875, 468.7456359863281]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 6.0, 5.0, 9.0, 7.0, 10.0, 9.0, 14.0, 18.0, 14.0, 14.0, 29.0, 28.0, 21.0, 28.0, 32.0, 24.0, 36.0, 36.0, 37.0, 48.0, 44.0, 25.0, 34.0, 39.0, 38.0, 36.0, 41.0, 25.0, 34.0, 31.0, 34.0, 27.0, 22.0, 22.0, 26.0, 19.0, 15.0, 12.0, 9.0, 9.0, 7.0, 5.0, 7.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-56.384605407714844, -54.535579681396484, -52.686553955078125, -50.837528228759766, -48.988502502441406, -47.13947677612305, -45.29045104980469, -43.44142532348633, -41.59239959716797, -39.74337387084961, -37.89434814453125, -36.04532241821289, -34.19629669189453, -32.34727096557617, -30.498245239257812, -28.649219512939453, -26.800193786621094, -24.951168060302734, -23.102142333984375, -21.253116607666016, -19.404090881347656, -17.555065155029297, -15.706039428710938, -13.857013702392578, -12.007987976074219, -10.15896224975586, -8.3099365234375, -6.460910797119141, -4.611885070800781, -2.762859344482422, -0.9138336181640625, 0.9351921081542969, 2.7842178344726562, 4.633243560791016, 6.482269287109375, 8.331295013427734, 10.180320739746094, 12.029346466064453, 13.878372192382812, 15.727397918701172, 17.57642364501953, 19.42544937133789, 21.27447509765625, 23.12350082397461, 24.97252655029297, 26.821552276611328, 28.670578002929688, 30.519603729248047, 32.368629455566406, 34.217655181884766, 36.066680908203125, 37.915706634521484, 39.764732360839844, 41.6137580871582, 43.46278381347656, 45.31180953979492, 47.16083526611328, 49.00986099243164, 50.85888671875, 52.70791244506836, 54.55693817138672, 56.40596389770508, 58.25498962402344, 60.1040153503418, 61.953041076660156]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 7.0, 4.0, 13.0, 11.0, 13.0, 13.0, 29.0, 15.0, 28.0, 36.0, 34.0, 56.0, 49.0, 40.0, 52.0, 64.0, 56.0, 50.0, 49.0, 49.0, 42.0, 37.0, 44.0, 39.0, 28.0, 24.0, 21.0, 22.0, 26.0, 7.0, 11.0, 6.0, 9.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.640625, -11.2967529296875, -10.952880859375, -10.6090087890625, -10.26513671875, -9.9212646484375, -9.577392578125, -9.2335205078125, -8.8896484375, -8.5457763671875, -8.201904296875, -7.8580322265625, -7.51416015625, -7.1702880859375, -6.826416015625, -6.4825439453125, -6.138671875, -5.7947998046875, -5.450927734375, -5.1070556640625, -4.76318359375, -4.4193115234375, -4.075439453125, -3.7315673828125, -3.3876953125, -3.0438232421875, -2.699951171875, -2.3560791015625, -2.01220703125, -1.6683349609375, -1.324462890625, -0.9805908203125, -0.63671875, -0.2928466796875, 0.051025390625, 0.3948974609375, 0.73876953125, 1.0826416015625, 1.426513671875, 1.7703857421875, 2.1142578125, 2.4581298828125, 2.802001953125, 3.1458740234375, 3.48974609375, 3.8336181640625, 4.177490234375, 4.5213623046875, 4.865234375, 5.2091064453125, 5.552978515625, 5.8968505859375, 6.24072265625, 6.5845947265625, 6.928466796875, 7.2723388671875, 7.6162109375, 7.9600830078125, 8.303955078125, 8.6478271484375, 8.99169921875, 9.3355712890625, 9.679443359375, 10.0233154296875, 10.3671875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 6.0, 7.0, 9.0, 23.0, 30.0, 37.0, 80.0, 91.0, 169.0, 297.0, 476.0, 760.0, 1355.0, 2310.0, 4010.0, 7454.0, 14351.0, 28567.0, 59704.0, 134738.0, 278797.0, 271292.0, 128843.0, 57502.0, 27284.0, 13742.0, 7324.0, 3951.0, 2213.0, 1238.0, 757.0, 438.0, 228.0, 177.0, 100.0, 60.0, 47.0, 34.0, 19.0, 12.0, 9.0, 3.0, 8.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.111328125, -2.0491790771484375, -1.987030029296875, -1.9248809814453125, -1.86273193359375, -1.8005828857421875, -1.738433837890625, -1.6762847900390625, -1.6141357421875, -1.5519866943359375, -1.489837646484375, -1.4276885986328125, -1.36553955078125, -1.3033905029296875, -1.241241455078125, -1.1790924072265625, -1.116943359375, -1.0547943115234375, -0.992645263671875, -0.9304962158203125, -0.86834716796875, -0.8061981201171875, -0.744049072265625, -0.6819000244140625, -0.6197509765625, -0.5576019287109375, -0.495452880859375, -0.4333038330078125, -0.37115478515625, -0.3090057373046875, -0.246856689453125, -0.1847076416015625, -0.12255859375, -0.0604095458984375, 0.001739501953125, 0.0638885498046875, 0.12603759765625, 0.1881866455078125, 0.250335693359375, 0.3124847412109375, 0.3746337890625, 0.4367828369140625, 0.498931884765625, 0.5610809326171875, 0.62322998046875, 0.6853790283203125, 0.747528076171875, 0.8096771240234375, 0.871826171875, 0.9339752197265625, 0.996124267578125, 1.0582733154296875, 1.12042236328125, 1.1825714111328125, 1.244720458984375, 1.3068695068359375, 1.3690185546875, 1.4311676025390625, 1.493316650390625, 1.5554656982421875, 1.61761474609375, 1.6797637939453125, 1.741912841796875, 1.8040618896484375, 1.8662109375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 12.0, 9.0, 16.0, 14.0, 20.0, 15.0, 20.0, 22.0, 23.0, 26.0, 40.0, 34.0, 52.0, 51.0, 49.0, 27.0, 1074.0, 57.0, 50.0, 52.0, 35.0, 38.0, 38.0, 35.0, 30.0, 29.0, 30.0, 31.0, 15.0, 18.0, 13.0, 10.0, 11.0, 5.0, 8.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.06640625, -5.84857177734375, -5.6307373046875, -5.41290283203125, -5.195068359375, -4.97723388671875, -4.7593994140625, -4.54156494140625, -4.32373046875, -4.10589599609375, -3.8880615234375, -3.67022705078125, -3.452392578125, -3.23455810546875, -3.0167236328125, -2.79888916015625, -2.5810546875, -2.36322021484375, -2.1453857421875, -1.92755126953125, -1.709716796875, -1.49188232421875, -1.2740478515625, -1.05621337890625, -0.83837890625, -0.62054443359375, -0.4027099609375, -0.18487548828125, 0.032958984375, 0.25079345703125, 0.4686279296875, 0.68646240234375, 0.904296875, 1.12213134765625, 1.3399658203125, 1.55780029296875, 1.775634765625, 1.99346923828125, 2.2113037109375, 2.42913818359375, 2.64697265625, 2.86480712890625, 3.0826416015625, 3.30047607421875, 3.518310546875, 3.73614501953125, 3.9539794921875, 4.17181396484375, 4.3896484375, 4.60748291015625, 4.8253173828125, 5.04315185546875, 5.260986328125, 5.47882080078125, 5.6966552734375, 5.91448974609375, 6.13232421875, 6.35015869140625, 6.5679931640625, 6.78582763671875, 7.003662109375, 7.22149658203125, 7.4393310546875, 7.65716552734375, 7.875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 9.0, 7.0, 11.0, 19.0, 24.0, 21.0, 45.0, 70.0, 91.0, 100.0, 160.0, 240.0, 387.0, 550.0, 781.0, 1225.0, 1947.0, 3182.0, 5257.0, 8640.0, 14876.0, 25324.0, 45824.0, 85228.0, 168466.0, 1270359.0, 225191.0, 106976.0, 56520.0, 31131.0, 17451.0, 10316.0, 6238.0, 3810.0, 2331.0, 1413.0, 983.0, 594.0, 404.0, 286.0, 170.0, 141.0, 84.0, 69.0, 43.0, 35.0, 27.0, 22.0, 16.0, 10.0, 9.0, 3.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0], "bins": [-0.6611328125, -0.6402587890625, -0.619384765625, -0.5985107421875, -0.57763671875, -0.5567626953125, -0.535888671875, -0.5150146484375, -0.494140625, -0.4732666015625, -0.452392578125, -0.4315185546875, -0.41064453125, -0.3897705078125, -0.368896484375, -0.3480224609375, -0.3271484375, -0.3062744140625, -0.285400390625, -0.2645263671875, -0.24365234375, -0.2227783203125, -0.201904296875, -0.1810302734375, -0.16015625, -0.1392822265625, -0.118408203125, -0.0975341796875, -0.07666015625, -0.0557861328125, -0.034912109375, -0.0140380859375, 0.0068359375, 0.0277099609375, 0.048583984375, 0.0694580078125, 0.09033203125, 0.1112060546875, 0.132080078125, 0.1529541015625, 0.173828125, 0.1947021484375, 0.215576171875, 0.2364501953125, 0.25732421875, 0.2781982421875, 0.299072265625, 0.3199462890625, 0.3408203125, 0.3616943359375, 0.382568359375, 0.4034423828125, 0.42431640625, 0.4451904296875, 0.466064453125, 0.4869384765625, 0.5078125, 0.5286865234375, 0.549560546875, 0.5704345703125, 0.59130859375, 0.6121826171875, 0.633056640625, 0.6539306640625, 0.6748046875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 8.0, 2.0, 0.0, 8.0, 4.0, 8.0, 9.0, 10.0, 10.0, 15.0, 7.0, 16.0, 10.0, 17.0, 16.0, 28.0, 66.0, 109.0, 317.0, 103.0, 66.0, 22.0, 19.0, 10.0, 19.0, 11.0, 14.0, 13.0, 12.0, 11.0, 5.0, 4.0, 5.0, 2.0, 11.0, 3.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1925048828125, -0.18638229370117188, -0.18025970458984375, -0.17413711547851562, -0.1680145263671875, -0.16189193725585938, -0.15576934814453125, -0.14964675903320312, -0.143524169921875, -0.13740158081054688, -0.13127899169921875, -0.12515640258789062, -0.1190338134765625, -0.11291122436523438, -0.10678863525390625, -0.10066604614257812, -0.09454345703125, -0.08842086791992188, -0.08229827880859375, -0.07617568969726562, -0.0700531005859375, -0.06393051147460938, -0.05780792236328125, -0.051685333251953125, -0.045562744140625, -0.039440155029296875, -0.03331756591796875, -0.027194976806640625, -0.0210723876953125, -0.014949798583984375, -0.00882720947265625, -0.002704620361328125, 0.00341796875, 0.009540557861328125, 0.01566314697265625, 0.021785736083984375, 0.0279083251953125, 0.034030914306640625, 0.04015350341796875, 0.046276092529296875, 0.052398681640625, 0.058521270751953125, 0.06464385986328125, 0.07076644897460938, 0.0768890380859375, 0.08301162719726562, 0.08913421630859375, 0.09525680541992188, 0.10137939453125, 0.10750198364257812, 0.11362457275390625, 0.11974716186523438, 0.1258697509765625, 0.13199234008789062, 0.13811492919921875, 0.14423751831054688, 0.150360107421875, 0.15648269653320312, 0.16260528564453125, 0.16872787475585938, 0.1748504638671875, 0.18097305297851562, 0.18709564208984375, 0.19321823120117188, 0.1993408203125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 4.0, 4.0, 7.0, 5.0, 4.0, 5.0, 7.0, 12.0, 12.0, 15.0, 16.0, 25.0, 35.0, 31.0, 63.0, 173.0, 425.0, 6046.0, 1028305.0, 12387.0, 527.0, 167.0, 71.0, 61.0, 20.0, 23.0, 13.0, 14.0, 16.0, 11.0, 11.0, 6.0, 6.0, 5.0, 3.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28125, -4.14984130859375, -4.0184326171875, -3.88702392578125, -3.755615234375, -3.62420654296875, -3.4927978515625, -3.36138916015625, -3.22998046875, -3.09857177734375, -2.9671630859375, -2.83575439453125, -2.704345703125, -2.57293701171875, -2.4415283203125, -2.31011962890625, -2.1787109375, -2.04730224609375, -1.9158935546875, -1.78448486328125, -1.653076171875, -1.52166748046875, -1.3902587890625, -1.25885009765625, -1.12744140625, -0.99603271484375, -0.8646240234375, -0.73321533203125, -0.601806640625, -0.47039794921875, -0.3389892578125, -0.20758056640625, -0.076171875, 0.05523681640625, 0.1866455078125, 0.31805419921875, 0.449462890625, 0.58087158203125, 0.7122802734375, 0.84368896484375, 0.97509765625, 1.10650634765625, 1.2379150390625, 1.36932373046875, 1.500732421875, 1.63214111328125, 1.7635498046875, 1.89495849609375, 2.0263671875, 2.15777587890625, 2.2891845703125, 2.42059326171875, 2.552001953125, 2.68341064453125, 2.8148193359375, 2.94622802734375, 3.07763671875, 3.20904541015625, 3.3404541015625, 3.47186279296875, 3.603271484375, 3.73468017578125, 3.8660888671875, 3.99749755859375, 4.12890625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 16.0, 32.0, 78.0, 206.0, 432.0, 145.0, 49.0, 28.0, 14.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.728989601135254, -1.6871917247772217, -1.6453938484191895, -1.6035958528518677, -1.5617979764938354, -1.5200001001358032, -1.4782021045684814, -1.4364042282104492, -1.394606351852417, -1.3528084754943848, -1.3110105991363525, -1.2692126035690308, -1.2274147272109985, -1.1856168508529663, -1.1438188552856445, -1.1020209789276123, -1.06022310256958, -1.0184252262115479, -0.9766272902488708, -0.9348293542861938, -0.8930314779281616, -0.8512336015701294, -0.8094356656074524, -0.7676377296447754, -0.7258398532867432, -0.6840419769287109, -0.6422440409660339, -0.6004461050033569, -0.5586482286453247, -0.5168503522872925, -0.4750524163246155, -0.43325451016426086, -0.3914567232131958, -0.3496588170528412, -0.3078609108924866, -0.26606300473213196, -0.22426509857177734, -0.18246719241142273, -0.14066928625106812, -0.0988713800907135, -0.05707347393035889, -0.015275567770004272, 0.026522338390350342, 0.06832024455070496, 0.11011815071105957, 0.15191605687141418, 0.1937139630317688, 0.2355118691921234, 0.277309775352478, 0.31910768151283264, 0.36090558767318726, 0.40270349383354187, 0.4445013999938965, 0.4862993061542511, 0.5280972123146057, 0.5698951482772827, 0.6116930246353149, 0.6534909009933472, 0.6952888369560242, 0.7370867729187012, 0.7788846492767334, 0.8206825256347656, 0.8624804615974426, 0.9042783975601196, 0.9460762739181519]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 3.0, 5.0, 8.0, 5.0, 7.0, 10.0, 13.0, 9.0, 17.0, 15.0, 12.0, 27.0, 22.0, 29.0, 29.0, 37.0, 24.0, 36.0, 24.0, 31.0, 36.0, 48.0, 34.0, 32.0, 38.0, 29.0, 24.0, 37.0, 25.0, 34.0, 26.0, 30.0, 21.0, 40.0, 24.0, 21.0, 26.0, 19.0, 17.0, 14.0, 9.0, 9.0, 17.0, 6.0, 9.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.4947187900543213, -0.4796886742115021, -0.46465858817100525, -0.44962847232818604, -0.4345983862876892, -0.41956827044487, -0.4045381546020508, -0.38950806856155396, -0.37447795271873474, -0.3594478368759155, -0.3444177508354187, -0.3293876349925995, -0.31435754895210266, -0.29932743310928345, -0.2842973470687866, -0.2692672312259674, -0.2542371153831482, -0.23920701444149017, -0.22417691349983215, -0.20914679765701294, -0.19411669671535492, -0.1790865957736969, -0.16405649483203888, -0.14902639389038086, -0.13399630784988403, -0.11896620690822601, -0.1039360985159874, -0.08890599757432938, -0.07387588918209076, -0.05884578824043274, -0.04381568729877472, -0.028785578906536102, -0.013755470514297485, 0.0012746332213282585, 0.016304736956954002, 0.03133483976125717, 0.04636494442820549, 0.06139504909515381, 0.07642515003681183, 0.09145525842905045, 0.10648535937070847, 0.12151546031236649, 0.1365455687046051, 0.15157566964626312, 0.16660577058792114, 0.18163588643074036, 0.19666597247123718, 0.2116960883140564, 0.22672618925571442, 0.24175629019737244, 0.25678640604019165, 0.2718164920806885, 0.2868466079235077, 0.3018767237663269, 0.31690680980682373, 0.33193692564964294, 0.34696701169013977, 0.361997127532959, 0.3770272135734558, 0.392057329416275, 0.40708741545677185, 0.42211753129959106, 0.4371476173400879, 0.4521777331829071, 0.4672078490257263]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 7.0, 6.0, 11.0, 10.0, 15.0, 14.0, 28.0, 16.0, 27.0, 35.0, 37.0, 52.0, 51.0, 39.0, 51.0, 66.0, 52.0, 50.0, 50.0, 52.0, 40.0, 39.0, 42.0, 39.0, 29.0, 25.0, 20.0, 22.0, 26.0, 7.0, 11.0, 7.0, 8.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.625, -11.281494140625, -10.93798828125, -10.594482421875, -10.2509765625, -9.907470703125, -9.56396484375, -9.220458984375, -8.876953125, -8.533447265625, -8.18994140625, -7.846435546875, -7.5029296875, -7.159423828125, -6.81591796875, -6.472412109375, -6.12890625, -5.785400390625, -5.44189453125, -5.098388671875, -4.7548828125, -4.411376953125, -4.06787109375, -3.724365234375, -3.380859375, -3.037353515625, -2.69384765625, -2.350341796875, -2.0068359375, -1.663330078125, -1.31982421875, -0.976318359375, -0.6328125, -0.289306640625, 0.05419921875, 0.397705078125, 0.7412109375, 1.084716796875, 1.42822265625, 1.771728515625, 2.115234375, 2.458740234375, 2.80224609375, 3.145751953125, 3.4892578125, 3.832763671875, 4.17626953125, 4.519775390625, 4.86328125, 5.206787109375, 5.55029296875, 5.893798828125, 6.2373046875, 6.580810546875, 6.92431640625, 7.267822265625, 7.611328125, 7.954833984375, 8.29833984375, 8.641845703125, 8.9853515625, 9.328857421875, 9.67236328125, 10.015869140625, 10.359375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 20.0, 22.0, 23.0, 39.0, 59.0, 78.0, 122.0, 147.0, 234.0, 346.0, 569.0, 889.0, 1408.0, 2537.0, 4864.0, 9881.0, 24505.0, 76080.0, 317517.0, 450921.0, 102761.0, 30689.0, 11798.0, 5626.0, 2952.0, 1699.0, 969.0, 601.0, 396.0, 278.0, 150.0, 118.0, 76.0, 51.0, 31.0, 25.0, 27.0, 17.0, 8.0, 9.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-16.96875, -16.4854736328125, -16.002197265625, -15.5189208984375, -15.03564453125, -14.5523681640625, -14.069091796875, -13.5858154296875, -13.1025390625, -12.6192626953125, -12.135986328125, -11.6527099609375, -11.16943359375, -10.6861572265625, -10.202880859375, -9.7196044921875, -9.236328125, -8.7530517578125, -8.269775390625, -7.7864990234375, -7.30322265625, -6.8199462890625, -6.336669921875, -5.8533935546875, -5.3701171875, -4.8868408203125, -4.403564453125, -3.9202880859375, -3.43701171875, -2.9537353515625, -2.470458984375, -1.9871826171875, -1.50390625, -1.0206298828125, -0.537353515625, -0.0540771484375, 0.42919921875, 0.9124755859375, 1.395751953125, 1.8790283203125, 2.3623046875, 2.8455810546875, 3.328857421875, 3.8121337890625, 4.29541015625, 4.7786865234375, 5.261962890625, 5.7452392578125, 6.228515625, 6.7117919921875, 7.195068359375, 7.6783447265625, 8.16162109375, 8.6448974609375, 9.128173828125, 9.6114501953125, 10.0947265625, 10.5780029296875, 11.061279296875, 11.5445556640625, 12.02783203125, 12.5111083984375, 12.994384765625, 13.4776611328125, 13.9609375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 3.0, 9.0, 3.0, 9.0, 17.0, 10.0, 19.0, 17.0, 15.0, 22.0, 24.0, 38.0, 28.0, 26.0, 33.0, 56.0, 57.0, 67.0, 120.0, 253.0, 1482.0, 208.0, 106.0, 61.0, 50.0, 40.0, 43.0, 40.0, 23.0, 16.0, 21.0, 23.0, 10.0, 21.0, 15.0, 17.0, 9.0, 9.0, 8.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-25.75, -24.97900390625, -24.2080078125, -23.43701171875, -22.666015625, -21.89501953125, -21.1240234375, -20.35302734375, -19.58203125, -18.81103515625, -18.0400390625, -17.26904296875, -16.498046875, -15.72705078125, -14.9560546875, -14.18505859375, -13.4140625, -12.64306640625, -11.8720703125, -11.10107421875, -10.330078125, -9.55908203125, -8.7880859375, -8.01708984375, -7.24609375, -6.47509765625, -5.7041015625, -4.93310546875, -4.162109375, -3.39111328125, -2.6201171875, -1.84912109375, -1.078125, -0.30712890625, 0.4638671875, 1.23486328125, 2.005859375, 2.77685546875, 3.5478515625, 4.31884765625, 5.08984375, 5.86083984375, 6.6318359375, 7.40283203125, 8.173828125, 8.94482421875, 9.7158203125, 10.48681640625, 11.2578125, 12.02880859375, 12.7998046875, 13.57080078125, 14.341796875, 15.11279296875, 15.8837890625, 16.65478515625, 17.42578125, 18.19677734375, 18.9677734375, 19.73876953125, 20.509765625, 21.28076171875, 22.0517578125, 22.82275390625, 23.59375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 1.0, 1.0, 7.0, 12.0, 11.0, 20.0, 20.0, 23.0, 30.0, 51.0, 43.0, 59.0, 77.0, 95.0, 150.0, 195.0, 306.0, 627.0, 1840.0, 8653.0, 141329.0, 2907085.0, 75516.0, 6431.0, 1476.0, 553.0, 283.0, 191.0, 118.0, 105.0, 86.0, 61.0, 53.0, 43.0, 37.0, 22.0, 28.0, 15.0, 10.0, 6.0, 9.0, 7.0, 9.0, 2.0, 5.0, 0.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.65625, -45.17138671875, -43.6865234375, -42.20166015625, -40.716796875, -39.23193359375, -37.7470703125, -36.26220703125, -34.77734375, -33.29248046875, -31.8076171875, -30.32275390625, -28.837890625, -27.35302734375, -25.8681640625, -24.38330078125, -22.8984375, -21.41357421875, -19.9287109375, -18.44384765625, -16.958984375, -15.47412109375, -13.9892578125, -12.50439453125, -11.01953125, -9.53466796875, -8.0498046875, -6.56494140625, -5.080078125, -3.59521484375, -2.1103515625, -0.62548828125, 0.859375, 2.34423828125, 3.8291015625, 5.31396484375, 6.798828125, 8.28369140625, 9.7685546875, 11.25341796875, 12.73828125, 14.22314453125, 15.7080078125, 17.19287109375, 18.677734375, 20.16259765625, 21.6474609375, 23.13232421875, 24.6171875, 26.10205078125, 27.5869140625, 29.07177734375, 30.556640625, 32.04150390625, 33.5263671875, 35.01123046875, 36.49609375, 37.98095703125, 39.4658203125, 40.95068359375, 42.435546875, 43.92041015625, 45.4052734375, 46.89013671875, 48.375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 22.0, 347.0, 540.0, 103.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.33827209472656, -30.995132446289062, -23.651994705200195, -16.308856964111328, -8.965717315673828, -1.6225776672363281, 5.720558166503906, 13.063697814941406, 20.406837463378906, 27.749977111816406, 35.093116760253906, 42.43625259399414, 49.77939224243164, 57.12253189086914, 64.46566772460938, 71.80880737304688, 79.15194702148438, 86.49508666992188, 93.83822631835938, 101.18136596679688, 108.52450561523438, 115.86764526367188, 123.21077728271484, 130.55392456054688, 137.89706420898438, 145.24020385742188, 152.58334350585938, 159.92648315429688, 167.26962280273438, 174.61276245117188, 181.95590209960938, 189.29904174804688, 196.64218139648438, 203.98532104492188, 211.32846069335938, 218.67160034179688, 226.01473999023438, 233.35787963867188, 240.70101928710938, 248.04415893554688, 255.38729858398438, 262.7304382324219, 270.0735778808594, 277.4167175292969, 284.7598571777344, 292.1029968261719, 299.4461364746094, 306.7892761230469, 314.13238525390625, 321.47552490234375, 328.81866455078125, 336.16180419921875, 343.50494384765625, 350.84808349609375, 358.19122314453125, 365.53436279296875, 372.87750244140625, 380.22064208984375, 387.56378173828125, 394.90692138671875, 402.25006103515625, 409.59320068359375, 416.93634033203125, 424.27947998046875, 431.62261962890625]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 9.0, 3.0, 6.0, 10.0, 10.0, 14.0, 18.0, 13.0, 12.0, 30.0, 25.0, 23.0, 19.0, 26.0, 34.0, 35.0, 32.0, 26.0, 29.0, 37.0, 37.0, 43.0, 57.0, 38.0, 40.0, 36.0, 36.0, 31.0, 28.0, 35.0, 25.0, 29.0, 24.0, 14.0, 17.0, 19.0, 12.0, 7.0, 7.0, 9.0, 13.0, 9.0, 2.0, 7.0, 6.0, 3.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0], "bins": [-62.882659912109375, -61.04526901245117, -59.20787811279297, -57.37049102783203, -55.53310012817383, -53.695709228515625, -51.85831832885742, -50.02092742919922, -48.18354034423828, -46.34614944458008, -44.508758544921875, -42.67137145996094, -40.833980560302734, -38.99658966064453, -37.15919876098633, -35.321807861328125, -33.48441696166992, -31.64702606201172, -29.80963706970215, -27.972246170043945, -26.134857177734375, -24.297466278076172, -22.46007537841797, -20.622684478759766, -18.785295486450195, -16.947904586791992, -15.110515594482422, -13.273124694824219, -11.435734748840332, -9.598344802856445, -7.760953903198242, -5.9235639572143555, -4.086174011230469, -2.248783826828003, -0.4113936424255371, 1.4259967803955078, 3.2633867263793945, 5.100776672363281, 6.938167572021484, 8.775557518005371, 10.612947463989258, 12.450337409973145, 14.287727355957031, 16.125118255615234, 17.962509155273438, 19.799898147583008, 21.63728904724121, 23.47467803955078, 25.312068939208984, 27.149459838867188, 28.986848831176758, 30.82423973083496, 32.66162872314453, 34.499019622802734, 36.33641052246094, 38.17380142211914, 40.011192321777344, 41.84858322143555, 43.68597412109375, 45.52336120605469, 47.36075210571289, 49.198143005371094, 51.0355339050293, 52.8729248046875, 54.71031188964844]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 4.0, 11.0, 11.0, 12.0, 21.0, 19.0, 23.0, 24.0, 34.0, 38.0, 36.0, 45.0, 48.0, 53.0, 47.0, 58.0, 44.0, 52.0, 48.0, 46.0, 48.0, 45.0, 37.0, 25.0, 29.0, 20.0, 25.0, 25.0, 21.0, 14.0, 7.0, 4.0, 7.0, 4.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.453125, -11.09912109375, -10.7451171875, -10.39111328125, -10.037109375, -9.68310546875, -9.3291015625, -8.97509765625, -8.62109375, -8.26708984375, -7.9130859375, -7.55908203125, -7.205078125, -6.85107421875, -6.4970703125, -6.14306640625, -5.7890625, -5.43505859375, -5.0810546875, -4.72705078125, -4.373046875, -4.01904296875, -3.6650390625, -3.31103515625, -2.95703125, -2.60302734375, -2.2490234375, -1.89501953125, -1.541015625, -1.18701171875, -0.8330078125, -0.47900390625, -0.125, 0.22900390625, 0.5830078125, 0.93701171875, 1.291015625, 1.64501953125, 1.9990234375, 2.35302734375, 2.70703125, 3.06103515625, 3.4150390625, 3.76904296875, 4.123046875, 4.47705078125, 4.8310546875, 5.18505859375, 5.5390625, 5.89306640625, 6.2470703125, 6.60107421875, 6.955078125, 7.30908203125, 7.6630859375, 8.01708984375, 8.37109375, 8.72509765625, 9.0791015625, 9.43310546875, 9.787109375, 10.14111328125, 10.4951171875, 10.84912109375, 11.203125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 14.0, 10.0, 6.0, 19.0, 23.0, 34.0, 44.0, 64.0, 95.0, 162.0, 235.0, 414.0, 661.0, 1188.0, 2352.0, 5303.0, 13531.0, 53492.0, 561600.0, 3067099.0, 420491.0, 45137.0, 12368.0, 4908.0, 2136.0, 1143.0, 640.0, 378.0, 237.0, 142.0, 117.0, 76.0, 34.0, 36.0, 26.0, 26.0, 11.0, 15.0, 8.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-32.5625, -31.669189453125, -30.77587890625, -29.882568359375, -28.9892578125, -28.095947265625, -27.20263671875, -26.309326171875, -25.416015625, -24.522705078125, -23.62939453125, -22.736083984375, -21.8427734375, -20.949462890625, -20.05615234375, -19.162841796875, -18.26953125, -17.376220703125, -16.48291015625, -15.589599609375, -14.6962890625, -13.802978515625, -12.90966796875, -12.016357421875, -11.123046875, -10.229736328125, -9.33642578125, -8.443115234375, -7.5498046875, -6.656494140625, -5.76318359375, -4.869873046875, -3.9765625, -3.083251953125, -2.18994140625, -1.296630859375, -0.4033203125, 0.489990234375, 1.38330078125, 2.276611328125, 3.169921875, 4.063232421875, 4.95654296875, 5.849853515625, 6.7431640625, 7.636474609375, 8.52978515625, 9.423095703125, 10.31640625, 11.209716796875, 12.10302734375, 12.996337890625, 13.8896484375, 14.782958984375, 15.67626953125, 16.569580078125, 17.462890625, 18.356201171875, 19.24951171875, 20.142822265625, 21.0361328125, 21.929443359375, 22.82275390625, 23.716064453125, 24.609375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 3.0, 11.0, 11.0, 18.0, 18.0, 30.0, 47.0, 67.0, 92.0, 150.0, 212.0, 341.0, 508.0, 629.0, 566.0, 453.0, 284.0, 179.0, 131.0, 73.0, 72.0, 41.0, 39.0, 26.0, 19.0, 14.0, 15.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.78125, -21.137939453125, -20.49462890625, -19.851318359375, -19.2080078125, -18.564697265625, -17.92138671875, -17.278076171875, -16.634765625, -15.991455078125, -15.34814453125, -14.704833984375, -14.0615234375, -13.418212890625, -12.77490234375, -12.131591796875, -11.48828125, -10.844970703125, -10.20166015625, -9.558349609375, -8.9150390625, -8.271728515625, -7.62841796875, -6.985107421875, -6.341796875, -5.698486328125, -5.05517578125, -4.411865234375, -3.7685546875, -3.125244140625, -2.48193359375, -1.838623046875, -1.1953125, -0.552001953125, 0.09130859375, 0.734619140625, 1.3779296875, 2.021240234375, 2.66455078125, 3.307861328125, 3.951171875, 4.594482421875, 5.23779296875, 5.881103515625, 6.5244140625, 7.167724609375, 7.81103515625, 8.454345703125, 9.09765625, 9.740966796875, 10.38427734375, 11.027587890625, 11.6708984375, 12.314208984375, 12.95751953125, 13.600830078125, 14.244140625, 14.887451171875, 15.53076171875, 16.174072265625, 16.8173828125, 17.460693359375, 18.10400390625, 18.747314453125, 19.390625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 2.0, 1.0, 2.0, 7.0, 10.0, 14.0, 8.0, 11.0, 13.0, 26.0, 37.0, 51.0, 48.0, 81.0, 125.0, 193.0, 423.0, 1036.0, 3911.0, 45100.0, 3708968.0, 419162.0, 11679.0, 1977.0, 635.0, 294.0, 146.0, 90.0, 69.0, 39.0, 30.0, 30.0, 15.0, 12.0, 9.0, 10.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-80.875, -78.1572265625, -75.439453125, -72.7216796875, -70.00390625, -67.2861328125, -64.568359375, -61.8505859375, -59.1328125, -56.4150390625, -53.697265625, -50.9794921875, -48.26171875, -45.5439453125, -42.826171875, -40.1083984375, -37.390625, -34.6728515625, -31.955078125, -29.2373046875, -26.51953125, -23.8017578125, -21.083984375, -18.3662109375, -15.6484375, -12.9306640625, -10.212890625, -7.4951171875, -4.77734375, -2.0595703125, 0.658203125, 3.3759765625, 6.09375, 8.8115234375, 11.529296875, 14.2470703125, 16.96484375, 19.6826171875, 22.400390625, 25.1181640625, 27.8359375, 30.5537109375, 33.271484375, 35.9892578125, 38.70703125, 41.4248046875, 44.142578125, 46.8603515625, 49.578125, 52.2958984375, 55.013671875, 57.7314453125, 60.44921875, 63.1669921875, 65.884765625, 68.6025390625, 71.3203125, 74.0380859375, 76.755859375, 79.4736328125, 82.19140625, 84.9091796875, 87.626953125, 90.3447265625, 93.0625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 8.0, 15.0, 23.0, 36.0, 61.0, 68.0, 115.0, 168.0, 146.0, 110.0, 115.0, 50.0, 40.0, 23.0, 9.0, 14.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.791595458984375, -42.027671813964844, -38.26375198364258, -34.49983215332031, -30.73590850830078, -26.971986770629883, -23.208065032958984, -19.444143295288086, -15.680221557617188, -11.916299819946289, -8.15237808227539, -4.388456344604492, -0.6245346069335938, 3.1393871307373047, 6.903308868408203, 10.667230606079102, 14.43115234375, 18.1950740814209, 21.958995819091797, 25.722917556762695, 29.486839294433594, 33.250762939453125, 37.01468276977539, 40.778602600097656, 44.54252624511719, 48.30644989013672, 52.070369720458984, 55.83428955078125, 59.59821319580078, 63.36213684082031, 67.12605285644531, 70.88997650146484, 74.65390014648438, 78.4178237915039, 82.18174743652344, 85.94566345214844, 89.70958709716797, 93.4735107421875, 97.2374267578125, 101.00135040283203, 104.76527404785156, 108.5291976928711, 112.29312133789062, 116.05703735351562, 119.82096099853516, 123.58488464355469, 127.34880065917969, 131.11273193359375, 134.87664794921875, 138.64056396484375, 142.4044952392578, 146.1684112548828, 149.93234252929688, 153.69625854492188, 157.46017456054688, 161.22410583496094, 164.98802185058594, 168.75193786621094, 172.515869140625, 176.27978515625, 180.043701171875, 183.80763244628906, 187.57154846191406, 191.33547973632812, 195.09939575195312]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 3.0, 6.0, 6.0, 4.0, 9.0, 3.0, 16.0, 19.0, 15.0, 24.0, 28.0, 20.0, 31.0, 25.0, 32.0, 27.0, 36.0, 37.0, 46.0, 26.0, 29.0, 41.0, 35.0, 44.0, 32.0, 37.0, 40.0, 33.0, 30.0, 26.0, 27.0, 22.0, 25.0, 29.0, 20.0, 21.0, 14.0, 11.0, 14.0, 8.0, 8.0, 12.0, 6.0, 3.0, 7.0, 4.0, 4.0, 0.0, 3.0, 2.0, 3.0, 4.0], "bins": [-61.32733154296875, -59.58025360107422, -57.83317565917969, -56.08610153198242, -54.33902359008789, -52.59194564819336, -50.84486770629883, -49.09779357910156, -47.35071563720703, -45.6036376953125, -43.85655975341797, -42.1094856262207, -40.36240768432617, -38.61532974243164, -36.86825180053711, -35.121177673339844, -33.37409973144531, -31.62702178955078, -29.879945755004883, -28.13286781311035, -26.385791778564453, -24.638713836669922, -22.89163589477539, -21.144559860229492, -19.397480010986328, -17.650402069091797, -15.903326034545898, -14.156248092651367, -12.409172058105469, -10.662094116210938, -8.915017127990723, -7.167940139770508, -5.420864105224609, -3.6737871170043945, -1.9267098903656006, -0.17963266372680664, 1.5674443244934082, 3.3145217895507812, 5.061598777770996, 6.808675765991211, 8.555752754211426, 10.30282974243164, 12.049906730651855, 13.79698371887207, 15.544061660766602, 17.2911376953125, 19.03821563720703, 20.785293579101562, 22.53236961364746, 24.279447555541992, 26.02652359008789, 27.773601531982422, 29.52067756652832, 31.26775550842285, 33.01483154296875, 34.76190948486328, 36.50898742675781, 38.256065368652344, 40.003143310546875, 41.75021743774414, 43.49729537963867, 45.2443733215332, 46.991451263427734, 48.738525390625, 50.48560333251953]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 13.0, 5.0, 6.0, 11.0, 10.0, 7.0, 19.0, 21.0, 25.0, 28.0, 32.0, 41.0, 44.0, 52.0, 34.0, 53.0, 37.0, 51.0, 62.0, 46.0, 47.0, 41.0, 43.0, 35.0, 35.0, 29.0, 23.0, 31.0, 26.0, 19.0, 11.0, 10.0, 17.0, 6.0, 7.0, 5.0, 6.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.359375, -10.026611328125, -9.69384765625, -9.361083984375, -9.0283203125, -8.695556640625, -8.36279296875, -8.030029296875, -7.697265625, -7.364501953125, -7.03173828125, -6.698974609375, -6.3662109375, -6.033447265625, -5.70068359375, -5.367919921875, -5.03515625, -4.702392578125, -4.36962890625, -4.036865234375, -3.7041015625, -3.371337890625, -3.03857421875, -2.705810546875, -2.373046875, -2.040283203125, -1.70751953125, -1.374755859375, -1.0419921875, -0.709228515625, -0.37646484375, -0.043701171875, 0.2890625, 0.621826171875, 0.95458984375, 1.287353515625, 1.6201171875, 1.952880859375, 2.28564453125, 2.618408203125, 2.951171875, 3.283935546875, 3.61669921875, 3.949462890625, 4.2822265625, 4.614990234375, 4.94775390625, 5.280517578125, 5.61328125, 5.946044921875, 6.27880859375, 6.611572265625, 6.9443359375, 7.277099609375, 7.60986328125, 7.942626953125, 8.275390625, 8.608154296875, 8.94091796875, 9.273681640625, 9.6064453125, 9.939208984375, 10.27197265625, 10.604736328125, 10.9375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 5.0, 16.0, 29.0, 40.0, 67.0, 95.0, 144.0, 254.0, 377.0, 556.0, 914.0, 1409.0, 2253.0, 3540.0, 5689.0, 9337.0, 15347.0, 25341.0, 42325.0, 72734.0, 124428.0, 194141.0, 207738.0, 138787.0, 82506.0, 47810.0, 27998.0, 16993.0, 10530.0, 6277.0, 3998.0, 2535.0, 1539.0, 993.0, 612.0, 457.0, 266.0, 167.0, 121.0, 61.0, 51.0, 26.0, 19.0, 10.0, 8.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2607421875, -1.2188720703125, -1.177001953125, -1.1351318359375, -1.09326171875, -1.0513916015625, -1.009521484375, -0.9676513671875, -0.92578125, -0.8839111328125, -0.842041015625, -0.8001708984375, -0.75830078125, -0.7164306640625, -0.674560546875, -0.6326904296875, -0.5908203125, -0.5489501953125, -0.507080078125, -0.4652099609375, -0.42333984375, -0.3814697265625, -0.339599609375, -0.2977294921875, -0.255859375, -0.2139892578125, -0.172119140625, -0.1302490234375, -0.08837890625, -0.0465087890625, -0.004638671875, 0.0372314453125, 0.0791015625, 0.1209716796875, 0.162841796875, 0.2047119140625, 0.24658203125, 0.2884521484375, 0.330322265625, 0.3721923828125, 0.4140625, 0.4559326171875, 0.497802734375, 0.5396728515625, 0.58154296875, 0.6234130859375, 0.665283203125, 0.7071533203125, 0.7490234375, 0.7908935546875, 0.832763671875, 0.8746337890625, 0.91650390625, 0.9583740234375, 1.000244140625, 1.0421142578125, 1.083984375, 1.1258544921875, 1.167724609375, 1.2095947265625, 1.25146484375, 1.2933349609375, 1.335205078125, 1.3770751953125, 1.4189453125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 1.0, 2.0, 4.0, 6.0, 5.0, 9.0, 5.0, 9.0, 7.0, 20.0, 17.0, 16.0, 21.0, 20.0, 18.0, 31.0, 26.0, 38.0, 31.0, 30.0, 48.0, 21.0, 43.0, 42.0, 1062.0, 31.0, 36.0, 38.0, 40.0, 34.0, 35.0, 26.0, 40.0, 37.0, 13.0, 24.0, 22.0, 18.0, 12.0, 17.0, 7.0, 19.0, 6.0, 11.0, 4.0, 7.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-5.74609375, -5.56475830078125, -5.3834228515625, -5.20208740234375, -5.020751953125, -4.83941650390625, -4.6580810546875, -4.47674560546875, -4.29541015625, -4.11407470703125, -3.9327392578125, -3.75140380859375, -3.570068359375, -3.38873291015625, -3.2073974609375, -3.02606201171875, -2.8447265625, -2.66339111328125, -2.4820556640625, -2.30072021484375, -2.119384765625, -1.93804931640625, -1.7567138671875, -1.57537841796875, -1.39404296875, -1.21270751953125, -1.0313720703125, -0.85003662109375, -0.668701171875, -0.48736572265625, -0.3060302734375, -0.12469482421875, 0.056640625, 0.23797607421875, 0.4193115234375, 0.60064697265625, 0.781982421875, 0.96331787109375, 1.1446533203125, 1.32598876953125, 1.50732421875, 1.68865966796875, 1.8699951171875, 2.05133056640625, 2.232666015625, 2.41400146484375, 2.5953369140625, 2.77667236328125, 2.9580078125, 3.13934326171875, 3.3206787109375, 3.50201416015625, 3.683349609375, 3.86468505859375, 4.0460205078125, 4.22735595703125, 4.40869140625, 4.59002685546875, 4.7713623046875, 4.95269775390625, 5.134033203125, 5.31536865234375, 5.4967041015625, 5.67803955078125, 5.859375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 4.0, 10.0, 20.0, 28.0, 38.0, 54.0, 105.0, 163.0, 201.0, 372.0, 598.0, 1064.0, 1733.0, 2840.0, 4716.0, 8012.0, 13749.0, 23777.0, 43023.0, 80510.0, 154448.0, 1262589.0, 246168.0, 115080.0, 60007.0, 32712.0, 18722.0, 10641.0, 6215.0, 3832.0, 2194.0, 1303.0, 789.0, 523.0, 360.0, 195.0, 117.0, 75.0, 42.0, 32.0, 19.0, 22.0, 7.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.787109375, -0.765106201171875, -0.74310302734375, -0.721099853515625, -0.6990966796875, -0.677093505859375, -0.65509033203125, -0.633087158203125, -0.611083984375, -0.589080810546875, -0.56707763671875, -0.545074462890625, -0.5230712890625, -0.501068115234375, -0.47906494140625, -0.457061767578125, -0.43505859375, -0.413055419921875, -0.39105224609375, -0.369049072265625, -0.3470458984375, -0.325042724609375, -0.30303955078125, -0.281036376953125, -0.259033203125, -0.237030029296875, -0.21502685546875, -0.193023681640625, -0.1710205078125, -0.149017333984375, -0.12701416015625, -0.105010986328125, -0.0830078125, -0.061004638671875, -0.03900146484375, -0.016998291015625, 0.0050048828125, 0.027008056640625, 0.04901123046875, 0.071014404296875, 0.093017578125, 0.115020751953125, 0.13702392578125, 0.159027099609375, 0.1810302734375, 0.203033447265625, 0.22503662109375, 0.247039794921875, 0.26904296875, 0.291046142578125, 0.31304931640625, 0.335052490234375, 0.3570556640625, 0.379058837890625, 0.40106201171875, 0.423065185546875, 0.445068359375, 0.467071533203125, 0.48907470703125, 0.511077880859375, 0.5330810546875, 0.555084228515625, 0.57708740234375, 0.599090576171875, 0.62109375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 1.0, 7.0, 5.0, 4.0, 10.0, 5.0, 4.0, 7.0, 8.0, 21.0, 14.0, 15.0, 20.0, 21.0, 41.0, 49.0, 62.0, 125.0, 243.0, 93.0, 56.0, 38.0, 18.0, 19.0, 19.0, 12.0, 9.0, 11.0, 14.0, 5.0, 8.0, 10.0, 8.0, 2.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1304931640625, -0.12668991088867188, -0.12288665771484375, -0.11908340454101562, -0.1152801513671875, -0.11147689819335938, -0.10767364501953125, -0.10387039184570312, -0.100067138671875, -0.09626388549804688, -0.09246063232421875, -0.08865737915039062, -0.0848541259765625, -0.08105087280273438, -0.07724761962890625, -0.07344436645507812, -0.06964111328125, -0.06583786010742188, -0.06203460693359375, -0.058231353759765625, -0.0544281005859375, -0.050624847412109375, -0.04682159423828125, -0.043018341064453125, -0.039215087890625, -0.035411834716796875, -0.03160858154296875, -0.027805328369140625, -0.0240020751953125, -0.020198822021484375, -0.01639556884765625, -0.012592315673828125, -0.0087890625, -0.004985809326171875, -0.00118255615234375, 0.002620697021484375, 0.0064239501953125, 0.010227203369140625, 0.01403045654296875, 0.017833709716796875, 0.021636962890625, 0.025440216064453125, 0.02924346923828125, 0.033046722412109375, 0.0368499755859375, 0.040653228759765625, 0.04445648193359375, 0.048259735107421875, 0.05206298828125, 0.055866241455078125, 0.05966949462890625, 0.06347274780273438, 0.0672760009765625, 0.07107925415039062, 0.07488250732421875, 0.07868576049804688, 0.082489013671875, 0.08629226684570312, 0.09009552001953125, 0.09389877319335938, 0.0977020263671875, 0.10150527954101562, 0.10530853271484375, 0.10911178588867188, 0.1129150390625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 8.0, 11.0, 3.0, 9.0, 12.0, 9.0, 17.0, 13.0, 27.0, 38.0, 69.0, 145.0, 451.0, 8749.0, 1003198.0, 34469.0, 819.0, 214.0, 89.0, 48.0, 39.0, 19.0, 16.0, 18.0, 9.0, 3.0, 8.0, 8.0, 4.0, 6.0, 5.0, 4.0, 0.0, 6.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.67578125, -2.58551025390625, -2.4952392578125, -2.40496826171875, -2.314697265625, -2.22442626953125, -2.1341552734375, -2.04388427734375, -1.95361328125, -1.86334228515625, -1.7730712890625, -1.68280029296875, -1.592529296875, -1.50225830078125, -1.4119873046875, -1.32171630859375, -1.2314453125, -1.14117431640625, -1.0509033203125, -0.96063232421875, -0.870361328125, -0.78009033203125, -0.6898193359375, -0.59954833984375, -0.50927734375, -0.41900634765625, -0.3287353515625, -0.23846435546875, -0.148193359375, -0.05792236328125, 0.0323486328125, 0.12261962890625, 0.212890625, 0.30316162109375, 0.3934326171875, 0.48370361328125, 0.573974609375, 0.66424560546875, 0.7545166015625, 0.84478759765625, 0.93505859375, 1.02532958984375, 1.1156005859375, 1.20587158203125, 1.296142578125, 1.38641357421875, 1.4766845703125, 1.56695556640625, 1.6572265625, 1.74749755859375, 1.8377685546875, 1.92803955078125, 2.018310546875, 2.10858154296875, 2.1988525390625, 2.28912353515625, 2.37939453125, 2.46966552734375, 2.5599365234375, 2.65020751953125, 2.740478515625, 2.83074951171875, 2.9210205078125, 3.01129150390625, 3.1015625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 10.0, 17.0, 21.0, 17.0, 45.0, 81.0, 117.0, 198.0, 210.0, 90.0, 51.0, 35.0, 29.0, 23.0, 11.0, 7.0, 10.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6201918125152588, -0.5994992852210999, -0.5788067579269409, -0.558114230632782, -0.537421703338623, -0.5167291760444641, -0.4960366487503052, -0.47534412145614624, -0.4546515941619873, -0.43395906686782837, -0.41326653957366943, -0.3925740122795105, -0.37188148498535156, -0.3511889576911926, -0.3304964303970337, -0.30980390310287476, -0.2891114056110382, -0.2684188783168793, -0.24772635102272034, -0.2270338237285614, -0.20634129643440247, -0.18564876914024353, -0.1649562567472458, -0.14426372945308685, -0.12357120215892792, -0.10287867486476898, -0.08218614757061005, -0.06149362772703171, -0.04080110043287277, -0.020108573138713837, 0.000583946704864502, 0.021276473999023438, 0.04196900129318237, 0.06266152858734131, 0.08335405588150024, 0.10404657572507858, 0.12473910301923752, 0.14543163776397705, 0.1661241501569748, 0.18681667745113373, 0.20750920474529266, 0.2282017320394516, 0.24889425933361053, 0.2695867717266083, 0.2902792990207672, 0.31097182631492615, 0.3316643536090851, 0.352356880903244, 0.37304940819740295, 0.3937419354915619, 0.4144344627857208, 0.43512699007987976, 0.4558195173740387, 0.47651204466819763, 0.4972045421600342, 0.5178970694541931, 0.538589596748352, 0.559282124042511, 0.5799746513366699, 0.6006671786308289, 0.6213597059249878, 0.6420522332191467, 0.6627447605133057, 0.6834372878074646, 0.7041298151016235]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 5.0, 9.0, 0.0, 5.0, 5.0, 13.0, 10.0, 22.0, 20.0, 11.0, 18.0, 21.0, 29.0, 23.0, 22.0, 31.0, 33.0, 44.0, 43.0, 36.0, 42.0, 51.0, 40.0, 41.0, 41.0, 29.0, 37.0, 28.0, 29.0, 33.0, 27.0, 15.0, 28.0, 14.0, 34.0, 13.0, 20.0, 16.0, 13.0, 13.0, 9.0, 8.0, 6.0, 6.0, 7.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3506801724433899, -0.34051117300987244, -0.330342173576355, -0.3201731741428375, -0.31000417470932007, -0.2998351752758026, -0.28966617584228516, -0.2794971466064453, -0.26932817697525024, -0.2591591775417328, -0.24899017810821533, -0.23882117867469788, -0.22865217924118042, -0.21848317980766296, -0.20831416547298431, -0.19814516603946686, -0.1879761517047882, -0.17780715227127075, -0.1676381528377533, -0.15746915340423584, -0.14730015397071838, -0.13713115453720093, -0.12696214020252228, -0.11679314076900482, -0.10662414133548737, -0.09645514190196991, -0.08628614246845245, -0.0761171355843544, -0.06594813615083694, -0.05577913671731949, -0.045610133558511734, -0.03544113039970398, -0.025272130966186523, -0.015103129670023918, -0.004934128373861313, 0.005234872922301292, 0.015403874218463898, 0.025572873651981354, 0.03574187681078911, 0.04591087996959686, 0.05607987940311432, 0.06624887883663177, 0.07641787827014923, 0.08658688515424728, 0.09675588458776474, 0.1069248840212822, 0.11709389090538025, 0.1272628903388977, 0.13743188977241516, 0.14760088920593262, 0.15776988863945007, 0.16793888807296753, 0.17810788750648499, 0.18827688694000244, 0.1984459012746811, 0.20861490070819855, 0.218783900141716, 0.22895289957523346, 0.23912189900875092, 0.24929089844226837, 0.259459912776947, 0.2696289122104645, 0.27979791164398193, 0.2899669110774994, 0.30013591051101685]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 13.0, 5.0, 6.0, 11.0, 10.0, 6.0, 19.0, 21.0, 25.0, 29.0, 31.0, 40.0, 44.0, 51.0, 37.0, 50.0, 38.0, 51.0, 62.0, 45.0, 50.0, 40.0, 44.0, 35.0, 35.0, 29.0, 22.0, 32.0, 25.0, 19.0, 11.0, 10.0, 18.0, 5.0, 8.0, 5.0, 6.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.3671875, -10.0345458984375, -9.701904296875, -9.3692626953125, -9.03662109375, -8.7039794921875, -8.371337890625, -8.0386962890625, -7.7060546875, -7.3734130859375, -7.040771484375, -6.7081298828125, -6.37548828125, -6.0428466796875, -5.710205078125, -5.3775634765625, -5.044921875, -4.7122802734375, -4.379638671875, -4.0469970703125, -3.71435546875, -3.3817138671875, -3.049072265625, -2.7164306640625, -2.3837890625, -2.0511474609375, -1.718505859375, -1.3858642578125, -1.05322265625, -0.7205810546875, -0.387939453125, -0.0552978515625, 0.27734375, 0.6099853515625, 0.942626953125, 1.2752685546875, 1.60791015625, 1.9405517578125, 2.273193359375, 2.6058349609375, 2.9384765625, 3.2711181640625, 3.603759765625, 3.9364013671875, 4.26904296875, 4.6016845703125, 4.934326171875, 5.2669677734375, 5.599609375, 5.9322509765625, 6.264892578125, 6.5975341796875, 6.93017578125, 7.2628173828125, 7.595458984375, 7.9281005859375, 8.2607421875, 8.5933837890625, 8.926025390625, 9.2586669921875, 9.59130859375, 9.9239501953125, 10.256591796875, 10.5892333984375, 10.921875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 7.0, 11.0, 3.0, 11.0, 25.0, 28.0, 24.0, 63.0, 91.0, 150.0, 228.0, 406.0, 803.0, 1756.0, 5038.0, 17175.0, 70313.0, 368254.0, 471295.0, 82986.0, 20193.0, 5817.0, 1891.0, 851.0, 450.0, 224.0, 154.0, 93.0, 71.0, 43.0, 31.0, 15.0, 11.0, 10.0, 12.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.578125, -17.02978515625, -16.4814453125, -15.93310546875, -15.384765625, -14.83642578125, -14.2880859375, -13.73974609375, -13.19140625, -12.64306640625, -12.0947265625, -11.54638671875, -10.998046875, -10.44970703125, -9.9013671875, -9.35302734375, -8.8046875, -8.25634765625, -7.7080078125, -7.15966796875, -6.611328125, -6.06298828125, -5.5146484375, -4.96630859375, -4.41796875, -3.86962890625, -3.3212890625, -2.77294921875, -2.224609375, -1.67626953125, -1.1279296875, -0.57958984375, -0.03125, 0.51708984375, 1.0654296875, 1.61376953125, 2.162109375, 2.71044921875, 3.2587890625, 3.80712890625, 4.35546875, 4.90380859375, 5.4521484375, 6.00048828125, 6.548828125, 7.09716796875, 7.6455078125, 8.19384765625, 8.7421875, 9.29052734375, 9.8388671875, 10.38720703125, 10.935546875, 11.48388671875, 12.0322265625, 12.58056640625, 13.12890625, 13.67724609375, 14.2255859375, 14.77392578125, 15.322265625, 15.87060546875, 16.4189453125, 16.96728515625, 17.515625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 10.0, 10.0, 5.0, 9.0, 14.0, 18.0, 13.0, 16.0, 24.0, 28.0, 27.0, 32.0, 33.0, 49.0, 45.0, 62.0, 70.0, 109.0, 196.0, 1527.0, 194.0, 118.0, 68.0, 51.0, 40.0, 40.0, 24.0, 32.0, 28.0, 20.0, 28.0, 24.0, 9.0, 15.0, 18.0, 11.0, 3.0, 2.0, 7.0, 5.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.8125, -24.965576171875, -24.11865234375, -23.271728515625, -22.4248046875, -21.577880859375, -20.73095703125, -19.884033203125, -19.037109375, -18.190185546875, -17.34326171875, -16.496337890625, -15.6494140625, -14.802490234375, -13.95556640625, -13.108642578125, -12.26171875, -11.414794921875, -10.56787109375, -9.720947265625, -8.8740234375, -8.027099609375, -7.18017578125, -6.333251953125, -5.486328125, -4.639404296875, -3.79248046875, -2.945556640625, -2.0986328125, -1.251708984375, -0.40478515625, 0.442138671875, 1.2890625, 2.135986328125, 2.98291015625, 3.829833984375, 4.6767578125, 5.523681640625, 6.37060546875, 7.217529296875, 8.064453125, 8.911376953125, 9.75830078125, 10.605224609375, 11.4521484375, 12.299072265625, 13.14599609375, 13.992919921875, 14.83984375, 15.686767578125, 16.53369140625, 17.380615234375, 18.2275390625, 19.074462890625, 19.92138671875, 20.768310546875, 21.615234375, 22.462158203125, 23.30908203125, 24.156005859375, 25.0029296875, 25.849853515625, 26.69677734375, 27.543701171875, 28.390625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 5.0, 6.0, 6.0, 12.0, 14.0, 14.0, 16.0, 22.0, 24.0, 35.0, 42.0, 49.0, 66.0, 88.0, 145.0, 321.0, 629.0, 2242.0, 33011.0, 2961253.0, 141835.0, 3968.0, 851.0, 361.0, 193.0, 117.0, 85.0, 59.0, 38.0, 39.0, 35.0, 22.0, 16.0, 16.0, 10.0, 11.0, 6.0, 13.0, 7.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-68.8125, -66.767578125, -64.72265625, -62.677734375, -60.6328125, -58.587890625, -56.54296875, -54.498046875, -52.453125, -50.408203125, -48.36328125, -46.318359375, -44.2734375, -42.228515625, -40.18359375, -38.138671875, -36.09375, -34.048828125, -32.00390625, -29.958984375, -27.9140625, -25.869140625, -23.82421875, -21.779296875, -19.734375, -17.689453125, -15.64453125, -13.599609375, -11.5546875, -9.509765625, -7.46484375, -5.419921875, -3.375, -1.330078125, 0.71484375, 2.759765625, 4.8046875, 6.849609375, 8.89453125, 10.939453125, 12.984375, 15.029296875, 17.07421875, 19.119140625, 21.1640625, 23.208984375, 25.25390625, 27.298828125, 29.34375, 31.388671875, 33.43359375, 35.478515625, 37.5234375, 39.568359375, 41.61328125, 43.658203125, 45.703125, 47.748046875, 49.79296875, 51.837890625, 53.8828125, 55.927734375, 57.97265625, 60.017578125, 62.0625]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [314.0, 676.0, 28.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.072973251342773, -3.105311393737793, 9.862350463867188, 22.83001136779785, 35.79767608642578, 48.76533508300781, 61.732994079589844, 74.7006607055664, 87.66831970214844, 100.63597869873047, 113.60364532470703, 126.57130432128906, 139.53897094726562, 152.50662231445312, 165.4742889404297, 178.44195556640625, 191.4096221923828, 204.37728881835938, 217.34494018554688, 230.31260681152344, 243.2802734375, 256.2479248046875, 269.215576171875, 282.1832580566406, 295.1509094238281, 308.1185607910156, 321.08624267578125, 334.05389404296875, 347.02154541015625, 359.9892272949219, 372.9568786621094, 385.924560546875, 398.8921813964844, 411.8598327636719, 424.8275146484375, 437.795166015625, 450.7628173828125, 463.7304992675781, 476.6981506347656, 489.66583251953125, 502.63348388671875, 515.6011352539062, 528.5687866210938, 541.5364990234375, 554.504150390625, 567.4718017578125, 580.439453125, 593.4071044921875, 606.374755859375, 619.3424072265625, 632.31005859375, 645.2777099609375, 658.2454223632812, 671.2130737304688, 684.1807250976562, 697.1483764648438, 710.1160888671875, 723.083740234375, 736.0513916015625, 749.01904296875, 761.9867553710938, 774.9544067382812, 787.9220581054688, 800.8897094726562, 813.8573608398438]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 8.0, 9.0, 4.0, 4.0, 14.0, 20.0, 15.0, 11.0, 25.0, 20.0, 42.0, 22.0, 35.0, 25.0, 30.0, 43.0, 51.0, 40.0, 40.0, 47.0, 39.0, 53.0, 48.0, 38.0, 42.0, 26.0, 22.0, 25.0, 23.0, 21.0, 25.0, 15.0, 18.0, 13.0, 11.0, 9.0, 17.0, 8.0, 4.0, 10.0, 7.0, 2.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-79.46998596191406, -77.28299713134766, -75.09601593017578, -72.90902709960938, -70.7220458984375, -68.5350570678711, -66.34807586669922, -64.16108703613281, -61.97410583496094, -59.7871208190918, -57.600135803222656, -55.413150787353516, -53.226165771484375, -51.039180755615234, -48.852195739746094, -46.66520690917969, -44.47822189331055, -42.291236877441406, -40.104251861572266, -37.917266845703125, -35.730281829833984, -33.543296813964844, -31.35630989074707, -29.16932487487793, -26.98233985900879, -24.79535484313965, -22.608369827270508, -20.421382904052734, -18.234397888183594, -16.047412872314453, -13.860427856445312, -11.673442840576172, -9.486454010009766, -7.299468994140625, -5.112483501434326, -2.9254980087280273, -0.7385129928588867, 1.448472023010254, 3.635457992553711, 5.822443008422852, 8.009428024291992, 10.196413040161133, 12.383398056030273, 14.57038402557373, 16.757369995117188, 18.944355010986328, 21.13134002685547, 23.31832504272461, 25.50531005859375, 27.69229507446289, 29.87928009033203, 32.06626510620117, 34.25325012207031, 36.44023513793945, 38.627220153808594, 40.814208984375, 43.001190185546875, 45.188175201416016, 47.375160217285156, 49.5621452331543, 51.74913024902344, 53.93611526489258, 56.12310028076172, 58.310089111328125, 60.497074127197266]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 5.0, 6.0, 5.0, 10.0, 8.0, 10.0, 10.0, 16.0, 15.0, 22.0, 22.0, 31.0, 45.0, 43.0, 38.0, 33.0, 36.0, 43.0, 35.0, 41.0, 40.0, 40.0, 49.0, 49.0, 44.0, 37.0, 41.0, 28.0, 26.0, 26.0, 28.0, 21.0, 25.0, 8.0, 7.0, 14.0, 10.0, 10.0, 9.0, 2.0, 5.0, 2.0, 3.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.921875, -9.596923828125, -9.27197265625, -8.947021484375, -8.6220703125, -8.297119140625, -7.97216796875, -7.647216796875, -7.322265625, -6.997314453125, -6.67236328125, -6.347412109375, -6.0224609375, -5.697509765625, -5.37255859375, -5.047607421875, -4.72265625, -4.397705078125, -4.07275390625, -3.747802734375, -3.4228515625, -3.097900390625, -2.77294921875, -2.447998046875, -2.123046875, -1.798095703125, -1.47314453125, -1.148193359375, -0.8232421875, -0.498291015625, -0.17333984375, 0.151611328125, 0.4765625, 0.801513671875, 1.12646484375, 1.451416015625, 1.7763671875, 2.101318359375, 2.42626953125, 2.751220703125, 3.076171875, 3.401123046875, 3.72607421875, 4.051025390625, 4.3759765625, 4.700927734375, 5.02587890625, 5.350830078125, 5.67578125, 6.000732421875, 6.32568359375, 6.650634765625, 6.9755859375, 7.300537109375, 7.62548828125, 7.950439453125, 8.275390625, 8.600341796875, 8.92529296875, 9.250244140625, 9.5751953125, 9.900146484375, 10.22509765625, 10.550048828125, 10.875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 4.0, 9.0, 8.0, 11.0, 19.0, 30.0, 35.0, 38.0, 54.0, 57.0, 99.0, 148.0, 201.0, 331.0, 465.0, 733.0, 1344.0, 2169.0, 4175.0, 9154.0, 22808.0, 78390.0, 434879.0, 2062671.0, 1291541.0, 208317.0, 45828.0, 15620.0, 6867.0, 3328.0, 1875.0, 1065.0, 682.0, 395.0, 283.0, 179.0, 124.0, 93.0, 66.0, 51.0, 36.0, 35.0, 22.0, 15.0, 8.0, 8.0, 8.0, 7.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.34375, -16.719970703125, -16.09619140625, -15.472412109375, -14.8486328125, -14.224853515625, -13.60107421875, -12.977294921875, -12.353515625, -11.729736328125, -11.10595703125, -10.482177734375, -9.8583984375, -9.234619140625, -8.61083984375, -7.987060546875, -7.36328125, -6.739501953125, -6.11572265625, -5.491943359375, -4.8681640625, -4.244384765625, -3.62060546875, -2.996826171875, -2.373046875, -1.749267578125, -1.12548828125, -0.501708984375, 0.1220703125, 0.745849609375, 1.36962890625, 1.993408203125, 2.6171875, 3.240966796875, 3.86474609375, 4.488525390625, 5.1123046875, 5.736083984375, 6.35986328125, 6.983642578125, 7.607421875, 8.231201171875, 8.85498046875, 9.478759765625, 10.1025390625, 10.726318359375, 11.35009765625, 11.973876953125, 12.59765625, 13.221435546875, 13.84521484375, 14.468994140625, 15.0927734375, 15.716552734375, 16.34033203125, 16.964111328125, 17.587890625, 18.211669921875, 18.83544921875, 19.459228515625, 20.0830078125, 20.706787109375, 21.33056640625, 21.954345703125, 22.578125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 9.0, 14.0, 20.0, 31.0, 31.0, 44.0, 78.0, 95.0, 178.0, 259.0, 394.0, 594.0, 641.0, 531.0, 334.0, 253.0, 156.0, 130.0, 91.0, 57.0, 27.0, 23.0, 31.0, 14.0, 13.0, 5.0, 6.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.296875, -20.5703125, -19.84375, -19.1171875, -18.390625, -17.6640625, -16.9375, -16.2109375, -15.484375, -14.7578125, -14.03125, -13.3046875, -12.578125, -11.8515625, -11.125, -10.3984375, -9.671875, -8.9453125, -8.21875, -7.4921875, -6.765625, -6.0390625, -5.3125, -4.5859375, -3.859375, -3.1328125, -2.40625, -1.6796875, -0.953125, -0.2265625, 0.5, 1.2265625, 1.953125, 2.6796875, 3.40625, 4.1328125, 4.859375, 5.5859375, 6.3125, 7.0390625, 7.765625, 8.4921875, 9.21875, 9.9453125, 10.671875, 11.3984375, 12.125, 12.8515625, 13.578125, 14.3046875, 15.03125, 15.7578125, 16.484375, 17.2109375, 17.9375, 18.6640625, 19.390625, 20.1171875, 20.84375, 21.5703125, 22.296875, 23.0234375, 23.75, 24.4765625, 25.203125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 9.0, 9.0, 14.0, 20.0, 16.0, 22.0, 43.0, 59.0, 87.0, 164.0, 271.0, 586.0, 2133.0, 17828.0, 1101553.0, 3035342.0, 31532.0, 3182.0, 740.0, 280.0, 138.0, 82.0, 52.0, 42.0, 22.0, 19.0, 12.0, 10.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.25, -87.6787109375, -85.107421875, -82.5361328125, -79.96484375, -77.3935546875, -74.822265625, -72.2509765625, -69.6796875, -67.1083984375, -64.537109375, -61.9658203125, -59.39453125, -56.8232421875, -54.251953125, -51.6806640625, -49.109375, -46.5380859375, -43.966796875, -41.3955078125, -38.82421875, -36.2529296875, -33.681640625, -31.1103515625, -28.5390625, -25.9677734375, -23.396484375, -20.8251953125, -18.25390625, -15.6826171875, -13.111328125, -10.5400390625, -7.96875, -5.3974609375, -2.826171875, -0.2548828125, 2.31640625, 4.8876953125, 7.458984375, 10.0302734375, 12.6015625, 15.1728515625, 17.744140625, 20.3154296875, 22.88671875, 25.4580078125, 28.029296875, 30.6005859375, 33.171875, 35.7431640625, 38.314453125, 40.8857421875, 43.45703125, 46.0283203125, 48.599609375, 51.1708984375, 53.7421875, 56.3134765625, 58.884765625, 61.4560546875, 64.02734375, 66.5986328125, 69.169921875, 71.7412109375, 74.3125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 11.0, 36.0, 76.0, 160.0, 268.0, 260.0, 129.0, 46.0, 16.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-294.4894104003906, -287.7291564941406, -280.96893310546875, -274.20867919921875, -267.44842529296875, -260.68817138671875, -253.9279327392578, -247.16769409179688, -240.40744018554688, -233.64718627929688, -226.88694763183594, -220.126708984375, -213.366455078125, -206.606201171875, -199.84596252441406, -193.08572387695312, -186.32546997070312, -179.56521606445312, -172.8049774169922, -166.04473876953125, -159.28448486328125, -152.52423095703125, -145.7639923095703, -139.00375366210938, -132.24349975585938, -125.4832534790039, -118.72300720214844, -111.96276092529297, -105.2025146484375, -98.44226837158203, -91.68202209472656, -84.9217758178711, -78.16154479980469, -71.40129852294922, -64.64105224609375, -57.88080596923828, -51.12055969238281, -44.360313415527344, -37.600067138671875, -30.839820861816406, -24.079574584960938, -17.31932830810547, -10.55908203125, -3.7988357543945312, 2.9614105224609375, 9.721656799316406, 16.481903076171875, 23.242149353027344, 30.002395629882812, 36.76264190673828, 43.52288818359375, 50.28313446044922, 57.04338073730469, 63.803627014160156, 70.56387329101562, 77.3241195678711, 84.08436584472656, 90.84461212158203, 97.6048583984375, 104.36510467529297, 111.12535095214844, 117.8855972290039, 124.64584350585938, 131.40609741210938, 138.1663360595703]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 3.0, 5.0, 7.0, 6.0, 7.0, 8.0, 17.0, 19.0, 16.0, 29.0, 24.0, 26.0, 36.0, 35.0, 24.0, 36.0, 51.0, 37.0, 38.0, 53.0, 46.0, 47.0, 49.0, 39.0, 43.0, 34.0, 41.0, 37.0, 36.0, 28.0, 26.0, 16.0, 23.0, 15.0, 11.0, 11.0, 8.0, 6.0, 5.0, 5.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.77525329589844, -69.49578857421875, -67.21632385253906, -64.93685913085938, -62.65739059448242, -60.377925872802734, -58.09845733642578, -55.818992614746094, -53.539527893066406, -51.26006317138672, -48.98059844970703, -46.70112991333008, -44.42166519165039, -42.1422004699707, -39.86273193359375, -37.58326721191406, -35.303802490234375, -33.02433776855469, -30.744871139526367, -28.465404510498047, -26.18593978881836, -23.906475067138672, -21.62700843811035, -19.34754180908203, -17.068077087402344, -14.78861141204834, -12.509145736694336, -10.229680061340332, -7.950214385986328, -5.670748710632324, -3.3912830352783203, -1.1118173599243164, 1.1676406860351562, 3.44710636138916, 5.726572036743164, 8.006037712097168, 10.285503387451172, 12.564969062805176, 14.84443473815918, 17.1239013671875, 19.403366088867188, 21.682830810546875, 23.962297439575195, 26.241764068603516, 28.521228790283203, 30.80069351196289, 33.080162048339844, 35.35962677001953, 37.63909149169922, 39.918556213378906, 42.198020935058594, 44.47748947143555, 46.756954193115234, 49.03641891479492, 51.315887451171875, 53.59535217285156, 55.87481689453125, 58.15428161621094, 60.433746337890625, 62.71321487426758, 64.99267578125, 67.27214813232422, 69.5516128540039, 71.8310775756836, 74.11054229736328]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 12.0, 5.0, 7.0, 11.0, 8.0, 17.0, 19.0, 36.0, 29.0, 32.0, 27.0, 43.0, 37.0, 37.0, 46.0, 53.0, 43.0, 54.0, 55.0, 50.0, 37.0, 42.0, 45.0, 27.0, 34.0, 27.0, 27.0, 20.0, 17.0, 16.0, 18.0, 12.0, 14.0, 2.0, 8.0, 11.0, 4.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0703125, -9.7401123046875, -9.409912109375, -9.0797119140625, -8.74951171875, -8.4193115234375, -8.089111328125, -7.7589111328125, -7.4287109375, -7.0985107421875, -6.768310546875, -6.4381103515625, -6.10791015625, -5.7777099609375, -5.447509765625, -5.1173095703125, -4.787109375, -4.4569091796875, -4.126708984375, -3.7965087890625, -3.46630859375, -3.1361083984375, -2.805908203125, -2.4757080078125, -2.1455078125, -1.8153076171875, -1.485107421875, -1.1549072265625, -0.82470703125, -0.4945068359375, -0.164306640625, 0.1658935546875, 0.49609375, 0.8262939453125, 1.156494140625, 1.4866943359375, 1.81689453125, 2.1470947265625, 2.477294921875, 2.8074951171875, 3.1376953125, 3.4678955078125, 3.798095703125, 4.1282958984375, 4.45849609375, 4.7886962890625, 5.118896484375, 5.4490966796875, 5.779296875, 6.1094970703125, 6.439697265625, 6.7698974609375, 7.10009765625, 7.4302978515625, 7.760498046875, 8.0906982421875, 8.4208984375, 8.7510986328125, 9.081298828125, 9.4114990234375, 9.74169921875, 10.0718994140625, 10.402099609375, 10.7322998046875, 11.0625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 4.0, 8.0, 11.0, 18.0, 27.0, 39.0, 75.0, 107.0, 154.0, 235.0, 357.0, 556.0, 830.0, 1279.0, 1955.0, 3077.0, 4758.0, 7493.0, 11534.0, 19209.0, 32398.0, 56959.0, 103772.0, 185598.0, 242630.0, 162172.0, 89497.0, 49067.0, 28638.0, 17010.0, 10334.0, 6569.0, 4344.0, 2744.0, 1761.0, 1150.0, 745.0, 500.0, 308.0, 236.0, 137.0, 83.0, 67.0, 48.0, 15.0, 15.0, 12.0, 9.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.3408203125, -1.299407958984375, -1.25799560546875, -1.216583251953125, -1.1751708984375, -1.133758544921875, -1.09234619140625, -1.050933837890625, -1.009521484375, -0.968109130859375, -0.92669677734375, -0.885284423828125, -0.8438720703125, -0.802459716796875, -0.76104736328125, -0.719635009765625, -0.67822265625, -0.636810302734375, -0.59539794921875, -0.553985595703125, -0.5125732421875, -0.471160888671875, -0.42974853515625, -0.388336181640625, -0.346923828125, -0.305511474609375, -0.26409912109375, -0.222686767578125, -0.1812744140625, -0.139862060546875, -0.09844970703125, -0.057037353515625, -0.015625, 0.025787353515625, 0.06719970703125, 0.108612060546875, 0.1500244140625, 0.191436767578125, 0.23284912109375, 0.274261474609375, 0.315673828125, 0.357086181640625, 0.39849853515625, 0.439910888671875, 0.4813232421875, 0.522735595703125, 0.56414794921875, 0.605560302734375, 0.64697265625, 0.688385009765625, 0.72979736328125, 0.771209716796875, 0.8126220703125, 0.854034423828125, 0.89544677734375, 0.936859130859375, 0.978271484375, 1.019683837890625, 1.06109619140625, 1.102508544921875, 1.1439208984375, 1.185333251953125, 1.22674560546875, 1.268157958984375, 1.3095703125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 7.0, 5.0, 14.0, 5.0, 12.0, 14.0, 9.0, 12.0, 15.0, 14.0, 33.0, 24.0, 28.0, 35.0, 30.0, 31.0, 40.0, 41.0, 36.0, 32.0, 47.0, 1061.0, 39.0, 44.0, 37.0, 37.0, 33.0, 23.0, 23.0, 20.0, 22.0, 21.0, 23.0, 19.0, 22.0, 19.0, 18.0, 14.0, 12.0, 8.0, 10.0, 12.0, 7.0, 3.0, 2.0, 1.0, 7.0, 2.0, 3.0, 2.0], "bins": [-6.45703125, -6.273681640625, -6.09033203125, -5.906982421875, -5.7236328125, -5.540283203125, -5.35693359375, -5.173583984375, -4.990234375, -4.806884765625, -4.62353515625, -4.440185546875, -4.2568359375, -4.073486328125, -3.89013671875, -3.706787109375, -3.5234375, -3.340087890625, -3.15673828125, -2.973388671875, -2.7900390625, -2.606689453125, -2.42333984375, -2.239990234375, -2.056640625, -1.873291015625, -1.68994140625, -1.506591796875, -1.3232421875, -1.139892578125, -0.95654296875, -0.773193359375, -0.58984375, -0.406494140625, -0.22314453125, -0.039794921875, 0.1435546875, 0.326904296875, 0.51025390625, 0.693603515625, 0.876953125, 1.060302734375, 1.24365234375, 1.427001953125, 1.6103515625, 1.793701171875, 1.97705078125, 2.160400390625, 2.34375, 2.527099609375, 2.71044921875, 2.893798828125, 3.0771484375, 3.260498046875, 3.44384765625, 3.627197265625, 3.810546875, 3.993896484375, 4.17724609375, 4.360595703125, 4.5439453125, 4.727294921875, 4.91064453125, 5.093994140625, 5.27734375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 5.0, 7.0, 11.0, 14.0, 30.0, 34.0, 63.0, 94.0, 138.0, 191.0, 275.0, 354.0, 603.0, 834.0, 1203.0, 1760.0, 2670.0, 3870.0, 5670.0, 8662.0, 12724.0, 19382.0, 29212.0, 45574.0, 72935.0, 117420.0, 266904.0, 1144568.0, 132226.0, 81705.0, 51188.0, 32720.0, 21045.0, 13928.0, 9453.0, 6352.0, 4302.0, 2914.0, 2031.0, 1272.0, 846.0, 595.0, 461.0, 310.0, 185.0, 144.0, 89.0, 51.0, 41.0, 20.0, 22.0, 16.0, 6.0, 4.0, 3.0, 4.0, 3.0], "bins": [-0.52392578125, -0.5085716247558594, -0.49321746826171875, -0.4778633117675781, -0.4625091552734375, -0.4471549987792969, -0.43180084228515625, -0.4164466857910156, -0.401092529296875, -0.3857383728027344, -0.37038421630859375, -0.3550300598144531, -0.3396759033203125, -0.3243217468261719, -0.30896759033203125, -0.2936134338378906, -0.27825927734375, -0.2629051208496094, -0.24755096435546875, -0.23219680786132812, -0.2168426513671875, -0.20148849487304688, -0.18613433837890625, -0.17078018188476562, -0.155426025390625, -0.14007186889648438, -0.12471771240234375, -0.10936355590820312, -0.0940093994140625, -0.07865524291992188, -0.06330108642578125, -0.047946929931640625, -0.0325927734375, -0.017238616943359375, -0.00188446044921875, 0.013469696044921875, 0.0288238525390625, 0.044178009033203125, 0.05953216552734375, 0.07488632202148438, 0.090240478515625, 0.10559463500976562, 0.12094879150390625, 0.13630294799804688, 0.1516571044921875, 0.16701126098632812, 0.18236541748046875, 0.19771957397460938, 0.21307373046875, 0.22842788696289062, 0.24378204345703125, 0.2591361999511719, 0.2744903564453125, 0.2898445129394531, 0.30519866943359375, 0.3205528259277344, 0.335906982421875, 0.3512611389160156, 0.36661529541015625, 0.3819694519042969, 0.3973236083984375, 0.4126777648925781, 0.42803192138671875, 0.4433860778808594, 0.458740234375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 1.0, 3.0, 3.0, 5.0, 8.0, 13.0, 13.0, 11.0, 9.0, 24.0, 14.0, 26.0, 32.0, 41.0, 42.0, 79.0, 277.0, 105.0, 74.0, 37.0, 25.0, 33.0, 21.0, 19.0, 9.0, 8.0, 12.0, 9.0, 9.0, 5.0, 11.0, 1.0, 2.0, 1.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.07940673828125, -0.07704448699951172, -0.07468223571777344, -0.07231998443603516, -0.06995773315429688, -0.0675954818725586, -0.06523323059082031, -0.06287097930908203, -0.06050872802734375, -0.05814647674560547, -0.05578422546386719, -0.053421974182128906, -0.051059722900390625, -0.048697471618652344, -0.04633522033691406, -0.04397296905517578, -0.0416107177734375, -0.03924846649169922, -0.03688621520996094, -0.034523963928222656, -0.032161712646484375, -0.029799461364746094, -0.027437210083007812, -0.02507495880126953, -0.02271270751953125, -0.02035045623779297, -0.017988204956054688, -0.015625953674316406, -0.013263702392578125, -0.010901451110839844, -0.008539199829101562, -0.006176948547363281, -0.003814697265625, -0.0014524459838867188, 0.0009098052978515625, 0.0032720565795898438, 0.005634307861328125, 0.007996559143066406, 0.010358810424804688, 0.012721061706542969, 0.01508331298828125, 0.01744556427001953, 0.019807815551757812, 0.022170066833496094, 0.024532318115234375, 0.026894569396972656, 0.029256820678710938, 0.03161907196044922, 0.0339813232421875, 0.03634357452392578, 0.03870582580566406, 0.041068077087402344, 0.043430328369140625, 0.045792579650878906, 0.04815483093261719, 0.05051708221435547, 0.05287933349609375, 0.05524158477783203, 0.05760383605957031, 0.059966087341308594, 0.062328338623046875, 0.06469058990478516, 0.06705284118652344, 0.06941509246826172, 0.07177734375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 9.0, 8.0, 9.0, 15.0, 8.0, 21.0, 19.0, 40.0, 78.0, 109.0, 210.0, 961.0, 233955.0, 811245.0, 1263.0, 222.0, 113.0, 74.0, 50.0, 25.0, 18.0, 14.0, 15.0, 13.0, 11.0, 3.0, 5.0, 7.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.91015625, -1.85235595703125, -1.7945556640625, -1.73675537109375, -1.678955078125, -1.62115478515625, -1.5633544921875, -1.50555419921875, -1.44775390625, -1.38995361328125, -1.3321533203125, -1.27435302734375, -1.216552734375, -1.15875244140625, -1.1009521484375, -1.04315185546875, -0.9853515625, -0.92755126953125, -0.8697509765625, -0.81195068359375, -0.754150390625, -0.69635009765625, -0.6385498046875, -0.58074951171875, -0.52294921875, -0.46514892578125, -0.4073486328125, -0.34954833984375, -0.291748046875, -0.23394775390625, -0.1761474609375, -0.11834716796875, -0.060546875, -0.00274658203125, 0.0550537109375, 0.11285400390625, 0.170654296875, 0.22845458984375, 0.2862548828125, 0.34405517578125, 0.40185546875, 0.45965576171875, 0.5174560546875, 0.57525634765625, 0.633056640625, 0.69085693359375, 0.7486572265625, 0.80645751953125, 0.8642578125, 0.92205810546875, 0.9798583984375, 1.03765869140625, 1.095458984375, 1.15325927734375, 1.2110595703125, 1.26885986328125, 1.32666015625, 1.38446044921875, 1.4422607421875, 1.50006103515625, 1.557861328125, 1.61566162109375, 1.6734619140625, 1.73126220703125, 1.7890625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 12.0, 28.0, 39.0, 157.0, 394.0, 224.0, 86.0, 42.0, 14.0, 8.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42340564727783203, -0.4086211025714874, -0.39383652806282043, -0.37905198335647583, -0.3642674386501312, -0.3494828939437866, -0.33469831943511963, -0.319913774728775, -0.3051292300224304, -0.2903446853160858, -0.2755601108074188, -0.2607755661010742, -0.24599102139472961, -0.23120646178722382, -0.21642190217971802, -0.2016373574733734, -0.18685279786586761, -0.17206823825836182, -0.1572836935520172, -0.1424991339445114, -0.1277145892381668, -0.11293002963066101, -0.09814547747373581, -0.08336092531681061, -0.0685763731598854, -0.053791821002960205, -0.039007268846035004, -0.024222712963819504, -0.009438160806894302, 0.0053463950753211975, 0.0201309472322464, 0.0349154993891716, 0.0497000515460968, 0.064484603703022, 0.0792691558599472, 0.094053715467453, 0.10883826017379761, 0.1236228197813034, 0.1384073793888092, 0.1531919240951538, 0.1679764688014984, 0.1827610284090042, 0.19754557311534882, 0.21233013272285461, 0.22711467742919922, 0.24189923703670502, 0.2566837966442108, 0.2714683413505554, 0.2862529158592224, 0.301037460565567, 0.315822035074234, 0.3306065797805786, 0.3453911244869232, 0.3601756691932678, 0.3749602437019348, 0.3897447884082794, 0.404529333114624, 0.41931387782096863, 0.4340984523296356, 0.4488829970359802, 0.46366754174232483, 0.47845208644866943, 0.4932366609573364, 0.5080212354660034, 0.5228057503700256]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 7.0, 3.0, 6.0, 7.0, 6.0, 12.0, 8.0, 5.0, 7.0, 12.0, 16.0, 12.0, 16.0, 20.0, 23.0, 16.0, 33.0, 21.0, 22.0, 33.0, 37.0, 36.0, 39.0, 42.0, 32.0, 40.0, 25.0, 39.0, 38.0, 40.0, 44.0, 33.0, 33.0, 26.0, 20.0, 20.0, 15.0, 26.0, 19.0, 18.0, 14.0, 16.0, 14.0, 15.0, 7.0, 14.0, 2.0, 9.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11607164144515991, -0.11205572634935379, -0.10803981125354767, -0.10402388870716095, -0.10000797361135483, -0.0959920585155487, -0.09197613596916199, -0.08796022087335587, -0.08394430577754974, -0.07992839068174362, -0.0759124755859375, -0.07189655303955078, -0.06788063794374466, -0.06386472284793854, -0.05984880402684212, -0.0558328852057457, -0.051816970109939575, -0.04780105501413345, -0.04378513619303703, -0.03976921737194061, -0.03575330227613449, -0.03173738718032837, -0.02772146835923195, -0.023705551400780678, -0.019689634442329407, -0.015673717483878136, -0.011657800525426865, -0.007641883566975594, -0.0036259666085243225, 0.00038995034992694855, 0.00440586730837822, 0.00842178426682949, 0.012437701225280762, 0.016453618183732033, 0.020469535142183304, 0.024485452100634575, 0.028501369059085846, 0.03251728415489197, 0.03653320297598839, 0.04054912179708481, 0.04456503689289093, 0.04858095198869705, 0.05259687080979347, 0.05661278963088989, 0.060628704726696014, 0.06464461982250214, 0.06866054236888885, 0.07267645746469498, 0.0766923725605011, 0.08070828765630722, 0.08472420275211334, 0.08874012529850006, 0.09275604039430618, 0.0967719554901123, 0.10078787803649902, 0.10480379313230515, 0.10881970822811127, 0.11283562332391739, 0.11685153841972351, 0.12086746096611023, 0.12488337606191635, 0.12889929115772247, 0.1329152137041092, 0.13693112134933472, 0.14094704389572144]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 12.0, 5.0, 7.0, 11.0, 8.0, 16.0, 20.0, 35.0, 30.0, 32.0, 26.0, 44.0, 36.0, 38.0, 46.0, 51.0, 45.0, 54.0, 55.0, 48.0, 39.0, 42.0, 44.0, 28.0, 33.0, 27.0, 26.0, 21.0, 18.0, 16.0, 17.0, 13.0, 12.0, 4.0, 8.0, 10.0, 5.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0703125, -9.740234375, -9.41015625, -9.080078125, -8.75, -8.419921875, -8.08984375, -7.759765625, -7.4296875, -7.099609375, -6.76953125, -6.439453125, -6.109375, -5.779296875, -5.44921875, -5.119140625, -4.7890625, -4.458984375, -4.12890625, -3.798828125, -3.46875, -3.138671875, -2.80859375, -2.478515625, -2.1484375, -1.818359375, -1.48828125, -1.158203125, -0.828125, -0.498046875, -0.16796875, 0.162109375, 0.4921875, 0.822265625, 1.15234375, 1.482421875, 1.8125, 2.142578125, 2.47265625, 2.802734375, 3.1328125, 3.462890625, 3.79296875, 4.123046875, 4.453125, 4.783203125, 5.11328125, 5.443359375, 5.7734375, 6.103515625, 6.43359375, 6.763671875, 7.09375, 7.423828125, 7.75390625, 8.083984375, 8.4140625, 8.744140625, 9.07421875, 9.404296875, 9.734375, 10.064453125, 10.39453125, 10.724609375, 11.0546875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 9.0, 7.0, 15.0, 12.0, 16.0, 19.0, 40.0, 66.0, 102.0, 157.0, 274.0, 387.0, 716.0, 1168.0, 2156.0, 3960.0, 7185.0, 14186.0, 27716.0, 56594.0, 125656.0, 303426.0, 282340.0, 115265.0, 52310.0, 26168.0, 13097.0, 6908.0, 3726.0, 2004.0, 1098.0, 668.0, 387.0, 259.0, 145.0, 90.0, 71.0, 52.0, 20.0, 25.0, 16.0, 16.0, 6.0, 7.0, 5.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-11.015625, -10.691162109375, -10.36669921875, -10.042236328125, -9.7177734375, -9.393310546875, -9.06884765625, -8.744384765625, -8.419921875, -8.095458984375, -7.77099609375, -7.446533203125, -7.1220703125, -6.797607421875, -6.47314453125, -6.148681640625, -5.82421875, -5.499755859375, -5.17529296875, -4.850830078125, -4.5263671875, -4.201904296875, -3.87744140625, -3.552978515625, -3.228515625, -2.904052734375, -2.57958984375, -2.255126953125, -1.9306640625, -1.606201171875, -1.28173828125, -0.957275390625, -0.6328125, -0.308349609375, 0.01611328125, 0.340576171875, 0.6650390625, 0.989501953125, 1.31396484375, 1.638427734375, 1.962890625, 2.287353515625, 2.61181640625, 2.936279296875, 3.2607421875, 3.585205078125, 3.90966796875, 4.234130859375, 4.55859375, 4.883056640625, 5.20751953125, 5.531982421875, 5.8564453125, 6.180908203125, 6.50537109375, 6.829833984375, 7.154296875, 7.478759765625, 7.80322265625, 8.127685546875, 8.4521484375, 8.776611328125, 9.10107421875, 9.425537109375, 9.75]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 1.0, 2.0, 7.0, 5.0, 11.0, 18.0, 16.0, 21.0, 11.0, 19.0, 26.0, 21.0, 26.0, 26.0, 35.0, 38.0, 46.0, 53.0, 71.0, 89.0, 197.0, 1406.0, 282.0, 115.0, 69.0, 61.0, 54.0, 40.0, 47.0, 40.0, 27.0, 29.0, 17.0, 24.0, 20.0, 14.0, 20.0, 10.0, 7.0, 6.0, 7.0, 4.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.515625, -24.686279296875, -23.85693359375, -23.027587890625, -22.1982421875, -21.368896484375, -20.53955078125, -19.710205078125, -18.880859375, -18.051513671875, -17.22216796875, -16.392822265625, -15.5634765625, -14.734130859375, -13.90478515625, -13.075439453125, -12.24609375, -11.416748046875, -10.58740234375, -9.758056640625, -8.9287109375, -8.099365234375, -7.27001953125, -6.440673828125, -5.611328125, -4.781982421875, -3.95263671875, -3.123291015625, -2.2939453125, -1.464599609375, -0.63525390625, 0.194091796875, 1.0234375, 1.852783203125, 2.68212890625, 3.511474609375, 4.3408203125, 5.170166015625, 5.99951171875, 6.828857421875, 7.658203125, 8.487548828125, 9.31689453125, 10.146240234375, 10.9755859375, 11.804931640625, 12.63427734375, 13.463623046875, 14.29296875, 15.122314453125, 15.95166015625, 16.781005859375, 17.6103515625, 18.439697265625, 19.26904296875, 20.098388671875, 20.927734375, 21.757080078125, 22.58642578125, 23.415771484375, 24.2451171875, 25.074462890625, 25.90380859375, 26.733154296875, 27.5625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 4.0, 5.0, 12.0, 9.0, 14.0, 11.0, 15.0, 33.0, 29.0, 47.0, 50.0, 62.0, 90.0, 125.0, 190.0, 295.0, 588.0, 1322.0, 4921.0, 35379.0, 829135.0, 2199224.0, 63565.0, 7178.0, 1672.0, 617.0, 346.0, 195.0, 133.0, 103.0, 72.0, 66.0, 42.0, 26.0, 24.0, 26.0, 20.0, 16.0, 8.0, 12.0, 7.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.0625, -40.82958984375, -39.5966796875, -38.36376953125, -37.130859375, -35.89794921875, -34.6650390625, -33.43212890625, -32.19921875, -30.96630859375, -29.7333984375, -28.50048828125, -27.267578125, -26.03466796875, -24.8017578125, -23.56884765625, -22.3359375, -21.10302734375, -19.8701171875, -18.63720703125, -17.404296875, -16.17138671875, -14.9384765625, -13.70556640625, -12.47265625, -11.23974609375, -10.0068359375, -8.77392578125, -7.541015625, -6.30810546875, -5.0751953125, -3.84228515625, -2.609375, -1.37646484375, -0.1435546875, 1.08935546875, 2.322265625, 3.55517578125, 4.7880859375, 6.02099609375, 7.25390625, 8.48681640625, 9.7197265625, 10.95263671875, 12.185546875, 13.41845703125, 14.6513671875, 15.88427734375, 17.1171875, 18.35009765625, 19.5830078125, 20.81591796875, 22.048828125, 23.28173828125, 24.5146484375, 25.74755859375, 26.98046875, 28.21337890625, 29.4462890625, 30.67919921875, 31.912109375, 33.14501953125, 34.3779296875, 35.61083984375, 36.84375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 233.0, 750.0, 31.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.6969985961914, -75.49006652832031, -61.283138275146484, -47.076210021972656, -32.86927795410156, -18.66234588623047, -4.455421447753906, 9.751510620117188, 23.95844268798828, 38.165374755859375, 52.3723030090332, 66.57923126220703, 80.78616333007812, 94.99309539794922, 109.20001983642578, 123.40695190429688, 137.6138916015625, 151.82081604003906, 166.0277557373047, 180.23468017578125, 194.44161987304688, 208.64854431152344, 222.85546875, 237.06240844726562, 251.26931762695312, 265.47625732421875, 279.68316650390625, 293.8901062011719, 308.0970458984375, 322.303955078125, 336.5108947753906, 350.71783447265625, 364.92474365234375, 379.1316833496094, 393.3385925292969, 407.5455322265625, 421.7524719238281, 435.95941162109375, 450.16632080078125, 464.3732604980469, 478.5802001953125, 492.7871398925781, 506.9940490722656, 521.2009887695312, 535.4078979492188, 549.6148681640625, 563.82177734375, 578.0286865234375, 592.235595703125, 606.4425048828125, 620.6494750976562, 634.8563842773438, 649.0632934570312, 663.270263671875, 677.4771728515625, 691.68408203125, 705.8910522460938, 720.0979614257812, 734.304931640625, 748.5118408203125, 762.71875, 776.9257202148438, 791.1326293945312, 805.3395385742188, 819.5465087890625]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 6.0, 8.0, 4.0, 5.0, 8.0, 9.0, 9.0, 11.0, 16.0, 14.0, 17.0, 24.0, 23.0, 34.0, 27.0, 35.0, 29.0, 49.0, 41.0, 34.0, 37.0, 49.0, 55.0, 53.0, 51.0, 42.0, 26.0, 30.0, 37.0, 28.0, 26.0, 28.0, 23.0, 18.0, 15.0, 12.0, 15.0, 12.0, 15.0, 8.0, 4.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-85.1396484375, -82.82827758789062, -80.51690673828125, -78.2055435180664, -75.89417266845703, -73.58280181884766, -71.27143859863281, -68.96006774902344, -66.64869689941406, -64.33732604980469, -62.02595901489258, -59.71459197998047, -57.403221130371094, -55.09185028076172, -52.78048324584961, -50.4691162109375, -48.157745361328125, -45.84637451171875, -43.53500747680664, -41.22364044189453, -38.912269592285156, -36.60089874267578, -34.28953170776367, -31.97816276550293, -29.666793823242188, -27.355424880981445, -25.044055938720703, -22.73268699645996, -20.42131805419922, -18.109949111938477, -15.798580169677734, -13.487211227416992, -11.17584228515625, -8.864473342895508, -6.553104400634766, -4.241735458374023, -1.9303665161132812, 0.38100242614746094, 2.692371368408203, 5.003740310668945, 7.3151092529296875, 9.62647819519043, 11.937847137451172, 14.249216079711914, 16.560585021972656, 18.8719539642334, 21.18332290649414, 23.494691848754883, 25.806060791015625, 28.117429733276367, 30.42879867553711, 32.74016571044922, 35.051536560058594, 37.36290740966797, 39.67427444458008, 41.98564147949219, 44.29701232910156, 46.60838317871094, 48.91975021362305, 51.231117248535156, 53.54248809814453, 55.853858947753906, 58.165225982666016, 60.476593017578125, 62.7879638671875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 4.0, 6.0, 5.0, 11.0, 9.0, 11.0, 17.0, 19.0, 22.0, 26.0, 41.0, 33.0, 47.0, 34.0, 47.0, 45.0, 47.0, 49.0, 49.0, 46.0, 43.0, 40.0, 48.0, 36.0, 38.0, 34.0, 30.0, 20.0, 26.0, 21.0, 18.0, 16.0, 10.0, 6.0, 10.0, 9.0, 10.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.265625, -9.9200439453125, -9.574462890625, -9.2288818359375, -8.88330078125, -8.5377197265625, -8.192138671875, -7.8465576171875, -7.5009765625, -7.1553955078125, -6.809814453125, -6.4642333984375, -6.11865234375, -5.7730712890625, -5.427490234375, -5.0819091796875, -4.736328125, -4.3907470703125, -4.045166015625, -3.6995849609375, -3.35400390625, -3.0084228515625, -2.662841796875, -2.3172607421875, -1.9716796875, -1.6260986328125, -1.280517578125, -0.9349365234375, -0.58935546875, -0.2437744140625, 0.101806640625, 0.4473876953125, 0.79296875, 1.1385498046875, 1.484130859375, 1.8297119140625, 2.17529296875, 2.5208740234375, 2.866455078125, 3.2120361328125, 3.5576171875, 3.9031982421875, 4.248779296875, 4.5943603515625, 4.93994140625, 5.2855224609375, 5.631103515625, 5.9766845703125, 6.322265625, 6.6678466796875, 7.013427734375, 7.3590087890625, 7.70458984375, 8.0501708984375, 8.395751953125, 8.7413330078125, 9.0869140625, 9.4324951171875, 9.778076171875, 10.1236572265625, 10.46923828125, 10.8148193359375, 11.160400390625, 11.5059814453125, 11.8515625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 11.0, 12.0, 19.0, 23.0, 29.0, 58.0, 55.0, 106.0, 174.0, 296.0, 447.0, 837.0, 1403.0, 2532.0, 5227.0, 11761.0, 34074.0, 205853.0, 2468379.0, 1317400.0, 103420.0, 23752.0, 9277.0, 4233.0, 2185.0, 1103.0, 614.0, 358.0, 229.0, 133.0, 97.0, 45.0, 39.0, 19.0, 18.0, 16.0, 17.0, 9.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-28.203125, -27.344482421875, -26.48583984375, -25.627197265625, -24.7685546875, -23.909912109375, -23.05126953125, -22.192626953125, -21.333984375, -20.475341796875, -19.61669921875, -18.758056640625, -17.8994140625, -17.040771484375, -16.18212890625, -15.323486328125, -14.46484375, -13.606201171875, -12.74755859375, -11.888916015625, -11.0302734375, -10.171630859375, -9.31298828125, -8.454345703125, -7.595703125, -6.737060546875, -5.87841796875, -5.019775390625, -4.1611328125, -3.302490234375, -2.44384765625, -1.585205078125, -0.7265625, 0.132080078125, 0.99072265625, 1.849365234375, 2.7080078125, 3.566650390625, 4.42529296875, 5.283935546875, 6.142578125, 7.001220703125, 7.85986328125, 8.718505859375, 9.5771484375, 10.435791015625, 11.29443359375, 12.153076171875, 13.01171875, 13.870361328125, 14.72900390625, 15.587646484375, 16.4462890625, 17.304931640625, 18.16357421875, 19.022216796875, 19.880859375, 20.739501953125, 21.59814453125, 22.456787109375, 23.3154296875, 24.174072265625, 25.03271484375, 25.891357421875, 26.75]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 8.0, 9.0, 10.0, 12.0, 18.0, 20.0, 33.0, 48.0, 65.0, 85.0, 149.0, 201.0, 388.0, 523.0, 732.0, 564.0, 370.0, 266.0, 156.0, 130.0, 86.0, 56.0, 43.0, 25.0, 21.0, 14.0, 10.0, 11.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.34375, -19.6787109375, -19.013671875, -18.3486328125, -17.68359375, -17.0185546875, -16.353515625, -15.6884765625, -15.0234375, -14.3583984375, -13.693359375, -13.0283203125, -12.36328125, -11.6982421875, -11.033203125, -10.3681640625, -9.703125, -9.0380859375, -8.373046875, -7.7080078125, -7.04296875, -6.3779296875, -5.712890625, -5.0478515625, -4.3828125, -3.7177734375, -3.052734375, -2.3876953125, -1.72265625, -1.0576171875, -0.392578125, 0.2724609375, 0.9375, 1.6025390625, 2.267578125, 2.9326171875, 3.59765625, 4.2626953125, 4.927734375, 5.5927734375, 6.2578125, 6.9228515625, 7.587890625, 8.2529296875, 8.91796875, 9.5830078125, 10.248046875, 10.9130859375, 11.578125, 12.2431640625, 12.908203125, 13.5732421875, 14.23828125, 14.9033203125, 15.568359375, 16.2333984375, 16.8984375, 17.5634765625, 18.228515625, 18.8935546875, 19.55859375, 20.2236328125, 20.888671875, 21.5537109375, 22.21875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 12.0, 7.0, 9.0, 15.0, 32.0, 40.0, 65.0, 101.0, 183.0, 284.0, 614.0, 1558.0, 6273.0, 44772.0, 2374826.0, 1718984.0, 38201.0, 5580.0, 1514.0, 519.0, 281.0, 147.0, 89.0, 50.0, 31.0, 26.0, 20.0, 15.0, 11.0, 6.0, 2.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-70.375, -68.240234375, -66.10546875, -63.970703125, -61.8359375, -59.701171875, -57.56640625, -55.431640625, -53.296875, -51.162109375, -49.02734375, -46.892578125, -44.7578125, -42.623046875, -40.48828125, -38.353515625, -36.21875, -34.083984375, -31.94921875, -29.814453125, -27.6796875, -25.544921875, -23.41015625, -21.275390625, -19.140625, -17.005859375, -14.87109375, -12.736328125, -10.6015625, -8.466796875, -6.33203125, -4.197265625, -2.0625, 0.072265625, 2.20703125, 4.341796875, 6.4765625, 8.611328125, 10.74609375, 12.880859375, 15.015625, 17.150390625, 19.28515625, 21.419921875, 23.5546875, 25.689453125, 27.82421875, 29.958984375, 32.09375, 34.228515625, 36.36328125, 38.498046875, 40.6328125, 42.767578125, 44.90234375, 47.037109375, 49.171875, 51.306640625, 53.44140625, 55.576171875, 57.7109375, 59.845703125, 61.98046875, 64.115234375, 66.25]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 9.0, 26.0, 62.0, 134.0, 202.0, 237.0, 166.0, 101.0, 53.0, 18.0, 6.0, 1.0, 1.0, 0.0, 2.0], "bins": [-302.11712646484375, -296.54266357421875, -290.9681701660156, -285.3937072753906, -279.8192443847656, -274.2447509765625, -268.6702880859375, -263.0958251953125, -257.5213317871094, -251.9468536376953, -246.3723907470703, -240.79791259765625, -235.2234344482422, -229.6489715576172, -224.07449340820312, -218.50003051757812, -212.92556762695312, -207.35108947753906, -201.77662658691406, -196.2021484375, -190.62767028808594, -185.05320739746094, -179.47872924804688, -173.90426635742188, -168.32977294921875, -162.7552947998047, -157.1808319091797, -151.60635375976562, -146.03187561035156, -140.45741271972656, -134.8829345703125, -129.3084716796875, -123.73399353027344, -118.1595230102539, -112.58504486083984, -107.01057434082031, -101.43610382080078, -95.86163330078125, -90.28715515136719, -84.71268463134766, -79.13821411132812, -73.5637435913086, -67.98926544189453, -62.414794921875, -56.84032440185547, -51.26585006713867, -45.691375732421875, -40.116905212402344, -34.54242706298828, -28.967954635620117, -23.393482208251953, -17.819007873535156, -12.244535446166992, -6.670063018798828, -1.0955886840820312, 4.4788818359375, 10.053356170654297, 15.627828598022461, 21.202301025390625, 26.776775360107422, 32.35124969482422, 37.92572021484375, 43.50019454956055, 49.07466506958008, 54.649139404296875]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 8.0, 7.0, 5.0, 10.0, 23.0, 15.0, 15.0, 25.0, 21.0, 24.0, 21.0, 30.0, 21.0, 40.0, 41.0, 39.0, 29.0, 40.0, 39.0, 58.0, 30.0, 37.0, 33.0, 39.0, 35.0, 30.0, 48.0, 31.0, 35.0, 29.0, 20.0, 17.0, 15.0, 14.0, 7.0, 12.0, 10.0, 6.0, 13.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-53.73297882080078, -52.03872299194336, -50.34446334838867, -48.65020751953125, -46.95594787597656, -45.26169204711914, -43.56743621826172, -41.87317657470703, -40.17892074584961, -38.48466491699219, -36.7904052734375, -35.09614944458008, -33.40188980102539, -31.70763397216797, -30.013376235961914, -28.31911849975586, -26.624860763549805, -24.93060302734375, -23.236345291137695, -21.54208755493164, -19.84783172607422, -18.153573989868164, -16.45931625366211, -14.765059471130371, -13.070801734924316, -11.376543998718262, -9.682287216186523, -7.988029479980469, -6.293772220611572, -4.599514961242676, -2.905257225036621, -1.2110004425048828, 0.4832572937011719, 2.1775145530700684, 3.871772050857544, 5.5660295486450195, 7.260286808013916, 8.954544067382812, 10.648801803588867, 12.343058586120605, 14.03731632232666, 15.731574058532715, 17.425830841064453, 19.120088577270508, 20.814346313476562, 22.508602142333984, 24.202861785888672, 25.897117614746094, 27.59137535095215, 29.285633087158203, 30.979890823364258, 32.67414855957031, 34.368404388427734, 36.062660217285156, 37.756919860839844, 39.451175689697266, 41.14543533325195, 42.839691162109375, 44.53395080566406, 46.228206634521484, 47.92246627807617, 49.616722106933594, 51.31098175048828, 53.0052375793457, 54.699493408203125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 2.0, 5.0, 2.0, 7.0, 6.0, 8.0, 8.0, 11.0, 20.0, 15.0, 23.0, 36.0, 38.0, 32.0, 37.0, 30.0, 49.0, 48.0, 41.0, 34.0, 43.0, 48.0, 43.0, 50.0, 39.0, 39.0, 33.0, 45.0, 32.0, 23.0, 33.0, 18.0, 17.0, 11.0, 18.0, 9.0, 10.0, 9.0, 10.0, 5.0, 8.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3515625, -10.007568359375, -9.66357421875, -9.319580078125, -8.9755859375, -8.631591796875, -8.28759765625, -7.943603515625, -7.599609375, -7.255615234375, -6.91162109375, -6.567626953125, -6.2236328125, -5.879638671875, -5.53564453125, -5.191650390625, -4.84765625, -4.503662109375, -4.15966796875, -3.815673828125, -3.4716796875, -3.127685546875, -2.78369140625, -2.439697265625, -2.095703125, -1.751708984375, -1.40771484375, -1.063720703125, -0.7197265625, -0.375732421875, -0.03173828125, 0.312255859375, 0.65625, 1.000244140625, 1.34423828125, 1.688232421875, 2.0322265625, 2.376220703125, 2.72021484375, 3.064208984375, 3.408203125, 3.752197265625, 4.09619140625, 4.440185546875, 4.7841796875, 5.128173828125, 5.47216796875, 5.816162109375, 6.16015625, 6.504150390625, 6.84814453125, 7.192138671875, 7.5361328125, 7.880126953125, 8.22412109375, 8.568115234375, 8.912109375, 9.256103515625, 9.60009765625, 9.944091796875, 10.2880859375, 10.632080078125, 10.97607421875, 11.320068359375, 11.6640625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 5.0, 9.0, 13.0, 15.0, 42.0, 59.0, 74.0, 138.0, 198.0, 306.0, 523.0, 744.0, 1381.0, 2260.0, 3879.0, 6645.0, 11851.0, 21639.0, 40271.0, 78787.0, 156452.0, 268054.0, 216997.0, 112964.0, 57193.0, 30124.0, 16176.0, 9027.0, 5067.0, 3068.0, 1800.0, 1104.0, 624.0, 401.0, 235.0, 146.0, 107.0, 71.0, 36.0, 19.0, 18.0, 15.0, 3.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-1.7998046875, -1.7480316162109375, -1.696258544921875, -1.6444854736328125, -1.59271240234375, -1.5409393310546875, -1.489166259765625, -1.4373931884765625, -1.3856201171875, -1.3338470458984375, -1.282073974609375, -1.2303009033203125, -1.17852783203125, -1.1267547607421875, -1.074981689453125, -1.0232086181640625, -0.971435546875, -0.9196624755859375, -0.867889404296875, -0.8161163330078125, -0.76434326171875, -0.7125701904296875, -0.660797119140625, -0.6090240478515625, -0.5572509765625, -0.5054779052734375, -0.453704833984375, -0.4019317626953125, -0.35015869140625, -0.2983856201171875, -0.246612548828125, -0.1948394775390625, -0.14306640625, -0.0912933349609375, -0.039520263671875, 0.0122528076171875, 0.06402587890625, 0.1157989501953125, 0.167572021484375, 0.2193450927734375, 0.2711181640625, 0.3228912353515625, 0.374664306640625, 0.4264373779296875, 0.47821044921875, 0.5299835205078125, 0.581756591796875, 0.6335296630859375, 0.685302734375, 0.7370758056640625, 0.788848876953125, 0.8406219482421875, 0.89239501953125, 0.9441680908203125, 0.995941162109375, 1.0477142333984375, 1.0994873046875, 1.1512603759765625, 1.203033447265625, 1.2548065185546875, 1.30657958984375, 1.3583526611328125, 1.410125732421875, 1.4618988037109375, 1.513671875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 3.0, 7.0, 8.0, 10.0, 13.0, 12.0, 21.0, 24.0, 29.0, 24.0, 28.0, 31.0, 41.0, 36.0, 43.0, 42.0, 41.0, 37.0, 1072.0, 51.0, 47.0, 46.0, 45.0, 44.0, 39.0, 38.0, 22.0, 29.0, 23.0, 23.0, 23.0, 19.0, 20.0, 6.0, 6.0, 5.0, 5.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0], "bins": [-8.5703125, -8.3492431640625, -8.128173828125, -7.9071044921875, -7.68603515625, -7.4649658203125, -7.243896484375, -7.0228271484375, -6.8017578125, -6.5806884765625, -6.359619140625, -6.1385498046875, -5.91748046875, -5.6964111328125, -5.475341796875, -5.2542724609375, -5.033203125, -4.8121337890625, -4.591064453125, -4.3699951171875, -4.14892578125, -3.9278564453125, -3.706787109375, -3.4857177734375, -3.2646484375, -3.0435791015625, -2.822509765625, -2.6014404296875, -2.38037109375, -2.1593017578125, -1.938232421875, -1.7171630859375, -1.49609375, -1.2750244140625, -1.053955078125, -0.8328857421875, -0.61181640625, -0.3907470703125, -0.169677734375, 0.0513916015625, 0.2724609375, 0.4935302734375, 0.714599609375, 0.9356689453125, 1.15673828125, 1.3778076171875, 1.598876953125, 1.8199462890625, 2.041015625, 2.2620849609375, 2.483154296875, 2.7042236328125, 2.92529296875, 3.1463623046875, 3.367431640625, 3.5885009765625, 3.8095703125, 4.0306396484375, 4.251708984375, 4.4727783203125, 4.69384765625, 4.9149169921875, 5.135986328125, 5.3570556640625, 5.578125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 9.0, 10.0, 12.0, 24.0, 23.0, 49.0, 78.0, 120.0, 182.0, 285.0, 396.0, 605.0, 979.0, 1510.0, 2268.0, 3605.0, 5612.0, 8933.0, 14644.0, 24475.0, 41054.0, 71419.0, 123357.0, 279157.0, 1177236.0, 141214.0, 80973.0, 46700.0, 27522.0, 16727.0, 10186.0, 6373.0, 4116.0, 2551.0, 1613.0, 1057.0, 697.0, 472.0, 313.0, 206.0, 124.0, 73.0, 60.0, 37.0, 26.0, 21.0, 8.0, 6.0, 8.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5703125, -0.5519866943359375, -0.533660888671875, -0.5153350830078125, -0.49700927734375, -0.4786834716796875, -0.460357666015625, -0.4420318603515625, -0.4237060546875, -0.4053802490234375, -0.387054443359375, -0.3687286376953125, -0.35040283203125, -0.3320770263671875, -0.313751220703125, -0.2954254150390625, -0.277099609375, -0.2587738037109375, -0.240447998046875, -0.2221221923828125, -0.20379638671875, -0.1854705810546875, -0.167144775390625, -0.1488189697265625, -0.1304931640625, -0.1121673583984375, -0.093841552734375, -0.0755157470703125, -0.05718994140625, -0.0388641357421875, -0.020538330078125, -0.0022125244140625, 0.01611328125, 0.0344390869140625, 0.052764892578125, 0.0710906982421875, 0.08941650390625, 0.1077423095703125, 0.126068115234375, 0.1443939208984375, 0.1627197265625, 0.1810455322265625, 0.199371337890625, 0.2176971435546875, 0.23602294921875, 0.2543487548828125, 0.272674560546875, 0.2910003662109375, 0.309326171875, 0.3276519775390625, 0.345977783203125, 0.3643035888671875, 0.38262939453125, 0.4009552001953125, 0.419281005859375, 0.4376068115234375, 0.4559326171875, 0.4742584228515625, 0.492584228515625, 0.5109100341796875, 0.52923583984375, 0.5475616455078125, 0.565887451171875, 0.5842132568359375, 0.6025390625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 4.0, 6.0, 5.0, 6.0, 10.0, 12.0, 12.0, 20.0, 34.0, 34.0, 45.0, 57.0, 81.0, 171.0, 176.0, 89.0, 54.0, 43.0, 23.0, 19.0, 19.0, 10.0, 15.0, 11.0, 9.0, 6.0, 4.0, 2.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0726318359375, -0.07012653350830078, -0.06762123107910156, -0.06511592864990234, -0.06261062622070312, -0.060105323791503906, -0.05760002136230469, -0.05509471893310547, -0.05258941650390625, -0.05008411407470703, -0.04757881164550781, -0.045073509216308594, -0.042568206787109375, -0.040062904357910156, -0.03755760192871094, -0.03505229949951172, -0.0325469970703125, -0.03004169464111328, -0.027536392211914062, -0.025031089782714844, -0.022525787353515625, -0.020020484924316406, -0.017515182495117188, -0.015009880065917969, -0.01250457763671875, -0.009999275207519531, -0.0074939727783203125, -0.004988670349121094, -0.002483367919921875, 2.193450927734375e-05, 0.0025272369384765625, 0.005032539367675781, 0.007537841796875, 0.010043144226074219, 0.012548446655273438, 0.015053749084472656, 0.017559051513671875, 0.020064353942871094, 0.022569656372070312, 0.02507495880126953, 0.02758026123046875, 0.03008556365966797, 0.03259086608886719, 0.035096168518066406, 0.037601470947265625, 0.040106773376464844, 0.04261207580566406, 0.04511737823486328, 0.0476226806640625, 0.05012798309326172, 0.05263328552246094, 0.055138587951660156, 0.057643890380859375, 0.060149192810058594, 0.06265449523925781, 0.06515979766845703, 0.06766510009765625, 0.07017040252685547, 0.07267570495605469, 0.0751810073852539, 0.07768630981445312, 0.08019161224365234, 0.08269691467285156, 0.08520221710205078, 0.08770751953125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 3.0, 9.0, 4.0, 9.0, 10.0, 20.0, 16.0, 22.0, 37.0, 44.0, 97.0, 275.0, 1311.0, 669432.0, 375449.0, 1227.0, 264.0, 100.0, 72.0, 43.0, 25.0, 16.0, 16.0, 10.0, 10.0, 3.0, 6.0, 3.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.08984375, -2.0301055908203125, -1.970367431640625, -1.9106292724609375, -1.85089111328125, -1.7911529541015625, -1.731414794921875, -1.6716766357421875, -1.6119384765625, -1.5522003173828125, -1.492462158203125, -1.4327239990234375, -1.37298583984375, -1.3132476806640625, -1.253509521484375, -1.1937713623046875, -1.134033203125, -1.0742950439453125, -1.014556884765625, -0.9548187255859375, -0.89508056640625, -0.8353424072265625, -0.775604248046875, -0.7158660888671875, -0.6561279296875, -0.5963897705078125, -0.536651611328125, -0.4769134521484375, -0.41717529296875, -0.3574371337890625, -0.297698974609375, -0.2379608154296875, -0.17822265625, -0.1184844970703125, -0.058746337890625, 0.0009918212890625, 0.06072998046875, 0.1204681396484375, 0.180206298828125, 0.2399444580078125, 0.2996826171875, 0.3594207763671875, 0.419158935546875, 0.4788970947265625, 0.53863525390625, 0.5983734130859375, 0.658111572265625, 0.7178497314453125, 0.777587890625, 0.8373260498046875, 0.897064208984375, 0.9568023681640625, 1.01654052734375, 1.0762786865234375, 1.136016845703125, 1.1957550048828125, 1.2554931640625, 1.3152313232421875, 1.374969482421875, 1.4347076416015625, 1.49444580078125, 1.5541839599609375, 1.613922119140625, 1.6736602783203125, 1.7333984375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 6.0, 15.0, 16.0, 30.0, 50.0, 118.0, 218.0, 244.0, 140.0, 76.0, 28.0, 20.0, 19.0, 11.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.41359221935272217, -0.40500080585479736, -0.39640936255455017, -0.38781794905662537, -0.3792265057563782, -0.37063509225845337, -0.36204367876052856, -0.35345223546028137, -0.34486082196235657, -0.33626940846443176, -0.32767796516418457, -0.31908655166625977, -0.3104951083660126, -0.30190369486808777, -0.2933122515678406, -0.28472083806991577, -0.27612942457199097, -0.26753801107406616, -0.25894656777381897, -0.25035515427589417, -0.24176372587680817, -0.23317229747772217, -0.22458086907863617, -0.21598944067955017, -0.20739799737930298, -0.19880656898021698, -0.19021514058113098, -0.18162372708320618, -0.17303229868412018, -0.16444087028503418, -0.15584944188594818, -0.14725801348686218, -0.13866659998893738, -0.13007517158985138, -0.12148375064134598, -0.11289232224225998, -0.10430090129375458, -0.09570947289466858, -0.08711804449558258, -0.07852661609649658, -0.06993519514799118, -0.06134377047419548, -0.05275234580039978, -0.04416091740131378, -0.03556949272751808, -0.02697806805372238, -0.018386639654636383, -0.009795214980840683, -0.001203790307044983, 0.007387635298073292, 0.015979060903191566, 0.024570487439632416, 0.033161912113428116, 0.041753336787223816, 0.050344765186309814, 0.058936189860105515, 0.06752761453390121, 0.07611904293298721, 0.08471046388149261, 0.09330189228057861, 0.10189332067966461, 0.11048474162817001, 0.11907617002725601, 0.1276675909757614, 0.1362590193748474]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 10.0, 12.0, 12.0, 9.0, 17.0, 16.0, 19.0, 31.0, 24.0, 33.0, 42.0, 27.0, 43.0, 39.0, 36.0, 41.0, 47.0, 43.0, 35.0, 42.0, 39.0, 45.0, 29.0, 39.0, 36.0, 40.0, 36.0, 23.0, 27.0, 22.0, 12.0, 14.0, 8.0, 15.0, 4.0, 9.0, 1.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04847234487533569, -0.04685968533158302, -0.04524702578783035, -0.043634362518787384, -0.042021702975034714, -0.04040904343128204, -0.038796380162239075, -0.037183720618486404, -0.035571061074733734, -0.033958401530981064, -0.032345741987228394, -0.030733078718185425, -0.029120419174432755, -0.027507759630680084, -0.025895098224282265, -0.024282436817884445, -0.022669777274131775, -0.021057117730379105, -0.019444456323981285, -0.017831794917583466, -0.016219135373830795, -0.01460647489875555, -0.012993814423680305, -0.01138115394860506, -0.009768493473529816, -0.00815583299845457, -0.006543172523379326, -0.004930512048304081, -0.003317851573228836, -0.0017051910981535912, -9.253062307834625e-05, 0.0015201298519968987, 0.0031327903270721436, 0.0047454508021473885, 0.006358111277222633, 0.007970771752297878, 0.009583432227373123, 0.011196092702448368, 0.012808753177523613, 0.014421413652598858, 0.016034074127674103, 0.017646733671426773, 0.019259395077824593, 0.020872056484222412, 0.022484716027975082, 0.024097375571727753, 0.025710036978125572, 0.02732269838452339, 0.028935357928276062, 0.030548017472028732, 0.0321606770157814, 0.03377334028482437, 0.03538599982857704, 0.03699865937232971, 0.03861132264137268, 0.04022398218512535, 0.04183664172887802, 0.04344930127263069, 0.04506196081638336, 0.04667462408542633, 0.048287283629179, 0.04989994317293167, 0.05151260644197464, 0.05312526598572731, 0.05473792552947998]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 2.0, 5.0, 2.0, 7.0, 6.0, 8.0, 9.0, 10.0, 20.0, 15.0, 23.0, 36.0, 38.0, 32.0, 37.0, 30.0, 49.0, 48.0, 40.0, 35.0, 43.0, 47.0, 44.0, 50.0, 38.0, 40.0, 33.0, 46.0, 31.0, 23.0, 33.0, 18.0, 17.0, 11.0, 18.0, 9.0, 10.0, 9.0, 10.0, 5.0, 8.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3515625, -10.007568359375, -9.66357421875, -9.319580078125, -8.9755859375, -8.631591796875, -8.28759765625, -7.943603515625, -7.599609375, -7.255615234375, -6.91162109375, -6.567626953125, -6.2236328125, -5.879638671875, -5.53564453125, -5.191650390625, -4.84765625, -4.503662109375, -4.15966796875, -3.815673828125, -3.4716796875, -3.127685546875, -2.78369140625, -2.439697265625, -2.095703125, -1.751708984375, -1.40771484375, -1.063720703125, -0.7197265625, -0.375732421875, -0.03173828125, 0.312255859375, 0.65625, 1.000244140625, 1.34423828125, 1.688232421875, 2.0322265625, 2.376220703125, 2.72021484375, 3.064208984375, 3.408203125, 3.752197265625, 4.09619140625, 4.440185546875, 4.7841796875, 5.128173828125, 5.47216796875, 5.816162109375, 6.16015625, 6.504150390625, 6.84814453125, 7.192138671875, 7.5361328125, 7.880126953125, 8.22412109375, 8.568115234375, 8.912109375, 9.256103515625, 9.60009765625, 9.944091796875, 10.2880859375, 10.632080078125, 10.97607421875, 11.320068359375, 11.6640625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 0.0, 4.0, 3.0, 8.0, 6.0, 6.0, 18.0, 28.0, 33.0, 47.0, 48.0, 85.0, 127.0, 211.0, 359.0, 718.0, 1743.0, 4553.0, 12624.0, 39029.0, 218856.0, 625656.0, 104870.0, 25259.0, 8477.0, 3194.0, 1230.0, 556.0, 271.0, 177.0, 97.0, 64.0, 47.0, 36.0, 24.0, 27.0, 13.0, 8.0, 9.0, 12.0, 10.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.234375, -17.652099609375, -17.06982421875, -16.487548828125, -15.9052734375, -15.322998046875, -14.74072265625, -14.158447265625, -13.576171875, -12.993896484375, -12.41162109375, -11.829345703125, -11.2470703125, -10.664794921875, -10.08251953125, -9.500244140625, -8.91796875, -8.335693359375, -7.75341796875, -7.171142578125, -6.5888671875, -6.006591796875, -5.42431640625, -4.842041015625, -4.259765625, -3.677490234375, -3.09521484375, -2.512939453125, -1.9306640625, -1.348388671875, -0.76611328125, -0.183837890625, 0.3984375, 0.980712890625, 1.56298828125, 2.145263671875, 2.7275390625, 3.309814453125, 3.89208984375, 4.474365234375, 5.056640625, 5.638916015625, 6.22119140625, 6.803466796875, 7.3857421875, 7.968017578125, 8.55029296875, 9.132568359375, 9.71484375, 10.297119140625, 10.87939453125, 11.461669921875, 12.0439453125, 12.626220703125, 13.20849609375, 13.790771484375, 14.373046875, 14.955322265625, 15.53759765625, 16.119873046875, 16.7021484375, 17.284423828125, 17.86669921875, 18.448974609375, 19.03125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 8.0, 6.0, 10.0, 11.0, 16.0, 23.0, 15.0, 22.0, 34.0, 37.0, 52.0, 48.0, 57.0, 68.0, 102.0, 250.0, 1640.0, 178.0, 77.0, 47.0, 50.0, 44.0, 40.0, 41.0, 35.0, 20.0, 25.0, 24.0, 13.0, 17.0, 7.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.375, -36.2861328125, -35.197265625, -34.1083984375, -33.01953125, -31.9306640625, -30.841796875, -29.7529296875, -28.6640625, -27.5751953125, -26.486328125, -25.3974609375, -24.30859375, -23.2197265625, -22.130859375, -21.0419921875, -19.953125, -18.8642578125, -17.775390625, -16.6865234375, -15.59765625, -14.5087890625, -13.419921875, -12.3310546875, -11.2421875, -10.1533203125, -9.064453125, -7.9755859375, -6.88671875, -5.7978515625, -4.708984375, -3.6201171875, -2.53125, -1.4423828125, -0.353515625, 0.7353515625, 1.82421875, 2.9130859375, 4.001953125, 5.0908203125, 6.1796875, 7.2685546875, 8.357421875, 9.4462890625, 10.53515625, 11.6240234375, 12.712890625, 13.8017578125, 14.890625, 15.9794921875, 17.068359375, 18.1572265625, 19.24609375, 20.3349609375, 21.423828125, 22.5126953125, 23.6015625, 24.6904296875, 25.779296875, 26.8681640625, 27.95703125, 29.0458984375, 30.134765625, 31.2236328125, 32.3125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 6.0, 4.0, 8.0, 8.0, 18.0, 15.0, 26.0, 19.0, 35.0, 51.0, 66.0, 75.0, 101.0, 156.0, 280.0, 752.0, 7606.0, 2558736.0, 572288.0, 4070.0, 604.0, 246.0, 145.0, 117.0, 79.0, 42.0, 34.0, 24.0, 20.0, 24.0, 14.0, 8.0, 7.0, 8.0, 6.0, 3.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.5, -60.41015625, -58.3203125, -56.23046875, -54.140625, -52.05078125, -49.9609375, -47.87109375, -45.78125, -43.69140625, -41.6015625, -39.51171875, -37.421875, -35.33203125, -33.2421875, -31.15234375, -29.0625, -26.97265625, -24.8828125, -22.79296875, -20.703125, -18.61328125, -16.5234375, -14.43359375, -12.34375, -10.25390625, -8.1640625, -6.07421875, -3.984375, -1.89453125, 0.1953125, 2.28515625, 4.375, 6.46484375, 8.5546875, 10.64453125, 12.734375, 14.82421875, 16.9140625, 19.00390625, 21.09375, 23.18359375, 25.2734375, 27.36328125, 29.453125, 31.54296875, 33.6328125, 35.72265625, 37.8125, 39.90234375, 41.9921875, 44.08203125, 46.171875, 48.26171875, 50.3515625, 52.44140625, 54.53125, 56.62109375, 58.7109375, 60.80078125, 62.890625, 64.98046875, 67.0703125, 69.16015625, 71.25]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 10.0, 19.0, 37.0, 74.0, 101.0, 171.0, 174.0, 157.0, 127.0, 80.0, 38.0, 16.0, 7.0, 2.0, 2.0, 1.0, 1.0], "bins": [-87.00146484375, -85.37763214111328, -83.75379943847656, -82.12996673583984, -80.50613403320312, -78.8823013305664, -77.25846862792969, -75.63463592529297, -74.01080322265625, -72.38697052001953, -70.76313781738281, -69.1393051147461, -67.51547241210938, -65.89163970947266, -64.26780700683594, -62.64397430419922, -61.020145416259766, -59.39631271362305, -57.77248001098633, -56.14864730834961, -54.52481460571289, -52.90098190307617, -51.27715301513672, -49.6533203125, -48.02948760986328, -46.40565490722656, -44.781822204589844, -43.157989501953125, -41.534156799316406, -39.91032409667969, -38.28649139404297, -36.66265869140625, -35.03882598876953, -33.41499328613281, -31.791160583496094, -30.167327880859375, -28.543495178222656, -26.919662475585938, -25.29583168029785, -23.671998977661133, -22.048168182373047, -20.424335479736328, -18.80050277709961, -17.17667007446289, -15.552838325500488, -13.92900562286377, -12.305173873901367, -10.681341171264648, -9.05750846862793, -7.433675765991211, -5.80984354019165, -4.18601131439209, -2.562178611755371, -0.9383459091186523, 0.68548583984375, 2.3093185424804688, 3.9331512451171875, 5.556983947753906, 7.180816173553467, 8.804648399353027, 10.428481101989746, 12.052313804626465, 13.676145553588867, 15.299978256225586, 16.923810958862305]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 1.0, 7.0, 4.0, 7.0, 15.0, 9.0, 14.0, 20.0, 27.0, 22.0, 21.0, 36.0, 32.0, 44.0, 44.0, 35.0, 39.0, 51.0, 42.0, 52.0, 50.0, 48.0, 41.0, 33.0, 31.0, 49.0, 26.0, 32.0, 24.0, 25.0, 22.0, 20.0, 17.0, 13.0, 11.0, 12.0, 7.0, 6.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-85.67095184326172, -83.22492218017578, -80.77889251708984, -78.3328628540039, -75.88683319091797, -73.44080352783203, -70.9947738647461, -68.54875183105469, -66.10272216796875, -63.65669250488281, -61.210662841796875, -58.76463317871094, -56.318603515625, -53.87257385253906, -51.42654800415039, -48.98051834106445, -46.53448486328125, -44.08845520019531, -41.642425537109375, -39.19639587402344, -36.7503662109375, -34.30433654785156, -31.85831069946289, -29.412281036376953, -26.966251373291016, -24.520221710205078, -22.07419204711914, -19.628164291381836, -17.1821346282959, -14.736104965209961, -12.29007625579834, -9.844047546386719, -7.3980255126953125, -4.951996326446533, -2.505967140197754, -0.05993795394897461, 2.3860912322998047, 4.832120895385742, 7.278149604797363, 9.724178314208984, 12.170207977294922, 14.61623764038086, 17.062267303466797, 19.5082950592041, 21.95432472229004, 24.400354385375977, 26.84638214111328, 29.29241180419922, 31.738441467285156, 34.184471130371094, 36.63050079345703, 39.07653045654297, 41.522560119628906, 43.968589782714844, 46.414615631103516, 48.86064529418945, 51.30667495727539, 53.75270462036133, 56.198734283447266, 58.6447639465332, 61.090789794921875, 63.53681945800781, 65.98284912109375, 68.42887878417969, 70.87490844726562]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 1.0, 9.0, 6.0, 7.0, 15.0, 15.0, 13.0, 24.0, 28.0, 23.0, 40.0, 38.0, 37.0, 40.0, 47.0, 45.0, 37.0, 44.0, 45.0, 50.0, 45.0, 50.0, 35.0, 33.0, 37.0, 45.0, 24.0, 29.0, 24.0, 20.0, 14.0, 11.0, 13.0, 10.0, 10.0, 9.0, 8.0, 7.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.921142578125, -9.56103515625, -9.200927734375, -8.8408203125, -8.480712890625, -8.12060546875, -7.760498046875, -7.400390625, -7.040283203125, -6.68017578125, -6.320068359375, -5.9599609375, -5.599853515625, -5.23974609375, -4.879638671875, -4.51953125, -4.159423828125, -3.79931640625, -3.439208984375, -3.0791015625, -2.718994140625, -2.35888671875, -1.998779296875, -1.638671875, -1.278564453125, -0.91845703125, -0.558349609375, -0.1982421875, 0.161865234375, 0.52197265625, 0.882080078125, 1.2421875, 1.602294921875, 1.96240234375, 2.322509765625, 2.6826171875, 3.042724609375, 3.40283203125, 3.762939453125, 4.123046875, 4.483154296875, 4.84326171875, 5.203369140625, 5.5634765625, 5.923583984375, 6.28369140625, 6.643798828125, 7.00390625, 7.364013671875, 7.72412109375, 8.084228515625, 8.4443359375, 8.804443359375, 9.16455078125, 9.524658203125, 9.884765625, 10.244873046875, 10.60498046875, 10.965087890625, 11.3251953125, 11.685302734375, 12.04541015625, 12.405517578125, 12.765625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 4.0, 11.0, 13.0, 23.0, 21.0, 36.0, 43.0, 69.0, 77.0, 123.0, 158.0, 235.0, 337.0, 538.0, 894.0, 1392.0, 2472.0, 4430.0, 9010.0, 21658.0, 68412.0, 422355.0, 2514122.0, 969261.0, 121580.0, 31329.0, 12231.0, 5858.0, 2988.0, 1739.0, 980.0, 586.0, 365.0, 287.0, 173.0, 133.0, 85.0, 56.0, 60.0, 46.0, 23.0, 15.0, 13.0, 12.0, 4.0, 4.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.59375, -22.84912109375, -22.1044921875, -21.35986328125, -20.615234375, -19.87060546875, -19.1259765625, -18.38134765625, -17.63671875, -16.89208984375, -16.1474609375, -15.40283203125, -14.658203125, -13.91357421875, -13.1689453125, -12.42431640625, -11.6796875, -10.93505859375, -10.1904296875, -9.44580078125, -8.701171875, -7.95654296875, -7.2119140625, -6.46728515625, -5.72265625, -4.97802734375, -4.2333984375, -3.48876953125, -2.744140625, -1.99951171875, -1.2548828125, -0.51025390625, 0.234375, 0.97900390625, 1.7236328125, 2.46826171875, 3.212890625, 3.95751953125, 4.7021484375, 5.44677734375, 6.19140625, 6.93603515625, 7.6806640625, 8.42529296875, 9.169921875, 9.91455078125, 10.6591796875, 11.40380859375, 12.1484375, 12.89306640625, 13.6376953125, 14.38232421875, 15.126953125, 15.87158203125, 16.6162109375, 17.36083984375, 18.10546875, 18.85009765625, 19.5947265625, 20.33935546875, 21.083984375, 21.82861328125, 22.5732421875, 23.31787109375, 24.0625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 3.0, 7.0, 19.0, 15.0, 19.0, 28.0, 36.0, 62.0, 71.0, 133.0, 162.0, 257.0, 383.0, 616.0, 641.0, 505.0, 368.0, 222.0, 175.0, 103.0, 57.0, 57.0, 43.0, 37.0, 9.0, 21.0, 10.0, 5.0, 5.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.5625, -19.86181640625, -19.1611328125, -18.46044921875, -17.759765625, -17.05908203125, -16.3583984375, -15.65771484375, -14.95703125, -14.25634765625, -13.5556640625, -12.85498046875, -12.154296875, -11.45361328125, -10.7529296875, -10.05224609375, -9.3515625, -8.65087890625, -7.9501953125, -7.24951171875, -6.548828125, -5.84814453125, -5.1474609375, -4.44677734375, -3.74609375, -3.04541015625, -2.3447265625, -1.64404296875, -0.943359375, -0.24267578125, 0.4580078125, 1.15869140625, 1.859375, 2.56005859375, 3.2607421875, 3.96142578125, 4.662109375, 5.36279296875, 6.0634765625, 6.76416015625, 7.46484375, 8.16552734375, 8.8662109375, 9.56689453125, 10.267578125, 10.96826171875, 11.6689453125, 12.36962890625, 13.0703125, 13.77099609375, 14.4716796875, 15.17236328125, 15.873046875, 16.57373046875, 17.2744140625, 17.97509765625, 18.67578125, 19.37646484375, 20.0771484375, 20.77783203125, 21.478515625, 22.17919921875, 22.8798828125, 23.58056640625, 24.28125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 8.0, 18.0, 16.0, 27.0, 35.0, 62.0, 109.0, 181.0, 330.0, 804.0, 2254.0, 8438.0, 51495.0, 934284.0, 3059076.0, 116380.0, 15119.0, 3452.0, 1115.0, 514.0, 226.0, 132.0, 77.0, 43.0, 35.0, 23.0, 10.0, 8.0, 5.0, 0.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.65625, -52.9033203125, -51.150390625, -49.3974609375, -47.64453125, -45.8916015625, -44.138671875, -42.3857421875, -40.6328125, -38.8798828125, -37.126953125, -35.3740234375, -33.62109375, -31.8681640625, -30.115234375, -28.3623046875, -26.609375, -24.8564453125, -23.103515625, -21.3505859375, -19.59765625, -17.8447265625, -16.091796875, -14.3388671875, -12.5859375, -10.8330078125, -9.080078125, -7.3271484375, -5.57421875, -3.8212890625, -2.068359375, -0.3154296875, 1.4375, 3.1904296875, 4.943359375, 6.6962890625, 8.44921875, 10.2021484375, 11.955078125, 13.7080078125, 15.4609375, 17.2138671875, 18.966796875, 20.7197265625, 22.47265625, 24.2255859375, 25.978515625, 27.7314453125, 29.484375, 31.2373046875, 32.990234375, 34.7431640625, 36.49609375, 38.2490234375, 40.001953125, 41.7548828125, 43.5078125, 45.2607421875, 47.013671875, 48.7666015625, 50.51953125, 52.2724609375, 54.025390625, 55.7783203125, 57.53125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 12.0, 19.0, 27.0, 32.0, 37.0, 54.0, 88.0, 118.0, 101.0, 140.0, 90.0, 91.0, 60.0, 47.0, 39.0, 14.0, 19.0, 7.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.418426513671875, -53.722652435302734, -51.02688217163086, -48.33110809326172, -45.635337829589844, -42.9395637512207, -40.24378967285156, -37.54801940917969, -34.85224533081055, -32.156471252441406, -29.46070098876953, -26.76492691040039, -24.069154739379883, -21.373382568359375, -18.677608489990234, -15.981836318969727, -13.286064147949219, -10.590291976928711, -7.894518852233887, -5.1987457275390625, -2.5029735565185547, 0.19279861450195312, 2.8885726928710938, 5.584344863891602, 8.28011703491211, 10.975889205932617, 13.671662330627441, 16.367435455322266, 19.063207626342773, 21.75897979736328, 24.454753875732422, 27.15052604675293, 29.846290588378906, 32.54206466674805, 35.23783493041992, 37.93360900878906, 40.62937927246094, 43.32515335083008, 46.02092742919922, 48.716697692871094, 51.412471771240234, 54.108245849609375, 56.80401611328125, 59.49979019165039, 62.19556427001953, 64.8913345336914, 67.58711242675781, 70.28288269042969, 72.97865295410156, 75.67442321777344, 78.37020111083984, 81.06597137451172, 83.7617416381836, 86.45751953125, 89.15328979492188, 91.84906005859375, 94.54483032226562, 97.2406005859375, 99.9363784790039, 102.63214874267578, 105.32791900634766, 108.02369689941406, 110.71946716308594, 113.41523742675781, 116.11101531982422]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 5.0, 6.0, 2.0, 13.0, 5.0, 6.0, 7.0, 12.0, 16.0, 12.0, 18.0, 25.0, 23.0, 26.0, 34.0, 34.0, 39.0, 28.0, 36.0, 37.0, 34.0, 41.0, 35.0, 33.0, 38.0, 34.0, 40.0, 38.0, 32.0, 30.0, 35.0, 28.0, 27.0, 26.0, 24.0, 17.0, 15.0, 12.0, 13.0, 14.0, 12.0, 5.0, 8.0, 7.0, 4.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-56.64322280883789, -54.900875091552734, -53.158531188964844, -51.41618347167969, -49.67383575439453, -47.93149185180664, -46.189144134521484, -44.446800231933594, -42.70445251464844, -40.96210479736328, -39.21976089477539, -37.477413177490234, -35.73506546020508, -33.99272155761719, -32.25037384033203, -30.508028030395508, -28.76568031311035, -27.023334503173828, -25.280986785888672, -23.53864097595215, -21.796295166015625, -20.05394744873047, -18.311601638793945, -16.569255828857422, -14.826909065246582, -13.084562301635742, -11.342216491699219, -9.599869728088379, -7.857523441314697, -6.115177154541016, -4.372830390930176, -2.6304845809936523, -0.8881378173828125, 0.8542085886001587, 2.59655499458313, 4.338901519775391, 6.081247806549072, 7.823594093322754, 9.565940856933594, 11.308286666870117, 13.050633430480957, 14.792980194091797, 16.53532600402832, 18.277671813964844, 20.02001953125, 21.762365341186523, 23.504711151123047, 25.247058868408203, 26.989404678344727, 28.73175048828125, 30.474098205566406, 32.21644592285156, 33.95878982543945, 35.70113754272461, 37.4434814453125, 39.185829162597656, 40.92817687988281, 42.67052459716797, 44.41286849975586, 46.155216217041016, 47.89756393432617, 49.63990783691406, 51.38225555419922, 53.124603271484375, 54.866947174072266]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 2.0, 1.0, 3.0, 3.0, 8.0, 12.0, 17.0, 15.0, 20.0, 25.0, 23.0, 26.0, 29.0, 37.0, 27.0, 37.0, 41.0, 48.0, 49.0, 47.0, 47.0, 47.0, 39.0, 40.0, 35.0, 38.0, 31.0, 34.0, 34.0, 33.0, 32.0, 19.0, 13.0, 18.0, 11.0, 14.0, 8.0, 4.0, 4.0, 5.0, 7.0, 2.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.25, -9.891845703125, -9.53369140625, -9.175537109375, -8.8173828125, -8.459228515625, -8.10107421875, -7.742919921875, -7.384765625, -7.026611328125, -6.66845703125, -6.310302734375, -5.9521484375, -5.593994140625, -5.23583984375, -4.877685546875, -4.51953125, -4.161376953125, -3.80322265625, -3.445068359375, -3.0869140625, -2.728759765625, -2.37060546875, -2.012451171875, -1.654296875, -1.296142578125, -0.93798828125, -0.579833984375, -0.2216796875, 0.136474609375, 0.49462890625, 0.852783203125, 1.2109375, 1.569091796875, 1.92724609375, 2.285400390625, 2.6435546875, 3.001708984375, 3.35986328125, 3.718017578125, 4.076171875, 4.434326171875, 4.79248046875, 5.150634765625, 5.5087890625, 5.866943359375, 6.22509765625, 6.583251953125, 6.94140625, 7.299560546875, 7.65771484375, 8.015869140625, 8.3740234375, 8.732177734375, 9.09033203125, 9.448486328125, 9.806640625, 10.164794921875, 10.52294921875, 10.881103515625, 11.2392578125, 11.597412109375, 11.95556640625, 12.313720703125, 12.671875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 9.0, 11.0, 7.0, 21.0, 36.0, 38.0, 70.0, 80.0, 146.0, 184.0, 299.0, 443.0, 671.0, 1009.0, 1453.0, 2172.0, 3381.0, 5147.0, 7899.0, 12169.0, 18843.0, 29963.0, 47657.0, 78685.0, 127542.0, 189557.0, 187648.0, 126044.0, 77004.0, 47429.0, 29483.0, 18620.0, 11908.0, 7763.0, 5018.0, 3393.0, 2209.0, 1459.0, 992.0, 676.0, 443.0, 315.0, 233.0, 129.0, 88.0, 63.0, 39.0, 37.0, 25.0, 10.0, 15.0, 9.0, 9.0, 4.0, 4.0, 1.0, 1.0], "bins": [-1.19140625, -1.1552886962890625, -1.119171142578125, -1.0830535888671875, -1.04693603515625, -1.0108184814453125, -0.974700927734375, -0.9385833740234375, -0.9024658203125, -0.8663482666015625, -0.830230712890625, -0.7941131591796875, -0.75799560546875, -0.7218780517578125, -0.685760498046875, -0.6496429443359375, -0.613525390625, -0.5774078369140625, -0.541290283203125, -0.5051727294921875, -0.46905517578125, -0.4329376220703125, -0.396820068359375, -0.3607025146484375, -0.3245849609375, -0.2884674072265625, -0.252349853515625, -0.2162322998046875, -0.18011474609375, -0.1439971923828125, -0.107879638671875, -0.0717620849609375, -0.03564453125, 0.0004730224609375, 0.036590576171875, 0.0727081298828125, 0.10882568359375, 0.1449432373046875, 0.181060791015625, 0.2171783447265625, 0.2532958984375, 0.2894134521484375, 0.325531005859375, 0.3616485595703125, 0.39776611328125, 0.4338836669921875, 0.470001220703125, 0.5061187744140625, 0.542236328125, 0.5783538818359375, 0.614471435546875, 0.6505889892578125, 0.68670654296875, 0.7228240966796875, 0.758941650390625, 0.7950592041015625, 0.8311767578125, 0.8672943115234375, 0.903411865234375, 0.9395294189453125, 0.97564697265625, 1.0117645263671875, 1.047882080078125, 1.0839996337890625, 1.1201171875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 9.0, 11.0, 7.0, 15.0, 13.0, 18.0, 15.0, 24.0, 25.0, 26.0, 25.0, 35.0, 43.0, 37.0, 34.0, 40.0, 30.0, 45.0, 1071.0, 34.0, 43.0, 39.0, 43.0, 28.0, 23.0, 42.0, 38.0, 25.0, 27.0, 34.0, 14.0, 10.0, 13.0, 15.0, 7.0, 8.0, 9.0, 6.0, 7.0, 7.0, 2.0, 6.0, 2.0, 4.0, 0.0, 2.0, 3.0], "bins": [-7.921875, -7.69769287109375, -7.4735107421875, -7.24932861328125, -7.025146484375, -6.80096435546875, -6.5767822265625, -6.35260009765625, -6.12841796875, -5.90423583984375, -5.6800537109375, -5.45587158203125, -5.231689453125, -5.00750732421875, -4.7833251953125, -4.55914306640625, -4.3349609375, -4.11077880859375, -3.8865966796875, -3.66241455078125, -3.438232421875, -3.21405029296875, -2.9898681640625, -2.76568603515625, -2.54150390625, -2.31732177734375, -2.0931396484375, -1.86895751953125, -1.644775390625, -1.42059326171875, -1.1964111328125, -0.97222900390625, -0.748046875, -0.52386474609375, -0.2996826171875, -0.07550048828125, 0.148681640625, 0.37286376953125, 0.5970458984375, 0.82122802734375, 1.04541015625, 1.26959228515625, 1.4937744140625, 1.71795654296875, 1.942138671875, 2.16632080078125, 2.3905029296875, 2.61468505859375, 2.8388671875, 3.06304931640625, 3.2872314453125, 3.51141357421875, 3.735595703125, 3.95977783203125, 4.1839599609375, 4.40814208984375, 4.63232421875, 4.85650634765625, 5.0806884765625, 5.30487060546875, 5.529052734375, 5.75323486328125, 5.9774169921875, 6.20159912109375, 6.42578125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 6.0, 9.0, 9.0, 22.0, 25.0, 40.0, 65.0, 108.0, 160.0, 237.0, 394.0, 707.0, 1108.0, 1806.0, 2926.0, 5047.0, 8819.0, 15262.0, 27020.0, 48143.0, 90037.0, 172275.0, 1290967.0, 200516.0, 104172.0, 55402.0, 30677.0, 17216.0, 9734.0, 5696.0, 3419.0, 1964.0, 1200.0, 755.0, 442.0, 267.0, 162.0, 119.0, 71.0, 42.0, 45.0, 13.0, 7.0, 10.0, 8.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74267578125, -0.7199020385742188, -0.6971282958984375, -0.6743545532226562, -0.651580810546875, -0.6288070678710938, -0.6060333251953125, -0.5832595825195312, -0.56048583984375, -0.5377120971679688, -0.5149383544921875, -0.49216461181640625, -0.469390869140625, -0.44661712646484375, -0.4238433837890625, -0.40106964111328125, -0.3782958984375, -0.35552215576171875, -0.3327484130859375, -0.30997467041015625, -0.287200927734375, -0.26442718505859375, -0.2416534423828125, -0.21887969970703125, -0.19610595703125, -0.17333221435546875, -0.1505584716796875, -0.12778472900390625, -0.105010986328125, -0.08223724365234375, -0.0594635009765625, -0.03668975830078125, -0.013916015625, 0.00885772705078125, 0.0316314697265625, 0.05440521240234375, 0.077178955078125, 0.09995269775390625, 0.1227264404296875, 0.14550018310546875, 0.16827392578125, 0.19104766845703125, 0.2138214111328125, 0.23659515380859375, 0.259368896484375, 0.28214263916015625, 0.3049163818359375, 0.32769012451171875, 0.3504638671875, 0.37323760986328125, 0.3960113525390625, 0.41878509521484375, 0.441558837890625, 0.46433258056640625, 0.4871063232421875, 0.5098800659179688, 0.53265380859375, 0.5554275512695312, 0.5782012939453125, 0.6009750366210938, 0.623748779296875, 0.6465225219726562, 0.6692962646484375, 0.6920700073242188, 0.71484375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 9.0, 8.0, 14.0, 22.0, 22.0, 21.0, 34.0, 49.0, 75.0, 108.0, 171.0, 134.0, 85.0, 70.0, 36.0, 30.0, 31.0, 17.0, 10.0, 10.0, 6.0, 4.0, 8.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0902099609375, -0.08727645874023438, -0.08434295654296875, -0.08140945434570312, -0.0784759521484375, -0.07554244995117188, -0.07260894775390625, -0.06967544555664062, -0.066741943359375, -0.06380844116210938, -0.06087493896484375, -0.057941436767578125, -0.0550079345703125, -0.052074432373046875, -0.04914093017578125, -0.046207427978515625, -0.04327392578125, -0.040340423583984375, -0.03740692138671875, -0.034473419189453125, -0.0315399169921875, -0.028606414794921875, -0.02567291259765625, -0.022739410400390625, -0.019805908203125, -0.016872406005859375, -0.01393890380859375, -0.011005401611328125, -0.0080718994140625, -0.005138397216796875, -0.00220489501953125, 0.000728607177734375, 0.003662109375, 0.006595611572265625, 0.00952911376953125, 0.012462615966796875, 0.0153961181640625, 0.018329620361328125, 0.02126312255859375, 0.024196624755859375, 0.027130126953125, 0.030063629150390625, 0.03299713134765625, 0.035930633544921875, 0.0388641357421875, 0.041797637939453125, 0.04473114013671875, 0.047664642333984375, 0.05059814453125, 0.053531646728515625, 0.05646514892578125, 0.059398651123046875, 0.0623321533203125, 0.06526565551757812, 0.06819915771484375, 0.07113265991210938, 0.074066162109375, 0.07699966430664062, 0.07993316650390625, 0.08286666870117188, 0.0858001708984375, 0.08873367309570312, 0.09166717529296875, 0.09460067749023438, 0.0975341796875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 5.0, 6.0, 6.0, 1.0, 3.0, 10.0, 8.0, 10.0, 20.0, 28.0, 37.0, 61.0, 68.0, 168.0, 510.0, 31795.0, 1013508.0, 1721.0, 264.0, 110.0, 62.0, 34.0, 26.0, 28.0, 20.0, 12.0, 10.0, 8.0, 2.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.0951690673828125, -2.030181884765625, -1.9651947021484375, -1.90020751953125, -1.8352203369140625, -1.770233154296875, -1.7052459716796875, -1.6402587890625, -1.5752716064453125, -1.510284423828125, -1.4452972412109375, -1.38031005859375, -1.3153228759765625, -1.250335693359375, -1.1853485107421875, -1.120361328125, -1.0553741455078125, -0.990386962890625, -0.9253997802734375, -0.86041259765625, -0.7954254150390625, -0.730438232421875, -0.6654510498046875, -0.6004638671875, -0.5354766845703125, -0.470489501953125, -0.4055023193359375, -0.34051513671875, -0.2755279541015625, -0.210540771484375, -0.1455535888671875, -0.08056640625, -0.0155792236328125, 0.049407958984375, 0.1143951416015625, 0.17938232421875, 0.2443695068359375, 0.309356689453125, 0.3743438720703125, 0.4393310546875, 0.5043182373046875, 0.569305419921875, 0.6342926025390625, 0.69927978515625, 0.7642669677734375, 0.829254150390625, 0.8942413330078125, 0.959228515625, 1.0242156982421875, 1.089202880859375, 1.1541900634765625, 1.21917724609375, 1.2841644287109375, 1.349151611328125, 1.4141387939453125, 1.4791259765625, 1.5441131591796875, 1.609100341796875, 1.6740875244140625, 1.73907470703125, 1.8040618896484375, 1.869049072265625, 1.9340362548828125, 1.9990234375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 9.0, 21.0, 115.0, 623.0, 197.0, 33.0, 11.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.697900652885437, -0.6706209182739258, -0.6433412432670593, -0.6160615086555481, -0.5887818336486816, -0.5615020990371704, -0.5342223644256592, -0.5069426894187927, -0.4796629548072815, -0.45238324999809265, -0.4251035451889038, -0.3978238105773926, -0.37054410576820374, -0.3432644009590149, -0.31598469614982605, -0.2887049913406372, -0.26142528653144836, -0.23414558172225952, -0.20686586201190948, -0.17958615720272064, -0.1523064374923706, -0.12502673268318176, -0.09774702787399292, -0.07046730816364288, -0.04318760335445404, -0.01590789295732975, 0.01137181743979454, 0.03865152597427368, 0.06593123823404312, 0.09321095049381256, 0.1204906553030014, 0.14777037501335144, 0.17505007982254028, 0.20232978463172913, 0.22960950434207916, 0.2568892240524292, 0.28416892886161804, 0.3114486336708069, 0.3387283384799957, 0.36600804328918457, 0.3932877779006958, 0.42056748270988464, 0.4478471875190735, 0.4751269221305847, 0.5024065971374512, 0.5296863317489624, 0.5569660663604736, 0.5842457413673401, 0.6115254163742065, 0.6388051509857178, 0.6660848259925842, 0.6933645606040955, 0.7206442356109619, 0.7479239702224731, 0.7752037048339844, 0.8024833798408508, 0.8297631144523621, 0.8570428490638733, 0.8843225240707397, 0.911602258682251, 0.9388819336891174, 0.9661616683006287, 0.9934413433074951, 1.0207210779190063, 1.0480008125305176]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 10.0, 5.0, 10.0, 9.0, 12.0, 20.0, 18.0, 19.0, 19.0, 23.0, 30.0, 32.0, 32.0, 40.0, 35.0, 41.0, 33.0, 41.0, 50.0, 36.0, 41.0, 47.0, 30.0, 37.0, 33.0, 42.0, 27.0, 27.0, 31.0, 26.0, 22.0, 23.0, 16.0, 14.0, 14.0, 12.0, 13.0, 6.0, 4.0, 5.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.16932815313339233, -0.16395199298858643, -0.1585758477449417, -0.1531996876001358, -0.1478235423564911, -0.14244738221168518, -0.13707122206687927, -0.13169507682323456, -0.12631893157958984, -0.12094277888536453, -0.11556662619113922, -0.11019046604633331, -0.1048143208026886, -0.09943816065788269, -0.09406200796365738, -0.08868585526943207, -0.08330969512462616, -0.07793354243040085, -0.07255738973617554, -0.06718122959136963, -0.061805080622434616, -0.056428927928209305, -0.051052771508693695, -0.045676618814468384, -0.04030046612024307, -0.03492431342601776, -0.0295481588691473, -0.02417200431227684, -0.01879585161805153, -0.013419698923826218, -0.008043542504310608, -0.0026673898100852966, 0.0027087628841400146, 0.0080849165096879, 0.013461070135235786, 0.018837224692106247, 0.024213377386331558, 0.02958953008055687, 0.03496568650007248, 0.04034183919429779, 0.0457179918885231, 0.05109414458274841, 0.056470297276973724, 0.061846453696489334, 0.06722261011600494, 0.07259875535964966, 0.07797491550445557, 0.08335106819868088, 0.08872722089290619, 0.0941033735871315, 0.09947952628135681, 0.10485568642616272, 0.11023183166980743, 0.11560799181461334, 0.12098414450883865, 0.12636029720306396, 0.13173645734786987, 0.13711261749267578, 0.1424887627363205, 0.1478649228811264, 0.15324106812477112, 0.15861722826957703, 0.16399338841438293, 0.16936953365802765, 0.17474567890167236]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 2.0, 1.0, 3.0, 3.0, 8.0, 12.0, 17.0, 14.0, 21.0, 25.0, 23.0, 26.0, 29.0, 37.0, 27.0, 37.0, 42.0, 47.0, 49.0, 47.0, 47.0, 47.0, 39.0, 42.0, 34.0, 37.0, 31.0, 34.0, 35.0, 32.0, 32.0, 19.0, 12.0, 20.0, 10.0, 14.0, 8.0, 4.0, 4.0, 5.0, 7.0, 2.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.25, -9.891845703125, -9.53369140625, -9.175537109375, -8.8173828125, -8.459228515625, -8.10107421875, -7.742919921875, -7.384765625, -7.026611328125, -6.66845703125, -6.310302734375, -5.9521484375, -5.593994140625, -5.23583984375, -4.877685546875, -4.51953125, -4.161376953125, -3.80322265625, -3.445068359375, -3.0869140625, -2.728759765625, -2.37060546875, -2.012451171875, -1.654296875, -1.296142578125, -0.93798828125, -0.579833984375, -0.2216796875, 0.136474609375, 0.49462890625, 0.852783203125, 1.2109375, 1.569091796875, 1.92724609375, 2.285400390625, 2.6435546875, 3.001708984375, 3.35986328125, 3.718017578125, 4.076171875, 4.434326171875, 4.79248046875, 5.150634765625, 5.5087890625, 5.866943359375, 6.22509765625, 6.583251953125, 6.94140625, 7.299560546875, 7.65771484375, 8.015869140625, 8.3740234375, 8.732177734375, 9.09033203125, 9.448486328125, 9.806640625, 10.164794921875, 10.52294921875, 10.881103515625, 11.2392578125, 11.597412109375, 11.95556640625, 12.313720703125, 12.671875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 5.0, 0.0, 3.0, 6.0, 9.0, 10.0, 15.0, 12.0, 26.0, 24.0, 30.0, 29.0, 65.0, 92.0, 144.0, 180.0, 248.0, 381.0, 643.0, 1070.0, 1875.0, 3712.0, 7196.0, 15750.0, 38700.0, 139572.0, 631213.0, 137793.0, 38570.0, 15430.0, 7284.0, 3598.0, 1914.0, 1094.0, 610.0, 397.0, 246.0, 158.0, 111.0, 89.0, 71.0, 46.0, 30.0, 28.0, 22.0, 16.0, 9.0, 10.0, 5.0, 11.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.1875, -18.51416015625, -17.8408203125, -17.16748046875, -16.494140625, -15.82080078125, -15.1474609375, -14.47412109375, -13.80078125, -13.12744140625, -12.4541015625, -11.78076171875, -11.107421875, -10.43408203125, -9.7607421875, -9.08740234375, -8.4140625, -7.74072265625, -7.0673828125, -6.39404296875, -5.720703125, -5.04736328125, -4.3740234375, -3.70068359375, -3.02734375, -2.35400390625, -1.6806640625, -1.00732421875, -0.333984375, 0.33935546875, 1.0126953125, 1.68603515625, 2.359375, 3.03271484375, 3.7060546875, 4.37939453125, 5.052734375, 5.72607421875, 6.3994140625, 7.07275390625, 7.74609375, 8.41943359375, 9.0927734375, 9.76611328125, 10.439453125, 11.11279296875, 11.7861328125, 12.45947265625, 13.1328125, 13.80615234375, 14.4794921875, 15.15283203125, 15.826171875, 16.49951171875, 17.1728515625, 17.84619140625, 18.51953125, 19.19287109375, 19.8662109375, 20.53955078125, 21.212890625, 21.88623046875, 22.5595703125, 23.23291015625, 23.90625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 4.0, 11.0, 8.0, 12.0, 18.0, 32.0, 25.0, 17.0, 27.0, 35.0, 36.0, 48.0, 51.0, 53.0, 71.0, 108.0, 191.0, 1528.0, 231.0, 98.0, 80.0, 52.0, 52.0, 31.0, 37.0, 37.0, 29.0, 22.0, 14.0, 20.0, 21.0, 10.0, 9.0, 8.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.484375, -25.487060546875, -24.48974609375, -23.492431640625, -22.4951171875, -21.497802734375, -20.50048828125, -19.503173828125, -18.505859375, -17.508544921875, -16.51123046875, -15.513916015625, -14.5166015625, -13.519287109375, -12.52197265625, -11.524658203125, -10.52734375, -9.530029296875, -8.53271484375, -7.535400390625, -6.5380859375, -5.540771484375, -4.54345703125, -3.546142578125, -2.548828125, -1.551513671875, -0.55419921875, 0.443115234375, 1.4404296875, 2.437744140625, 3.43505859375, 4.432373046875, 5.4296875, 6.427001953125, 7.42431640625, 8.421630859375, 9.4189453125, 10.416259765625, 11.41357421875, 12.410888671875, 13.408203125, 14.405517578125, 15.40283203125, 16.400146484375, 17.3974609375, 18.394775390625, 19.39208984375, 20.389404296875, 21.38671875, 22.384033203125, 23.38134765625, 24.378662109375, 25.3759765625, 26.373291015625, 27.37060546875, 28.367919921875, 29.365234375, 30.362548828125, 31.35986328125, 32.357177734375, 33.3544921875, 34.351806640625, 35.34912109375, 36.346435546875, 37.34375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 7.0, 9.0, 10.0, 7.0, 18.0, 26.0, 22.0, 29.0, 32.0, 55.0, 67.0, 80.0, 129.0, 205.0, 430.0, 1334.0, 6521.0, 74687.0, 2899231.0, 150075.0, 9672.0, 1666.0, 568.0, 257.0, 153.0, 103.0, 74.0, 43.0, 35.0, 39.0, 22.0, 30.0, 24.0, 11.0, 11.0, 9.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-76.5, -74.51806640625, -72.5361328125, -70.55419921875, -68.572265625, -66.59033203125, -64.6083984375, -62.62646484375, -60.64453125, -58.66259765625, -56.6806640625, -54.69873046875, -52.716796875, -50.73486328125, -48.7529296875, -46.77099609375, -44.7890625, -42.80712890625, -40.8251953125, -38.84326171875, -36.861328125, -34.87939453125, -32.8974609375, -30.91552734375, -28.93359375, -26.95166015625, -24.9697265625, -22.98779296875, -21.005859375, -19.02392578125, -17.0419921875, -15.06005859375, -13.078125, -11.09619140625, -9.1142578125, -7.13232421875, -5.150390625, -3.16845703125, -1.1865234375, 0.79541015625, 2.77734375, 4.75927734375, 6.7412109375, 8.72314453125, 10.705078125, 12.68701171875, 14.6689453125, 16.65087890625, 18.6328125, 20.61474609375, 22.5966796875, 24.57861328125, 26.560546875, 28.54248046875, 30.5244140625, 32.50634765625, 34.48828125, 36.47021484375, 38.4521484375, 40.43408203125, 42.416015625, 44.39794921875, 46.3798828125, 48.36181640625, 50.34375]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 3.0, 7.0, 12.0, 26.0, 46.0, 70.0, 128.0, 146.0, 160.0, 142.0, 98.0, 84.0, 34.0, 30.0, 8.0, 3.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.074270248413086, -21.95652961730957, -19.838788986206055, -17.721050262451172, -15.60330867767334, -13.485568046569824, -11.367828369140625, -9.25008773803711, -7.132347106933594, -5.014606475830078, -2.8968663215637207, -0.7791261672973633, 1.3386144638061523, 3.456355094909668, 5.574094772338867, 7.691835403442383, 9.809576034545898, 11.927316665649414, 14.04505729675293, 16.162796020507812, 18.280536651611328, 20.398277282714844, 22.51601791381836, 24.633758544921875, 26.75149917602539, 28.869239807128906, 30.986980438232422, 33.10472106933594, 35.22246170043945, 37.34020233154297, 39.45793914794922, 41.57568359375, 43.69342803955078, 45.8111686706543, 47.92890930175781, 50.04664993286133, 52.164390563964844, 54.28213119506836, 56.399871826171875, 58.517608642578125, 60.635353088378906, 62.75309371948242, 64.87083435058594, 66.98857116699219, 69.10631561279297, 71.22405242919922, 73.341796875, 75.45953369140625, 77.5772705078125, 79.69500732421875, 81.81275177001953, 83.93048858642578, 86.04823303222656, 88.16596984863281, 90.2837142944336, 92.40145111083984, 94.51919555664062, 96.63693237304688, 98.75467681884766, 100.8724136352539, 102.99015808105469, 105.10789489746094, 107.22563934326172, 109.34337615966797, 111.46112060546875]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 3.0, 7.0, 9.0, 14.0, 5.0, 15.0, 17.0, 16.0, 16.0, 16.0, 24.0, 22.0, 21.0, 24.0, 28.0, 28.0, 32.0, 44.0, 48.0, 39.0, 33.0, 35.0, 35.0, 38.0, 39.0, 38.0, 39.0, 33.0, 32.0, 25.0, 18.0, 36.0, 25.0, 18.0, 20.0, 13.0, 17.0, 9.0, 16.0, 9.0, 9.0, 7.0, 6.0, 1.0, 4.0, 5.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-66.19977569580078, -64.14521789550781, -62.09065628051758, -60.03609848022461, -57.981536865234375, -55.926979064941406, -53.87242126464844, -51.8178596496582, -49.76329803466797, -47.708740234375, -45.654178619384766, -43.5996208190918, -41.54505920410156, -39.490501403808594, -37.435943603515625, -35.38138198852539, -33.32682418823242, -31.27226448059082, -29.21770477294922, -27.16314697265625, -25.108585357666016, -23.054027557373047, -20.999467849731445, -18.944908142089844, -16.890348434448242, -14.83578872680664, -12.781229019165039, -10.726670265197754, -8.672110557556152, -6.617550849914551, -4.562992095947266, -2.508432388305664, -0.4538726806640625, 1.60068678855896, 3.6552462577819824, 5.709805488586426, 7.764365196228027, 9.818924903869629, 11.873483657836914, 13.928043365478516, 15.982603073120117, 18.03716278076172, 20.09172248840332, 22.146282196044922, 24.20083999633789, 26.255401611328125, 28.309959411621094, 30.364519119262695, 32.4190788269043, 34.473636627197266, 36.5281982421875, 38.58275604248047, 40.6373176574707, 42.69187545776367, 44.746437072753906, 46.800994873046875, 48.855552673339844, 50.91011047363281, 52.96467208862305, 55.019229888916016, 57.07379150390625, 59.12834930419922, 61.18290710449219, 63.23746871948242, 65.29203033447266]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 4.0, 8.0, 7.0, 15.0, 19.0, 22.0, 29.0, 27.0, 26.0, 30.0, 33.0, 46.0, 49.0, 48.0, 50.0, 57.0, 56.0, 46.0, 36.0, 43.0, 38.0, 43.0, 36.0, 40.0, 30.0, 30.0, 25.0, 22.0, 16.0, 15.0, 16.0, 11.0, 4.0, 5.0, 1.0, 4.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7578125, -11.3485107421875, -10.939208984375, -10.5299072265625, -10.12060546875, -9.7113037109375, -9.302001953125, -8.8927001953125, -8.4833984375, -8.0740966796875, -7.664794921875, -7.2554931640625, -6.84619140625, -6.4368896484375, -6.027587890625, -5.6182861328125, -5.208984375, -4.7996826171875, -4.390380859375, -3.9810791015625, -3.57177734375, -3.1624755859375, -2.753173828125, -2.3438720703125, -1.9345703125, -1.5252685546875, -1.115966796875, -0.7066650390625, -0.29736328125, 0.1119384765625, 0.521240234375, 0.9305419921875, 1.33984375, 1.7491455078125, 2.158447265625, 2.5677490234375, 2.97705078125, 3.3863525390625, 3.795654296875, 4.2049560546875, 4.6142578125, 5.0235595703125, 5.432861328125, 5.8421630859375, 6.25146484375, 6.6607666015625, 7.070068359375, 7.4793701171875, 7.888671875, 8.2979736328125, 8.707275390625, 9.1165771484375, 9.52587890625, 9.9351806640625, 10.344482421875, 10.7537841796875, 11.1630859375, 11.5723876953125, 11.981689453125, 12.3909912109375, 12.80029296875, 13.2095947265625, 13.618896484375, 14.0281982421875, 14.4375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 7.0, 10.0, 13.0, 9.0, 13.0, 30.0, 26.0, 32.0, 50.0, 72.0, 116.0, 127.0, 160.0, 256.0, 375.0, 462.0, 692.0, 1078.0, 1681.0, 2673.0, 4525.0, 8557.0, 17715.0, 46034.0, 194257.0, 1301374.0, 2120788.0, 371487.0, 71360.0, 24274.0, 10913.0, 5758.0, 3296.0, 2000.0, 1294.0, 875.0, 622.0, 361.0, 276.0, 195.0, 123.0, 102.0, 56.0, 51.0, 40.0, 28.0, 13.0, 5.0, 7.0, 5.0, 8.0, 3.0, 1.0, 0.0, 1.0], "bins": [-23.109375, -22.452392578125, -21.79541015625, -21.138427734375, -20.4814453125, -19.824462890625, -19.16748046875, -18.510498046875, -17.853515625, -17.196533203125, -16.53955078125, -15.882568359375, -15.2255859375, -14.568603515625, -13.91162109375, -13.254638671875, -12.59765625, -11.940673828125, -11.28369140625, -10.626708984375, -9.9697265625, -9.312744140625, -8.65576171875, -7.998779296875, -7.341796875, -6.684814453125, -6.02783203125, -5.370849609375, -4.7138671875, -4.056884765625, -3.39990234375, -2.742919921875, -2.0859375, -1.428955078125, -0.77197265625, -0.114990234375, 0.5419921875, 1.198974609375, 1.85595703125, 2.512939453125, 3.169921875, 3.826904296875, 4.48388671875, 5.140869140625, 5.7978515625, 6.454833984375, 7.11181640625, 7.768798828125, 8.42578125, 9.082763671875, 9.73974609375, 10.396728515625, 11.0537109375, 11.710693359375, 12.36767578125, 13.024658203125, 13.681640625, 14.338623046875, 14.99560546875, 15.652587890625, 16.3095703125, 16.966552734375, 17.62353515625, 18.280517578125, 18.9375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 5.0, 6.0, 5.0, 13.0, 16.0, 17.0, 21.0, 29.0, 39.0, 42.0, 72.0, 104.0, 132.0, 230.0, 303.0, 418.0, 554.0, 578.0, 436.0, 290.0, 219.0, 145.0, 98.0, 71.0, 60.0, 33.0, 30.0, 15.0, 20.0, 21.0, 11.0, 8.0, 5.0, 4.0, 9.0, 1.0, 1.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.265625, -17.65673828125, -17.0478515625, -16.43896484375, -15.830078125, -15.22119140625, -14.6123046875, -14.00341796875, -13.39453125, -12.78564453125, -12.1767578125, -11.56787109375, -10.958984375, -10.35009765625, -9.7412109375, -9.13232421875, -8.5234375, -7.91455078125, -7.3056640625, -6.69677734375, -6.087890625, -5.47900390625, -4.8701171875, -4.26123046875, -3.65234375, -3.04345703125, -2.4345703125, -1.82568359375, -1.216796875, -0.60791015625, 0.0009765625, 0.60986328125, 1.21875, 1.82763671875, 2.4365234375, 3.04541015625, 3.654296875, 4.26318359375, 4.8720703125, 5.48095703125, 6.08984375, 6.69873046875, 7.3076171875, 7.91650390625, 8.525390625, 9.13427734375, 9.7431640625, 10.35205078125, 10.9609375, 11.56982421875, 12.1787109375, 12.78759765625, 13.396484375, 14.00537109375, 14.6142578125, 15.22314453125, 15.83203125, 16.44091796875, 17.0498046875, 17.65869140625, 18.267578125, 18.87646484375, 19.4853515625, 20.09423828125, 20.703125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 3.0, 5.0, 5.0, 7.0, 5.0, 11.0, 16.0, 24.0, 27.0, 32.0, 46.0, 81.0, 145.0, 273.0, 547.0, 1276.0, 3420.0, 11598.0, 54582.0, 674876.0, 3240245.0, 171096.0, 25628.0, 6313.0, 2196.0, 877.0, 419.0, 215.0, 99.0, 61.0, 37.0, 29.0, 19.0, 14.0, 19.0, 10.0, 6.0, 6.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.65625, -51.07373046875, -49.4912109375, -47.90869140625, -46.326171875, -44.74365234375, -43.1611328125, -41.57861328125, -39.99609375, -38.41357421875, -36.8310546875, -35.24853515625, -33.666015625, -32.08349609375, -30.5009765625, -28.91845703125, -27.3359375, -25.75341796875, -24.1708984375, -22.58837890625, -21.005859375, -19.42333984375, -17.8408203125, -16.25830078125, -14.67578125, -13.09326171875, -11.5107421875, -9.92822265625, -8.345703125, -6.76318359375, -5.1806640625, -3.59814453125, -2.015625, -0.43310546875, 1.1494140625, 2.73193359375, 4.314453125, 5.89697265625, 7.4794921875, 9.06201171875, 10.64453125, 12.22705078125, 13.8095703125, 15.39208984375, 16.974609375, 18.55712890625, 20.1396484375, 21.72216796875, 23.3046875, 24.88720703125, 26.4697265625, 28.05224609375, 29.634765625, 31.21728515625, 32.7998046875, 34.38232421875, 35.96484375, 37.54736328125, 39.1298828125, 40.71240234375, 42.294921875, 43.87744140625, 45.4599609375, 47.04248046875, 48.625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 10.0, 10.0, 19.0, 46.0, 92.0, 155.0, 199.0, 177.0, 122.0, 97.0, 47.0, 21.0, 6.0, 8.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-218.65194702148438, -213.535888671875, -208.41983032226562, -203.30377197265625, -198.18771362304688, -193.0716552734375, -187.95559692382812, -182.83953857421875, -177.72348022460938, -172.607421875, -167.49136352539062, -162.37530517578125, -157.25924682617188, -152.1431884765625, -147.02713012695312, -141.91107177734375, -136.79501342773438, -131.678955078125, -126.56289672851562, -121.44683837890625, -116.33078002929688, -111.2147216796875, -106.09866333007812, -100.98260498046875, -95.86656188964844, -90.75050354003906, -85.63444519042969, -80.51838684082031, -75.40232849121094, -70.28627014160156, -65.17021179199219, -60.05415725708008, -54.938087463378906, -49.82202911376953, -44.705970764160156, -39.58991241455078, -34.473854064941406, -29.357797622680664, -24.241741180419922, -19.125682830810547, -14.009624481201172, -8.893566131591797, -3.7775087356567383, 1.3385486602783203, 6.454607009887695, 11.57066535949707, 16.686721801757812, 21.802780151367188, 26.918838500976562, 32.03489685058594, 37.15095520019531, 42.26701354980469, 47.38307189941406, 52.49913024902344, 57.61518478393555, 62.73124313354492, 67.84730529785156, 72.96336364746094, 78.07942199707031, 83.19548034667969, 88.31153869628906, 93.42759704589844, 98.54365539550781, 103.65971374511719, 108.77576446533203]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 3.0, 10.0, 10.0, 7.0, 13.0, 19.0, 21.0, 12.0, 22.0, 24.0, 22.0, 31.0, 23.0, 19.0, 31.0, 33.0, 43.0, 42.0, 27.0, 32.0, 44.0, 44.0, 36.0, 30.0, 29.0, 54.0, 43.0, 38.0, 33.0, 19.0, 32.0, 21.0, 16.0, 20.0, 16.0, 14.0, 13.0, 9.0, 15.0, 8.0, 6.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-58.485225677490234, -56.39339828491211, -54.30157470703125, -52.209747314453125, -50.117919921875, -48.026092529296875, -45.93426513671875, -43.84244155883789, -41.750614166259766, -39.65878677368164, -37.56696319580078, -35.475135803222656, -33.38330841064453, -31.291481018066406, -29.199655532836914, -27.107830047607422, -25.016002655029297, -22.924175262451172, -20.83234977722168, -18.740524291992188, -16.648696899414062, -14.556870460510254, -12.465044021606445, -10.373217582702637, -8.281391143798828, -6.1895647048950195, -4.097738265991211, -2.0059118270874023, 0.08591461181640625, 2.177741050720215, 4.269567489624023, 6.361393928527832, 8.453216552734375, 10.545042991638184, 12.636869430541992, 14.7286958694458, 16.82052230834961, 18.912349700927734, 21.004175186157227, 23.09600067138672, 25.187828063964844, 27.27965545654297, 29.37148094177246, 31.463306427001953, 33.55513381958008, 35.6469612121582, 37.73878479003906, 39.83061218261719, 41.92243957519531, 44.01426696777344, 46.10609436035156, 48.19791793823242, 50.28974533081055, 52.38157272338867, 54.47339630126953, 56.565223693847656, 58.65705108642578, 60.748878479003906, 62.84070587158203, 64.93253326416016, 67.02435302734375, 69.11618041992188, 71.2080078125, 73.29983520507812, 75.39166259765625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 8.0, 12.0, 10.0, 12.0, 13.0, 20.0, 27.0, 20.0, 32.0, 39.0, 25.0, 48.0, 39.0, 31.0, 38.0, 43.0, 40.0, 44.0, 60.0, 45.0, 49.0, 44.0, 42.0, 36.0, 28.0, 37.0, 25.0, 16.0, 12.0, 18.0, 18.0, 12.0, 12.0, 9.0, 9.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9765625, -10.5765380859375, -10.176513671875, -9.7764892578125, -9.37646484375, -8.9764404296875, -8.576416015625, -8.1763916015625, -7.7763671875, -7.3763427734375, -6.976318359375, -6.5762939453125, -6.17626953125, -5.7762451171875, -5.376220703125, -4.9761962890625, -4.576171875, -4.1761474609375, -3.776123046875, -3.3760986328125, -2.97607421875, -2.5760498046875, -2.176025390625, -1.7760009765625, -1.3759765625, -0.9759521484375, -0.575927734375, -0.1759033203125, 0.22412109375, 0.6241455078125, 1.024169921875, 1.4241943359375, 1.82421875, 2.2242431640625, 2.624267578125, 3.0242919921875, 3.42431640625, 3.8243408203125, 4.224365234375, 4.6243896484375, 5.0244140625, 5.4244384765625, 5.824462890625, 6.2244873046875, 6.62451171875, 7.0245361328125, 7.424560546875, 7.8245849609375, 8.224609375, 8.6246337890625, 9.024658203125, 9.4246826171875, 9.82470703125, 10.2247314453125, 10.624755859375, 11.0247802734375, 11.4248046875, 11.8248291015625, 12.224853515625, 12.6248779296875, 13.02490234375, 13.4249267578125, 13.824951171875, 14.2249755859375, 14.625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 12.0, 10.0, 13.0, 22.0, 34.0, 62.0, 94.0, 123.0, 182.0, 299.0, 465.0, 754.0, 1168.0, 1744.0, 2748.0, 4466.0, 7058.0, 11926.0, 19515.0, 32792.0, 55381.0, 97167.0, 169219.0, 233223.0, 171083.0, 98477.0, 56215.0, 33118.0, 19590.0, 12025.0, 7345.0, 4481.0, 2758.0, 1767.0, 1135.0, 737.0, 454.0, 318.0, 220.0, 145.0, 77.0, 36.0, 35.0, 37.0, 9.0, 6.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0], "bins": [-1.4765625, -1.43377685546875, -1.3909912109375, -1.34820556640625, -1.305419921875, -1.26263427734375, -1.2198486328125, -1.17706298828125, -1.13427734375, -1.09149169921875, -1.0487060546875, -1.00592041015625, -0.963134765625, -0.92034912109375, -0.8775634765625, -0.83477783203125, -0.7919921875, -0.74920654296875, -0.7064208984375, -0.66363525390625, -0.620849609375, -0.57806396484375, -0.5352783203125, -0.49249267578125, -0.44970703125, -0.40692138671875, -0.3641357421875, -0.32135009765625, -0.278564453125, -0.23577880859375, -0.1929931640625, -0.15020751953125, -0.107421875, -0.06463623046875, -0.0218505859375, 0.02093505859375, 0.063720703125, 0.10650634765625, 0.1492919921875, 0.19207763671875, 0.23486328125, 0.27764892578125, 0.3204345703125, 0.36322021484375, 0.406005859375, 0.44879150390625, 0.4915771484375, 0.53436279296875, 0.5771484375, 0.61993408203125, 0.6627197265625, 0.70550537109375, 0.748291015625, 0.79107666015625, 0.8338623046875, 0.87664794921875, 0.91943359375, 0.96221923828125, 1.0050048828125, 1.04779052734375, 1.090576171875, 1.13336181640625, 1.1761474609375, 1.21893310546875, 1.26171875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 5.0, 4.0, 9.0, 12.0, 13.0, 21.0, 13.0, 16.0, 19.0, 19.0, 35.0, 27.0, 27.0, 35.0, 24.0, 39.0, 45.0, 38.0, 32.0, 37.0, 1056.0, 50.0, 40.0, 51.0, 36.0, 28.0, 27.0, 36.0, 25.0, 28.0, 18.0, 19.0, 22.0, 25.0, 16.0, 12.0, 20.0, 9.0, 9.0, 6.0, 4.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.95703125, -6.728271484375, -6.49951171875, -6.270751953125, -6.0419921875, -5.813232421875, -5.58447265625, -5.355712890625, -5.126953125, -4.898193359375, -4.66943359375, -4.440673828125, -4.2119140625, -3.983154296875, -3.75439453125, -3.525634765625, -3.296875, -3.068115234375, -2.83935546875, -2.610595703125, -2.3818359375, -2.153076171875, -1.92431640625, -1.695556640625, -1.466796875, -1.238037109375, -1.00927734375, -0.780517578125, -0.5517578125, -0.322998046875, -0.09423828125, 0.134521484375, 0.36328125, 0.592041015625, 0.82080078125, 1.049560546875, 1.2783203125, 1.507080078125, 1.73583984375, 1.964599609375, 2.193359375, 2.422119140625, 2.65087890625, 2.879638671875, 3.1083984375, 3.337158203125, 3.56591796875, 3.794677734375, 4.0234375, 4.252197265625, 4.48095703125, 4.709716796875, 4.9384765625, 5.167236328125, 5.39599609375, 5.624755859375, 5.853515625, 6.082275390625, 6.31103515625, 6.539794921875, 6.7685546875, 6.997314453125, 7.22607421875, 7.454833984375, 7.68359375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 7.0, 13.0, 21.0, 39.0, 47.0, 68.0, 86.0, 143.0, 200.0, 310.0, 435.0, 619.0, 865.0, 1205.0, 1835.0, 2687.0, 3874.0, 5899.0, 8602.0, 12932.0, 19654.0, 30532.0, 47807.0, 75894.0, 120209.0, 282108.0, 1111028.0, 133961.0, 83877.0, 52976.0, 33905.0, 21652.0, 14356.0, 9460.0, 6208.0, 4257.0, 2943.0, 1945.0, 1363.0, 971.0, 680.0, 465.0, 311.0, 220.0, 142.0, 101.0, 70.0, 60.0, 38.0, 15.0, 17.0, 14.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.56640625, -0.5493011474609375, -0.532196044921875, -0.5150909423828125, -0.49798583984375, -0.4808807373046875, -0.463775634765625, -0.4466705322265625, -0.4295654296875, -0.4124603271484375, -0.395355224609375, -0.3782501220703125, -0.36114501953125, -0.3440399169921875, -0.326934814453125, -0.3098297119140625, -0.292724609375, -0.2756195068359375, -0.258514404296875, -0.2414093017578125, -0.22430419921875, -0.2071990966796875, -0.190093994140625, -0.1729888916015625, -0.1558837890625, -0.1387786865234375, -0.121673583984375, -0.1045684814453125, -0.08746337890625, -0.0703582763671875, -0.053253173828125, -0.0361480712890625, -0.01904296875, -0.0019378662109375, 0.015167236328125, 0.0322723388671875, 0.04937744140625, 0.0664825439453125, 0.083587646484375, 0.1006927490234375, 0.1177978515625, 0.1349029541015625, 0.152008056640625, 0.1691131591796875, 0.18621826171875, 0.2033233642578125, 0.220428466796875, 0.2375335693359375, 0.254638671875, 0.2717437744140625, 0.288848876953125, 0.3059539794921875, 0.32305908203125, 0.3401641845703125, 0.357269287109375, 0.3743743896484375, 0.3914794921875, 0.4085845947265625, 0.425689697265625, 0.4427947998046875, 0.45989990234375, 0.4770050048828125, 0.494110107421875, 0.5112152099609375, 0.5283203125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 3.0, 7.0, 17.0, 5.0, 14.0, 19.0, 21.0, 27.0, 37.0, 48.0, 129.0, 285.0, 141.0, 37.0, 35.0, 23.0, 27.0, 14.0, 12.0, 13.0, 11.0, 12.0, 6.0, 0.0, 4.0, 7.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1016845703125, -0.09874248504638672, -0.09580039978027344, -0.09285831451416016, -0.08991622924804688, -0.0869741439819336, -0.08403205871582031, -0.08108997344970703, -0.07814788818359375, -0.07520580291748047, -0.07226371765136719, -0.0693216323852539, -0.06637954711914062, -0.06343746185302734, -0.06049537658691406, -0.05755329132080078, -0.0546112060546875, -0.05166912078857422, -0.04872703552246094, -0.045784950256347656, -0.042842864990234375, -0.039900779724121094, -0.03695869445800781, -0.03401660919189453, -0.03107452392578125, -0.02813243865966797, -0.025190353393554688, -0.022248268127441406, -0.019306182861328125, -0.016364097595214844, -0.013422012329101562, -0.010479927062988281, -0.007537841796875, -0.004595756530761719, -0.0016536712646484375, 0.0012884140014648438, 0.004230499267578125, 0.007172584533691406, 0.010114669799804688, 0.013056755065917969, 0.01599884033203125, 0.01894092559814453, 0.021883010864257812, 0.024825096130371094, 0.027767181396484375, 0.030709266662597656, 0.03365135192871094, 0.03659343719482422, 0.0395355224609375, 0.04247760772705078, 0.04541969299316406, 0.048361778259277344, 0.051303863525390625, 0.054245948791503906, 0.05718803405761719, 0.06013011932373047, 0.06307220458984375, 0.06601428985595703, 0.06895637512207031, 0.0718984603881836, 0.07484054565429688, 0.07778263092041016, 0.08072471618652344, 0.08366680145263672, 0.08660888671875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 7.0, 6.0, 3.0, 4.0, 10.0, 13.0, 20.0, 20.0, 19.0, 24.0, 33.0, 70.0, 164.0, 592.0, 15490.0, 1021452.0, 9782.0, 498.0, 124.0, 57.0, 32.0, 28.0, 17.0, 14.0, 18.0, 9.0, 2.0, 6.0, 6.0, 4.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.08984375, -2.01885986328125, -1.9478759765625, -1.87689208984375, -1.805908203125, -1.73492431640625, -1.6639404296875, -1.59295654296875, -1.52197265625, -1.45098876953125, -1.3800048828125, -1.30902099609375, -1.238037109375, -1.16705322265625, -1.0960693359375, -1.02508544921875, -0.9541015625, -0.88311767578125, -0.8121337890625, -0.74114990234375, -0.670166015625, -0.59918212890625, -0.5281982421875, -0.45721435546875, -0.38623046875, -0.31524658203125, -0.2442626953125, -0.17327880859375, -0.102294921875, -0.03131103515625, 0.0396728515625, 0.11065673828125, 0.181640625, 0.25262451171875, 0.3236083984375, 0.39459228515625, 0.465576171875, 0.53656005859375, 0.6075439453125, 0.67852783203125, 0.74951171875, 0.82049560546875, 0.8914794921875, 0.96246337890625, 1.033447265625, 1.10443115234375, 1.1754150390625, 1.24639892578125, 1.3173828125, 1.38836669921875, 1.4593505859375, 1.53033447265625, 1.601318359375, 1.67230224609375, 1.7432861328125, 1.81427001953125, 1.88525390625, 1.95623779296875, 2.0272216796875, 2.09820556640625, 2.169189453125, 2.24017333984375, 2.3111572265625, 2.38214111328125, 2.453125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 7.0, 20.0, 52.0, 101.0, 289.0, 297.0, 128.0, 63.0, 23.0, 8.0, 11.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2532458007335663, -0.23838427662849426, -0.22352273762226105, -0.20866119861602783, -0.1937996745109558, -0.1789381504058838, -0.16407661139965057, -0.14921507239341736, -0.13435354828834534, -0.11949201673269272, -0.1046304851770401, -0.08976895362138748, -0.07490742206573486, -0.060045890510082245, -0.045184358954429626, -0.030322827398777008, -0.01546129584312439, -0.0005997642874717712, 0.014261767268180847, 0.029123298823833466, 0.043984830379486084, 0.0588463619351387, 0.07370789349079132, 0.08856942504644394, 0.10343095660209656, 0.11829248815774918, 0.1331540197134018, 0.148015558719635, 0.16287708282470703, 0.17773860692977905, 0.19260014593601227, 0.20746168494224548, 0.22232317924499512, 0.23718470335006714, 0.25204622745513916, 0.26690778136253357, 0.2817693054676056, 0.2966308295726776, 0.311492383480072, 0.32635390758514404, 0.34121543169021606, 0.3560769557952881, 0.3709384799003601, 0.3858000338077545, 0.40066155791282654, 0.41552308201789856, 0.43038463592529297, 0.445246160030365, 0.460107684135437, 0.47496920824050903, 0.48983073234558105, 0.5046922564506531, 0.5195537805557251, 0.5344153642654419, 0.5492768883705139, 0.5641384124755859, 0.578999936580658, 0.59386146068573, 0.608722984790802, 0.623584508895874, 0.6384460926055908, 0.6533076167106628, 0.6681691408157349, 0.6830306649208069, 0.6978921890258789]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 6.0, 6.0, 10.0, 9.0, 13.0, 10.0, 13.0, 14.0, 21.0, 18.0, 29.0, 26.0, 30.0, 31.0, 25.0, 46.0, 39.0, 48.0, 45.0, 30.0, 32.0, 31.0, 50.0, 57.0, 34.0, 42.0, 41.0, 37.0, 29.0, 22.0, 19.0, 19.0, 17.0, 15.0, 14.0, 17.0, 18.0, 10.0, 6.0, 7.0, 6.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.17142736911773682, -0.16631774604320526, -0.1612081080675125, -0.15609848499298096, -0.1509888470172882, -0.14587922394275665, -0.1407695859670639, -0.13565996289253235, -0.1305503249168396, -0.12544070184230804, -0.1203310638666153, -0.11522143334150314, -0.11011180281639099, -0.10500217974185944, -0.09989254921674728, -0.09478291869163513, -0.08967329561710358, -0.08456366509199142, -0.07945403456687927, -0.07434440404176712, -0.06923477351665497, -0.06412515044212341, -0.05901551991701126, -0.05390588939189911, -0.04879625886678696, -0.043686628341674805, -0.03857699781656265, -0.0334673710167408, -0.028357740491628647, -0.023248109966516495, -0.018138481304049492, -0.013028852641582489, -0.007919222116470337, -0.0028095925226807594, 0.002300037071108818, 0.0074096666648983955, 0.012519296258687973, 0.017628926783800125, 0.022738555446267128, 0.02784818410873413, 0.03295781463384628, 0.038067445158958435, 0.04317707568407059, 0.04828670248389244, 0.05339633300900459, 0.058505963534116745, 0.0636155903339386, 0.06872522085905075, 0.0738348513841629, 0.07894448190927505, 0.08405411243438721, 0.08916374295949936, 0.09427337348461151, 0.09938299655914307, 0.10449262708425522, 0.10960225760936737, 0.11471188813447952, 0.11982151865959167, 0.12493114918470383, 0.13004077970981598, 0.13515040278434753, 0.14026004076004028, 0.14536966383457184, 0.1504792869091034, 0.15558892488479614]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 7.0, 12.0, 10.0, 12.0, 13.0, 20.0, 27.0, 20.0, 34.0, 37.0, 26.0, 47.0, 39.0, 32.0, 36.0, 45.0, 39.0, 44.0, 60.0, 45.0, 50.0, 43.0, 43.0, 36.0, 27.0, 37.0, 25.0, 16.0, 12.0, 18.0, 18.0, 12.0, 11.0, 11.0, 8.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.96875, -10.56884765625, -10.1689453125, -9.76904296875, -9.369140625, -8.96923828125, -8.5693359375, -8.16943359375, -7.76953125, -7.36962890625, -6.9697265625, -6.56982421875, -6.169921875, -5.77001953125, -5.3701171875, -4.97021484375, -4.5703125, -4.17041015625, -3.7705078125, -3.37060546875, -2.970703125, -2.57080078125, -2.1708984375, -1.77099609375, -1.37109375, -0.97119140625, -0.5712890625, -0.17138671875, 0.228515625, 0.62841796875, 1.0283203125, 1.42822265625, 1.828125, 2.22802734375, 2.6279296875, 3.02783203125, 3.427734375, 3.82763671875, 4.2275390625, 4.62744140625, 5.02734375, 5.42724609375, 5.8271484375, 6.22705078125, 6.626953125, 7.02685546875, 7.4267578125, 7.82666015625, 8.2265625, 8.62646484375, 9.0263671875, 9.42626953125, 9.826171875, 10.22607421875, 10.6259765625, 11.02587890625, 11.42578125, 11.82568359375, 12.2255859375, 12.62548828125, 13.025390625, 13.42529296875, 13.8251953125, 14.22509765625, 14.625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 10.0, 13.0, 14.0, 24.0, 47.0, 58.0, 72.0, 118.0, 180.0, 285.0, 402.0, 550.0, 823.0, 1225.0, 1921.0, 2973.0, 4602.0, 7481.0, 12223.0, 21825.0, 40416.0, 80334.0, 177162.0, 338302.0, 179681.0, 81396.0, 41284.0, 21522.0, 12629.0, 7482.0, 4766.0, 2896.0, 1900.0, 1340.0, 848.0, 549.0, 365.0, 271.0, 179.0, 120.0, 86.0, 55.0, 36.0, 30.0, 20.0, 18.0, 9.0, 3.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.75, -13.29931640625, -12.8486328125, -12.39794921875, -11.947265625, -11.49658203125, -11.0458984375, -10.59521484375, -10.14453125, -9.69384765625, -9.2431640625, -8.79248046875, -8.341796875, -7.89111328125, -7.4404296875, -6.98974609375, -6.5390625, -6.08837890625, -5.6376953125, -5.18701171875, -4.736328125, -4.28564453125, -3.8349609375, -3.38427734375, -2.93359375, -2.48291015625, -2.0322265625, -1.58154296875, -1.130859375, -0.68017578125, -0.2294921875, 0.22119140625, 0.671875, 1.12255859375, 1.5732421875, 2.02392578125, 2.474609375, 2.92529296875, 3.3759765625, 3.82666015625, 4.27734375, 4.72802734375, 5.1787109375, 5.62939453125, 6.080078125, 6.53076171875, 6.9814453125, 7.43212890625, 7.8828125, 8.33349609375, 8.7841796875, 9.23486328125, 9.685546875, 10.13623046875, 10.5869140625, 11.03759765625, 11.48828125, 11.93896484375, 12.3896484375, 12.84033203125, 13.291015625, 13.74169921875, 14.1923828125, 14.64306640625, 15.09375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 2.0, 5.0, 7.0, 4.0, 13.0, 12.0, 9.0, 12.0, 11.0, 14.0, 24.0, 16.0, 32.0, 30.0, 35.0, 52.0, 37.0, 52.0, 60.0, 62.0, 129.0, 252.0, 1375.0, 238.0, 109.0, 73.0, 63.0, 41.0, 47.0, 39.0, 31.0, 23.0, 20.0, 14.0, 17.0, 19.0, 15.0, 12.0, 6.0, 8.0, 7.0, 11.0, 6.0, 0.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.71875, -25.810302734375, -24.90185546875, -23.993408203125, -23.0849609375, -22.176513671875, -21.26806640625, -20.359619140625, -19.451171875, -18.542724609375, -17.63427734375, -16.725830078125, -15.8173828125, -14.908935546875, -14.00048828125, -13.092041015625, -12.18359375, -11.275146484375, -10.36669921875, -9.458251953125, -8.5498046875, -7.641357421875, -6.73291015625, -5.824462890625, -4.916015625, -4.007568359375, -3.09912109375, -2.190673828125, -1.2822265625, -0.373779296875, 0.53466796875, 1.443115234375, 2.3515625, 3.260009765625, 4.16845703125, 5.076904296875, 5.9853515625, 6.893798828125, 7.80224609375, 8.710693359375, 9.619140625, 10.527587890625, 11.43603515625, 12.344482421875, 13.2529296875, 14.161376953125, 15.06982421875, 15.978271484375, 16.88671875, 17.795166015625, 18.70361328125, 19.612060546875, 20.5205078125, 21.428955078125, 22.33740234375, 23.245849609375, 24.154296875, 25.062744140625, 25.97119140625, 26.879638671875, 27.7880859375, 28.696533203125, 29.60498046875, 30.513427734375, 31.421875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 11.0, 22.0, 24.0, 37.0, 59.0, 81.0, 134.0, 187.0, 408.0, 875.0, 2839.0, 11760.0, 64051.0, 1147007.0, 1818166.0, 80581.0, 13997.0, 3256.0, 1088.0, 448.0, 250.0, 130.0, 89.0, 68.0, 48.0, 29.0, 22.0, 14.0, 9.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.5625, -37.2353515625, -35.908203125, -34.5810546875, -33.25390625, -31.9267578125, -30.599609375, -29.2724609375, -27.9453125, -26.6181640625, -25.291015625, -23.9638671875, -22.63671875, -21.3095703125, -19.982421875, -18.6552734375, -17.328125, -16.0009765625, -14.673828125, -13.3466796875, -12.01953125, -10.6923828125, -9.365234375, -8.0380859375, -6.7109375, -5.3837890625, -4.056640625, -2.7294921875, -1.40234375, -0.0751953125, 1.251953125, 2.5791015625, 3.90625, 5.2333984375, 6.560546875, 7.8876953125, 9.21484375, 10.5419921875, 11.869140625, 13.1962890625, 14.5234375, 15.8505859375, 17.177734375, 18.5048828125, 19.83203125, 21.1591796875, 22.486328125, 23.8134765625, 25.140625, 26.4677734375, 27.794921875, 29.1220703125, 30.44921875, 31.7763671875, 33.103515625, 34.4306640625, 35.7578125, 37.0849609375, 38.412109375, 39.7392578125, 41.06640625, 42.3935546875, 43.720703125, 45.0478515625, 46.375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 9.0, 29.0, 118.0, 271.0, 303.0, 181.0, 74.0, 18.0, 8.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.94976806640625, -106.17694091796875, -101.40411376953125, -96.63127899169922, -91.85845184326172, -87.08562469482422, -82.31278991699219, -77.53996276855469, -72.76713562011719, -67.99430847167969, -63.22147750854492, -58.448646545410156, -53.675819396972656, -48.902992248535156, -44.13016128540039, -39.357330322265625, -34.584503173828125, -29.811674118041992, -25.03884506225586, -20.266016006469727, -15.493186950683594, -10.720357894897461, -5.947528839111328, -1.1746978759765625, 3.5981292724609375, 8.37095832824707, 13.143787384033203, 17.916616439819336, 22.68944549560547, 27.4622745513916, 32.235103607177734, 37.0079345703125, 41.78077697753906, 46.55360412597656, 51.32643508911133, 56.099266052246094, 60.872093200683594, 65.6449203491211, 70.41775512695312, 75.19058227539062, 79.96340942382812, 84.73623657226562, 89.50906372070312, 94.28189849853516, 99.05472564697266, 103.82755279541016, 108.60038757324219, 113.37321472167969, 118.14604187011719, 122.91886901855469, 127.69169616699219, 132.4645233154297, 137.23736572265625, 142.01019287109375, 146.78302001953125, 151.55584716796875, 156.32867431640625, 161.10150146484375, 165.87432861328125, 170.64715576171875, 175.41998291015625, 180.1928253173828, 184.9656524658203, 189.7384796142578, 194.5113067626953]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 1.0, 5.0, 6.0, 4.0, 2.0, 3.0, 10.0, 2.0, 9.0, 21.0, 22.0, 17.0, 17.0, 19.0, 22.0, 33.0, 32.0, 30.0, 26.0, 36.0, 33.0, 32.0, 46.0, 42.0, 31.0, 42.0, 34.0, 42.0, 39.0, 40.0, 35.0, 25.0, 41.0, 31.0, 30.0, 14.0, 20.0, 15.0, 25.0, 15.0, 11.0, 5.0, 10.0, 5.0, 8.0, 2.0, 4.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-63.461021423339844, -61.39417266845703, -59.32732391357422, -57.260475158691406, -55.193626403808594, -53.12677764892578, -51.05992889404297, -48.993080139160156, -46.926231384277344, -44.85938262939453, -42.79253387451172, -40.725685119628906, -38.658836364746094, -36.59198760986328, -34.52513885498047, -32.458290100097656, -30.391441345214844, -28.32459259033203, -26.25774383544922, -24.190895080566406, -22.124046325683594, -20.05719757080078, -17.99034881591797, -15.923500061035156, -13.856651306152344, -11.789802551269531, -9.722953796386719, -7.656105041503906, -5.589256286621094, -3.5224075317382812, -1.4555587768554688, 0.6112899780273438, 2.678131103515625, 4.7449798583984375, 6.81182861328125, 8.878677368164062, 10.945526123046875, 13.012374877929688, 15.0792236328125, 17.146072387695312, 19.212921142578125, 21.279769897460938, 23.34661865234375, 25.413467407226562, 27.480316162109375, 29.547164916992188, 31.614013671875, 33.68086242675781, 35.747711181640625, 37.81455993652344, 39.88140869140625, 41.94825744628906, 44.015106201171875, 46.08195495605469, 48.1488037109375, 50.21565246582031, 52.282501220703125, 54.34934997558594, 56.41619873046875, 58.48304748535156, 60.549896240234375, 62.61674499511719, 64.68359375, 66.75044250488281, 68.81729125976562]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 5.0, 6.0, 5.0, 13.0, 8.0, 17.0, 19.0, 20.0, 16.0, 29.0, 24.0, 34.0, 38.0, 29.0, 46.0, 39.0, 39.0, 39.0, 44.0, 36.0, 54.0, 49.0, 48.0, 41.0, 43.0, 42.0, 33.0, 30.0, 26.0, 20.0, 14.0, 15.0, 14.0, 14.0, 8.0, 10.0, 7.0, 8.0, 5.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.390625, -10.9879150390625, -10.585205078125, -10.1824951171875, -9.77978515625, -9.3770751953125, -8.974365234375, -8.5716552734375, -8.1689453125, -7.7662353515625, -7.363525390625, -6.9608154296875, -6.55810546875, -6.1553955078125, -5.752685546875, -5.3499755859375, -4.947265625, -4.5445556640625, -4.141845703125, -3.7391357421875, -3.33642578125, -2.9337158203125, -2.531005859375, -2.1282958984375, -1.7255859375, -1.3228759765625, -0.920166015625, -0.5174560546875, -0.11474609375, 0.2879638671875, 0.690673828125, 1.0933837890625, 1.49609375, 1.8988037109375, 2.301513671875, 2.7042236328125, 3.10693359375, 3.5096435546875, 3.912353515625, 4.3150634765625, 4.7177734375, 5.1204833984375, 5.523193359375, 5.9259033203125, 6.32861328125, 6.7313232421875, 7.134033203125, 7.5367431640625, 7.939453125, 8.3421630859375, 8.744873046875, 9.1475830078125, 9.55029296875, 9.9530029296875, 10.355712890625, 10.7584228515625, 11.1611328125, 11.5638427734375, 11.966552734375, 12.3692626953125, 12.77197265625, 13.1746826171875, 13.577392578125, 13.9801025390625, 14.3828125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 8.0, 3.0, 7.0, 18.0, 15.0, 14.0, 30.0, 42.0, 60.0, 75.0, 144.0, 180.0, 255.0, 375.0, 553.0, 810.0, 1218.0, 1961.0, 3175.0, 5163.0, 8922.0, 15927.0, 32486.0, 84763.0, 354102.0, 1735327.0, 1511900.0, 295826.0, 74354.0, 29494.0, 14888.0, 8494.0, 4830.0, 3053.0, 1992.0, 1270.0, 789.0, 560.0, 371.0, 243.0, 164.0, 112.0, 101.0, 67.0, 38.0, 31.0, 17.0, 17.0, 10.0, 10.0, 5.0, 8.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.90625, -19.31982421875, -18.7333984375, -18.14697265625, -17.560546875, -16.97412109375, -16.3876953125, -15.80126953125, -15.21484375, -14.62841796875, -14.0419921875, -13.45556640625, -12.869140625, -12.28271484375, -11.6962890625, -11.10986328125, -10.5234375, -9.93701171875, -9.3505859375, -8.76416015625, -8.177734375, -7.59130859375, -7.0048828125, -6.41845703125, -5.83203125, -5.24560546875, -4.6591796875, -4.07275390625, -3.486328125, -2.89990234375, -2.3134765625, -1.72705078125, -1.140625, -0.55419921875, 0.0322265625, 0.61865234375, 1.205078125, 1.79150390625, 2.3779296875, 2.96435546875, 3.55078125, 4.13720703125, 4.7236328125, 5.31005859375, 5.896484375, 6.48291015625, 7.0693359375, 7.65576171875, 8.2421875, 8.82861328125, 9.4150390625, 10.00146484375, 10.587890625, 11.17431640625, 11.7607421875, 12.34716796875, 12.93359375, 13.52001953125, 14.1064453125, 14.69287109375, 15.279296875, 15.86572265625, 16.4521484375, 17.03857421875, 17.625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 4.0, 10.0, 5.0, 11.0, 14.0, 21.0, 19.0, 23.0, 32.0, 27.0, 68.0, 73.0, 100.0, 159.0, 218.0, 312.0, 510.0, 633.0, 561.0, 392.0, 259.0, 170.0, 120.0, 75.0, 62.0, 51.0, 23.0, 24.0, 23.0, 11.0, 11.0, 14.0, 7.0, 6.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-22.203125, -21.563232421875, -20.92333984375, -20.283447265625, -19.6435546875, -19.003662109375, -18.36376953125, -17.723876953125, -17.083984375, -16.444091796875, -15.80419921875, -15.164306640625, -14.5244140625, -13.884521484375, -13.24462890625, -12.604736328125, -11.96484375, -11.324951171875, -10.68505859375, -10.045166015625, -9.4052734375, -8.765380859375, -8.12548828125, -7.485595703125, -6.845703125, -6.205810546875, -5.56591796875, -4.926025390625, -4.2861328125, -3.646240234375, -3.00634765625, -2.366455078125, -1.7265625, -1.086669921875, -0.44677734375, 0.193115234375, 0.8330078125, 1.472900390625, 2.11279296875, 2.752685546875, 3.392578125, 4.032470703125, 4.67236328125, 5.312255859375, 5.9521484375, 6.592041015625, 7.23193359375, 7.871826171875, 8.51171875, 9.151611328125, 9.79150390625, 10.431396484375, 11.0712890625, 11.711181640625, 12.35107421875, 12.990966796875, 13.630859375, 14.270751953125, 14.91064453125, 15.550537109375, 16.1904296875, 16.830322265625, 17.47021484375, 18.110107421875, 18.75]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 5.0, 2.0, 6.0, 23.0, 10.0, 18.0, 34.0, 42.0, 55.0, 86.0, 117.0, 169.0, 282.0, 492.0, 846.0, 1672.0, 3237.0, 6668.0, 14396.0, 35064.0, 106600.0, 586565.0, 2803919.0, 480308.0, 95215.0, 32324.0, 13523.0, 5972.0, 2975.0, 1578.0, 793.0, 473.0, 270.0, 179.0, 87.0, 84.0, 49.0, 39.0, 37.0, 26.0, 10.0, 11.0, 5.0, 4.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.109375, -28.153564453125, -27.19775390625, -26.241943359375, -25.2861328125, -24.330322265625, -23.37451171875, -22.418701171875, -21.462890625, -20.507080078125, -19.55126953125, -18.595458984375, -17.6396484375, -16.683837890625, -15.72802734375, -14.772216796875, -13.81640625, -12.860595703125, -11.90478515625, -10.948974609375, -9.9931640625, -9.037353515625, -8.08154296875, -7.125732421875, -6.169921875, -5.214111328125, -4.25830078125, -3.302490234375, -2.3466796875, -1.390869140625, -0.43505859375, 0.520751953125, 1.4765625, 2.432373046875, 3.38818359375, 4.343994140625, 5.2998046875, 6.255615234375, 7.21142578125, 8.167236328125, 9.123046875, 10.078857421875, 11.03466796875, 11.990478515625, 12.9462890625, 13.902099609375, 14.85791015625, 15.813720703125, 16.76953125, 17.725341796875, 18.68115234375, 19.636962890625, 20.5927734375, 21.548583984375, 22.50439453125, 23.460205078125, 24.416015625, 25.371826171875, 26.32763671875, 27.283447265625, 28.2392578125, 29.195068359375, 30.15087890625, 31.106689453125, 32.0625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 11.0, 31.0, 47.0, 73.0, 110.0, 161.0, 179.0, 143.0, 110.0, 73.0, 29.0, 21.0, 9.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.40711212158203, -116.99440002441406, -112.58168029785156, -108.1689682006836, -103.75625610351562, -99.34353637695312, -94.93082427978516, -90.51811218261719, -86.10539245605469, -81.69268035888672, -77.27996063232422, -72.86724853515625, -68.45453643798828, -64.04182434082031, -59.62910461425781, -55.216392517089844, -50.803680419921875, -46.39096450805664, -41.97825241088867, -37.56553649902344, -33.15282440185547, -28.740108489990234, -24.327392578125, -19.9146785736084, -15.501964569091797, -11.089250564575195, -6.676535606384277, -2.2638206481933594, 2.148893356323242, 6.561607360839844, 10.974323272705078, 15.38703727722168, 19.799758911132812, 24.212472915649414, 28.625186920166016, 33.03790283203125, 37.45061492919922, 41.86333084106445, 46.27604675292969, 50.688758850097656, 55.10147476196289, 59.514190673828125, 63.926902770996094, 68.33961486816406, 72.75233459472656, 77.16504669189453, 81.5777587890625, 85.990478515625, 90.40319061279297, 94.81590270996094, 99.22862243652344, 103.6413345336914, 108.05404663085938, 112.46676635742188, 116.87947845458984, 121.29219055175781, 125.70491027832031, 130.1176300048828, 134.53033447265625, 138.94305419921875, 143.35577392578125, 147.7684783935547, 152.1811981201172, 156.5939178466797, 161.00662231445312]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 9.0, 5.0, 5.0, 12.0, 15.0, 13.0, 20.0, 12.0, 22.0, 18.0, 25.0, 33.0, 22.0, 33.0, 33.0, 36.0, 23.0, 42.0, 44.0, 41.0, 43.0, 38.0, 30.0, 35.0, 29.0, 35.0, 42.0, 25.0, 38.0, 32.0, 38.0, 25.0, 23.0, 18.0, 20.0, 11.0, 11.0, 10.0, 5.0, 8.0, 9.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-74.04548645019531, -71.90771484375, -69.76993560791016, -67.63216400146484, -65.49439239501953, -63.35661315917969, -61.218841552734375, -59.0810661315918, -56.94329071044922, -54.80551528930664, -52.66774368286133, -50.52996826171875, -48.39219284057617, -46.254417419433594, -44.11664581298828, -41.9788703918457, -39.84109878540039, -37.70332336425781, -35.5655517578125, -33.42777633666992, -31.290000915527344, -29.1522274017334, -27.014453887939453, -24.876678466796875, -22.73890495300293, -20.601131439208984, -18.463356018066406, -16.32558250427246, -14.1878080368042, -12.050033569335938, -9.912260055541992, -7.7744855880737305, -5.636711120605469, -3.498936891555786, -1.3611626625061035, 0.776611328125, 2.9143857955932617, 5.052160263061523, 7.189933776855469, 9.32770824432373, 11.465482711791992, 13.603257179260254, 15.741031646728516, 17.87880516052246, 20.016578674316406, 22.154354095458984, 24.29212760925293, 26.429901123046875, 28.567676544189453, 30.7054500579834, 32.843223571777344, 34.98099899291992, 37.1187744140625, 39.25654602050781, 41.39432144165039, 43.53209686279297, 45.66986846923828, 47.80764389038086, 49.94541549682617, 52.08319091796875, 54.22096633911133, 56.358741760253906, 58.49651336669922, 60.6342887878418, 62.772064208984375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 9.0, 6.0, 9.0, 10.0, 8.0, 17.0, 17.0, 23.0, 15.0, 36.0, 27.0, 24.0, 21.0, 40.0, 28.0, 39.0, 42.0, 36.0, 38.0, 35.0, 34.0, 36.0, 45.0, 39.0, 40.0, 29.0, 40.0, 34.0, 26.0, 28.0, 29.0, 20.0, 15.0, 20.0, 12.0, 8.0, 12.0, 13.0, 7.0, 2.0, 5.0, 5.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-12.4140625, -12.0390625, -11.6640625, -11.2890625, -10.9140625, -10.5390625, -10.1640625, -9.7890625, -9.4140625, -9.0390625, -8.6640625, -8.2890625, -7.9140625, -7.5390625, -7.1640625, -6.7890625, -6.4140625, -6.0390625, -5.6640625, -5.2890625, -4.9140625, -4.5390625, -4.1640625, -3.7890625, -3.4140625, -3.0390625, -2.6640625, -2.2890625, -1.9140625, -1.5390625, -1.1640625, -0.7890625, -0.4140625, -0.0390625, 0.3359375, 0.7109375, 1.0859375, 1.4609375, 1.8359375, 2.2109375, 2.5859375, 2.9609375, 3.3359375, 3.7109375, 4.0859375, 4.4609375, 4.8359375, 5.2109375, 5.5859375, 5.9609375, 6.3359375, 6.7109375, 7.0859375, 7.4609375, 7.8359375, 8.2109375, 8.5859375, 8.9609375, 9.3359375, 9.7109375, 10.0859375, 10.4609375, 10.8359375, 11.2109375, 11.5859375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 10.0, 7.0, 20.0, 13.0, 39.0, 49.0, 47.0, 61.0, 106.0, 155.0, 203.0, 319.0, 514.0, 764.0, 1080.0, 1856.0, 3009.0, 4930.0, 8207.0, 14012.0, 24670.0, 45167.0, 85517.0, 161265.0, 261549.0, 198696.0, 106909.0, 56227.0, 30482.0, 17305.0, 9863.0, 5849.0, 3471.0, 2215.0, 1362.0, 882.0, 579.0, 344.0, 228.0, 174.0, 149.0, 72.0, 60.0, 41.0, 27.0, 17.0, 11.0, 8.0, 8.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.861328125, -1.8025665283203125, -1.743804931640625, -1.6850433349609375, -1.62628173828125, -1.5675201416015625, -1.508758544921875, -1.4499969482421875, -1.3912353515625, -1.3324737548828125, -1.273712158203125, -1.2149505615234375, -1.15618896484375, -1.0974273681640625, -1.038665771484375, -0.9799041748046875, -0.921142578125, -0.8623809814453125, -0.803619384765625, -0.7448577880859375, -0.68609619140625, -0.6273345947265625, -0.568572998046875, -0.5098114013671875, -0.4510498046875, -0.3922882080078125, -0.333526611328125, -0.2747650146484375, -0.21600341796875, -0.1572418212890625, -0.098480224609375, -0.0397186279296875, 0.01904296875, 0.0778045654296875, 0.136566162109375, 0.1953277587890625, 0.25408935546875, 0.3128509521484375, 0.371612548828125, 0.4303741455078125, 0.4891357421875, 0.5478973388671875, 0.606658935546875, 0.6654205322265625, 0.72418212890625, 0.7829437255859375, 0.841705322265625, 0.9004669189453125, 0.959228515625, 1.0179901123046875, 1.076751708984375, 1.1355133056640625, 1.19427490234375, 1.2530364990234375, 1.311798095703125, 1.3705596923828125, 1.4293212890625, 1.4880828857421875, 1.546844482421875, 1.6056060791015625, 1.66436767578125, 1.7231292724609375, 1.781890869140625, 1.8406524658203125, 1.8994140625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 0.0, 3.0, 6.0, 3.0, 7.0, 8.0, 9.0, 10.0, 11.0, 14.0, 16.0, 17.0, 15.0, 22.0, 29.0, 15.0, 34.0, 32.0, 34.0, 29.0, 32.0, 38.0, 56.0, 27.0, 1054.0, 48.0, 34.0, 41.0, 36.0, 36.0, 27.0, 27.0, 25.0, 28.0, 25.0, 24.0, 18.0, 21.0, 21.0, 12.0, 21.0, 13.0, 10.0, 7.0, 15.0, 7.0, 8.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8046875, -6.5694580078125, -6.334228515625, -6.0989990234375, -5.86376953125, -5.6285400390625, -5.393310546875, -5.1580810546875, -4.9228515625, -4.6876220703125, -4.452392578125, -4.2171630859375, -3.98193359375, -3.7467041015625, -3.511474609375, -3.2762451171875, -3.041015625, -2.8057861328125, -2.570556640625, -2.3353271484375, -2.10009765625, -1.8648681640625, -1.629638671875, -1.3944091796875, -1.1591796875, -0.9239501953125, -0.688720703125, -0.4534912109375, -0.21826171875, 0.0169677734375, 0.252197265625, 0.4874267578125, 0.72265625, 0.9578857421875, 1.193115234375, 1.4283447265625, 1.66357421875, 1.8988037109375, 2.134033203125, 2.3692626953125, 2.6044921875, 2.8397216796875, 3.074951171875, 3.3101806640625, 3.54541015625, 3.7806396484375, 4.015869140625, 4.2510986328125, 4.486328125, 4.7215576171875, 4.956787109375, 5.1920166015625, 5.42724609375, 5.6624755859375, 5.897705078125, 6.1329345703125, 6.3681640625, 6.6033935546875, 6.838623046875, 7.0738525390625, 7.30908203125, 7.5443115234375, 7.779541015625, 8.0147705078125, 8.25]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 9.0, 4.0, 10.0, 11.0, 14.0, 25.0, 30.0, 56.0, 78.0, 128.0, 170.0, 285.0, 376.0, 647.0, 1166.0, 2036.0, 3794.0, 7241.0, 14558.0, 30572.0, 65779.0, 151593.0, 1218099.0, 369897.0, 124042.0, 54697.0, 25389.0, 12408.0, 6284.0, 3217.0, 1806.0, 1007.0, 581.0, 385.0, 240.0, 134.0, 116.0, 71.0, 55.0, 31.0, 22.0, 16.0, 11.0, 7.0, 7.0, 8.0, 4.0, 7.0, 2.0, 5.0, 1.0, 2.0], "bins": [-1.275390625, -1.23883056640625, -1.2022705078125, -1.16571044921875, -1.129150390625, -1.09259033203125, -1.0560302734375, -1.01947021484375, -0.98291015625, -0.94635009765625, -0.9097900390625, -0.87322998046875, -0.836669921875, -0.80010986328125, -0.7635498046875, -0.72698974609375, -0.6904296875, -0.65386962890625, -0.6173095703125, -0.58074951171875, -0.544189453125, -0.50762939453125, -0.4710693359375, -0.43450927734375, -0.39794921875, -0.36138916015625, -0.3248291015625, -0.28826904296875, -0.251708984375, -0.21514892578125, -0.1785888671875, -0.14202880859375, -0.10546875, -0.06890869140625, -0.0323486328125, 0.00421142578125, 0.040771484375, 0.07733154296875, 0.1138916015625, 0.15045166015625, 0.18701171875, 0.22357177734375, 0.2601318359375, 0.29669189453125, 0.333251953125, 0.36981201171875, 0.4063720703125, 0.44293212890625, 0.4794921875, 0.51605224609375, 0.5526123046875, 0.58917236328125, 0.625732421875, 0.66229248046875, 0.6988525390625, 0.73541259765625, 0.77197265625, 0.80853271484375, 0.8450927734375, 0.88165283203125, 0.918212890625, 0.95477294921875, 0.9913330078125, 1.02789306640625, 1.064453125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 3.0, 5.0, 5.0, 8.0, 9.0, 12.0, 19.0, 32.0, 44.0, 92.0, 462.0, 110.0, 54.0, 24.0, 18.0, 9.0, 6.0, 9.0, 6.0, 2.0, 6.0, 9.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.445556640625, -0.4322547912597656, -0.41895294189453125, -0.4056510925292969, -0.3923492431640625, -0.3790473937988281, -0.36574554443359375, -0.3524436950683594, -0.339141845703125, -0.3258399963378906, -0.31253814697265625, -0.2992362976074219, -0.2859344482421875, -0.2726325988769531, -0.25933074951171875, -0.24602890014648438, -0.23272705078125, -0.21942520141601562, -0.20612335205078125, -0.19282150268554688, -0.1795196533203125, -0.16621780395507812, -0.15291595458984375, -0.13961410522460938, -0.126312255859375, -0.11301040649414062, -0.09970855712890625, -0.08640670776367188, -0.0731048583984375, -0.059803009033203125, -0.04650115966796875, -0.033199310302734375, -0.0198974609375, -0.006595611572265625, 0.00670623779296875, 0.020008087158203125, 0.0333099365234375, 0.046611785888671875, 0.05991363525390625, 0.07321548461914062, 0.086517333984375, 0.09981918334960938, 0.11312103271484375, 0.12642288208007812, 0.1397247314453125, 0.15302658081054688, 0.16632843017578125, 0.17963027954101562, 0.19293212890625, 0.20623397827148438, 0.21953582763671875, 0.23283767700195312, 0.2461395263671875, 0.2594413757324219, 0.27274322509765625, 0.2860450744628906, 0.299346923828125, 0.3126487731933594, 0.32595062255859375, 0.3392524719238281, 0.3525543212890625, 0.3658561706542969, 0.37915802001953125, 0.3924598693847656, 0.40576171875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 3.0, 2.0, 5.0, 3.0, 2.0, 8.0, 6.0, 12.0, 10.0, 8.0, 10.0, 18.0, 25.0, 21.0, 48.0, 69.0, 161.0, 604.0, 8852.0, 1028661.0, 8999.0, 592.0, 163.0, 78.0, 50.0, 27.0, 20.0, 16.0, 12.0, 10.0, 8.0, 6.0, 8.0, 10.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.68359375, -7.43170166015625, -7.1798095703125, -6.92791748046875, -6.676025390625, -6.42413330078125, -6.1722412109375, -5.92034912109375, -5.66845703125, -5.41656494140625, -5.1646728515625, -4.91278076171875, -4.660888671875, -4.40899658203125, -4.1571044921875, -3.90521240234375, -3.6533203125, -3.40142822265625, -3.1495361328125, -2.89764404296875, -2.645751953125, -2.39385986328125, -2.1419677734375, -1.89007568359375, -1.63818359375, -1.38629150390625, -1.1343994140625, -0.88250732421875, -0.630615234375, -0.37872314453125, -0.1268310546875, 0.12506103515625, 0.376953125, 0.62884521484375, 0.8807373046875, 1.13262939453125, 1.384521484375, 1.63641357421875, 1.8883056640625, 2.14019775390625, 2.39208984375, 2.64398193359375, 2.8958740234375, 3.14776611328125, 3.399658203125, 3.65155029296875, 3.9034423828125, 4.15533447265625, 4.4072265625, 4.65911865234375, 4.9110107421875, 5.16290283203125, 5.414794921875, 5.66668701171875, 5.9185791015625, 6.17047119140625, 6.42236328125, 6.67425537109375, 6.9261474609375, 7.17803955078125, 7.429931640625, 7.68182373046875, 7.9337158203125, 8.18560791015625, 8.4375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 15.0, 22.0, 31.0, 90.0, 235.0, 408.0, 119.0, 53.0, 13.0, 13.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0584172010421753, -1.0036890506744385, -0.9489607810974121, -0.8942325711250305, -0.8395043611526489, -0.7847761511802673, -0.7300479412078857, -0.6753197312355042, -0.6205915212631226, -0.565863311290741, -0.5111351013183594, -0.4564068913459778, -0.4016786813735962, -0.3469504714012146, -0.292222261428833, -0.23749405145645142, -0.18276584148406982, -0.12803763151168823, -0.07330942153930664, -0.01858121156692505, 0.03614699840545654, 0.09087520837783813, 0.14560341835021973, 0.20033162832260132, 0.2550598382949829, 0.3097880482673645, 0.3645162582397461, 0.4192444682121277, 0.4739726781845093, 0.5287008881568909, 0.5834290981292725, 0.638157308101654, 0.6928856372833252, 0.7476138472557068, 0.8023420572280884, 0.85707026720047, 0.9117984771728516, 0.9665266871452332, 1.0212548971176147, 1.0759830474853516, 1.130711317062378, 1.1854395866394043, 1.2401677370071411, 1.294895887374878, 1.3496241569519043, 1.4043524265289307, 1.4590805768966675, 1.5138087272644043, 1.5685369968414307, 1.623265266418457, 1.6779934167861938, 1.7327215671539307, 1.787449836730957, 1.8421781063079834, 1.8969062566757202, 1.951634407043457, 2.0063626766204834, 2.0610909461975098, 2.115818977355957, 2.1705472469329834, 2.2252755165100098, 2.280003786087036, 2.3347320556640625, 2.3894600868225098, 2.444188356399536]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 7.0, 7.0, 4.0, 9.0, 8.0, 11.0, 16.0, 24.0, 14.0, 20.0, 20.0, 27.0, 13.0, 36.0, 25.0, 34.0, 34.0, 35.0, 36.0, 44.0, 39.0, 57.0, 33.0, 35.0, 33.0, 48.0, 36.0, 29.0, 22.0, 27.0, 22.0, 19.0, 25.0, 18.0, 20.0, 22.0, 15.0, 17.0, 7.0, 14.0, 10.0, 2.0, 7.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.5580988526344299, -0.5399051904678345, -0.521711528301239, -0.5035178661346436, -0.4853241741657257, -0.46713051199913025, -0.4489368200302124, -0.43074315786361694, -0.4125494956970215, -0.394355833530426, -0.37616217136383057, -0.3579684793949127, -0.33977481722831726, -0.3215811550617218, -0.30338746309280396, -0.2851938009262085, -0.26700013875961304, -0.24880647659301758, -0.23061279952526093, -0.21241912245750427, -0.1942254602909088, -0.17603179812431335, -0.1578381210565567, -0.13964444398880005, -0.12145078182220459, -0.10325711220502853, -0.08506344258785248, -0.06686977297067642, -0.048676103353500366, -0.03048243373632431, -0.012288764119148254, 0.0059049129486083984, 0.024098515510559082, 0.04229218512773514, 0.060485854744911194, 0.07867952436208725, 0.0968731939792633, 0.11506686359643936, 0.13326053321361542, 0.15145421028137207, 0.16964787244796753, 0.187841534614563, 0.20603521168231964, 0.2242288887500763, 0.24242255091667175, 0.2606162130832672, 0.27880990505218506, 0.2970035672187805, 0.315197229385376, 0.33339089155197144, 0.3515845537185669, 0.36977824568748474, 0.3879719078540802, 0.40616557002067566, 0.4243592619895935, 0.44255292415618896, 0.4607465863227844, 0.4789402484893799, 0.49713391065597534, 0.5153275728225708, 0.533521294593811, 0.5517149567604065, 0.569908618927002, 0.5881022810935974, 0.6062959432601929]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 5.0, 5.0, 3.0, 9.0, 6.0, 10.0, 10.0, 9.0, 14.0, 19.0, 22.0, 16.0, 35.0, 28.0, 24.0, 22.0, 39.0, 28.0, 39.0, 41.0, 35.0, 40.0, 33.0, 34.0, 39.0, 40.0, 41.0, 42.0, 31.0, 36.0, 36.0, 26.0, 27.0, 27.0, 24.0, 13.0, 19.0, 12.0, 9.0, 12.0, 13.0, 7.0, 2.0, 4.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-12.4140625, -12.0389404296875, -11.663818359375, -11.2886962890625, -10.91357421875, -10.5384521484375, -10.163330078125, -9.7882080078125, -9.4130859375, -9.0379638671875, -8.662841796875, -8.2877197265625, -7.91259765625, -7.5374755859375, -7.162353515625, -6.7872314453125, -6.412109375, -6.0369873046875, -5.661865234375, -5.2867431640625, -4.91162109375, -4.5364990234375, -4.161376953125, -3.7862548828125, -3.4111328125, -3.0360107421875, -2.660888671875, -2.2857666015625, -1.91064453125, -1.5355224609375, -1.160400390625, -0.7852783203125, -0.41015625, -0.0350341796875, 0.340087890625, 0.7152099609375, 1.09033203125, 1.4654541015625, 1.840576171875, 2.2156982421875, 2.5908203125, 2.9659423828125, 3.341064453125, 3.7161865234375, 4.09130859375, 4.4664306640625, 4.841552734375, 5.2166748046875, 5.591796875, 5.9669189453125, 6.342041015625, 6.7171630859375, 7.09228515625, 7.4674072265625, 7.842529296875, 8.2176513671875, 8.5927734375, 8.9678955078125, 9.343017578125, 9.7181396484375, 10.09326171875, 10.4683837890625, 10.843505859375, 11.2186279296875, 11.59375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 8.0, 15.0, 23.0, 28.0, 46.0, 46.0, 92.0, 122.0, 165.0, 251.0, 404.0, 611.0, 963.0, 1510.0, 2428.0, 4171.0, 7168.0, 13051.0, 25144.0, 50447.0, 114347.0, 324507.0, 296869.0, 105698.0, 47192.0, 23397.0, 12454.0, 6823.0, 4021.0, 2350.0, 1436.0, 938.0, 609.0, 394.0, 271.0, 170.0, 114.0, 86.0, 50.0, 33.0, 17.0, 29.0, 15.0, 14.0, 9.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-20.0625, -19.4716796875, -18.880859375, -18.2900390625, -17.69921875, -17.1083984375, -16.517578125, -15.9267578125, -15.3359375, -14.7451171875, -14.154296875, -13.5634765625, -12.97265625, -12.3818359375, -11.791015625, -11.2001953125, -10.609375, -10.0185546875, -9.427734375, -8.8369140625, -8.24609375, -7.6552734375, -7.064453125, -6.4736328125, -5.8828125, -5.2919921875, -4.701171875, -4.1103515625, -3.51953125, -2.9287109375, -2.337890625, -1.7470703125, -1.15625, -0.5654296875, 0.025390625, 0.6162109375, 1.20703125, 1.7978515625, 2.388671875, 2.9794921875, 3.5703125, 4.1611328125, 4.751953125, 5.3427734375, 5.93359375, 6.5244140625, 7.115234375, 7.7060546875, 8.296875, 8.8876953125, 9.478515625, 10.0693359375, 10.66015625, 11.2509765625, 11.841796875, 12.4326171875, 13.0234375, 13.6142578125, 14.205078125, 14.7958984375, 15.38671875, 15.9775390625, 16.568359375, 17.1591796875, 17.75]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 8.0, 9.0, 8.0, 10.0, 14.0, 24.0, 20.0, 30.0, 34.0, 36.0, 40.0, 47.0, 76.0, 76.0, 111.0, 192.0, 1424.0, 279.0, 148.0, 91.0, 73.0, 46.0, 35.0, 25.0, 39.0, 29.0, 25.0, 18.0, 13.0, 12.0, 16.0, 9.0, 7.0, 9.0, 5.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.09375, -29.0078125, -27.921875, -26.8359375, -25.75, -24.6640625, -23.578125, -22.4921875, -21.40625, -20.3203125, -19.234375, -18.1484375, -17.0625, -15.9765625, -14.890625, -13.8046875, -12.71875, -11.6328125, -10.546875, -9.4609375, -8.375, -7.2890625, -6.203125, -5.1171875, -4.03125, -2.9453125, -1.859375, -0.7734375, 0.3125, 1.3984375, 2.484375, 3.5703125, 4.65625, 5.7421875, 6.828125, 7.9140625, 9.0, 10.0859375, 11.171875, 12.2578125, 13.34375, 14.4296875, 15.515625, 16.6015625, 17.6875, 18.7734375, 19.859375, 20.9453125, 22.03125, 23.1171875, 24.203125, 25.2890625, 26.375, 27.4609375, 28.546875, 29.6328125, 30.71875, 31.8046875, 32.890625, 33.9765625, 35.0625, 36.1484375, 37.234375, 38.3203125, 39.40625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 11.0, 10.0, 11.0, 11.0, 16.0, 15.0, 41.0, 41.0, 60.0, 73.0, 80.0, 143.0, 203.0, 343.0, 656.0, 1441.0, 3850.0, 12756.0, 56524.0, 607476.0, 2299758.0, 128661.0, 22802.0, 6335.0, 2191.0, 886.0, 448.0, 245.0, 177.0, 105.0, 76.0, 54.0, 38.0, 39.0, 33.0, 18.0, 13.0, 8.0, 11.0, 9.0, 6.0, 7.0, 4.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0], "bins": [-43.84375, -42.5986328125, -41.353515625, -40.1083984375, -38.86328125, -37.6181640625, -36.373046875, -35.1279296875, -33.8828125, -32.6376953125, -31.392578125, -30.1474609375, -28.90234375, -27.6572265625, -26.412109375, -25.1669921875, -23.921875, -22.6767578125, -21.431640625, -20.1865234375, -18.94140625, -17.6962890625, -16.451171875, -15.2060546875, -13.9609375, -12.7158203125, -11.470703125, -10.2255859375, -8.98046875, -7.7353515625, -6.490234375, -5.2451171875, -4.0, -2.7548828125, -1.509765625, -0.2646484375, 0.98046875, 2.2255859375, 3.470703125, 4.7158203125, 5.9609375, 7.2060546875, 8.451171875, 9.6962890625, 10.94140625, 12.1865234375, 13.431640625, 14.6767578125, 15.921875, 17.1669921875, 18.412109375, 19.6572265625, 20.90234375, 22.1474609375, 23.392578125, 24.6376953125, 25.8828125, 27.1279296875, 28.373046875, 29.6181640625, 30.86328125, 32.1083984375, 33.353515625, 34.5986328125, 35.84375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 144.0, 611.0, 235.0, 19.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-188.13589477539062, -175.244140625, -162.35238647460938, -149.46063232421875, -136.56887817382812, -123.67711639404297, -110.78535461425781, -97.89360046386719, -85.00184631347656, -72.11009216308594, -59.21833419799805, -46.326576232910156, -33.43482208251953, -20.543067932128906, -7.65130615234375, 5.240447998046875, 18.1322021484375, 31.023958206176758, 43.915714263916016, 56.807472229003906, 69.69922637939453, 82.59098052978516, 95.48274230957031, 108.37449645996094, 121.26625061035156, 134.1580047607422, 147.0497589111328, 159.9415283203125, 172.83328247070312, 185.72503662109375, 198.61679077148438, 211.508544921875, 224.4002685546875, 237.29202270507812, 250.18377685546875, 263.0755310058594, 275.96728515625, 288.8590393066406, 301.75079345703125, 314.642578125, 327.5343017578125, 340.4260559082031, 353.31781005859375, 366.2095642089844, 379.101318359375, 391.9930725097656, 404.88482666015625, 417.776611328125, 430.6683654785156, 443.56011962890625, 456.4518737792969, 469.3436279296875, 482.2353820800781, 495.12713623046875, 508.0189208984375, 520.91064453125, 533.8024291992188, 546.6942138671875, 559.5859375, 572.4777221679688, 585.3694458007812, 598.26123046875, 611.1529541015625, 624.0447387695312, 636.9364624023438]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 4.0, 6.0, 10.0, 7.0, 7.0, 15.0, 10.0, 18.0, 17.0, 15.0, 27.0, 18.0, 30.0, 28.0, 38.0, 31.0, 37.0, 40.0, 32.0, 32.0, 33.0, 25.0, 42.0, 35.0, 47.0, 40.0, 37.0, 35.0, 26.0, 30.0, 29.0, 24.0, 26.0, 21.0, 16.0, 22.0, 7.0, 11.0, 14.0, 11.0, 9.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0], "bins": [-73.77397155761719, -71.63825988769531, -69.50255584716797, -67.3668441772461, -65.23114013671875, -63.095428466796875, -60.959720611572266, -58.824012756347656, -56.68830108642578, -54.55259323120117, -52.41688537597656, -50.28117370605469, -48.14546585083008, -46.00975799560547, -43.87405014038086, -41.73834228515625, -39.60263442993164, -37.46692657470703, -35.33121871948242, -33.19551086425781, -31.059799194335938, -28.924091339111328, -26.78838348388672, -24.65267562866211, -22.516965866088867, -20.381258010864258, -18.245548248291016, -16.109840393066406, -13.97413158416748, -11.838422775268555, -9.702714920043945, -7.5670061111450195, -5.431301116943359, -3.2955925464630127, -1.159883975982666, 0.9758243560791016, 3.1115331649780273, 5.247241973876953, 7.3829498291015625, 9.518658638000488, 11.654367446899414, 13.79007625579834, 15.925785064697266, 18.061492919921875, 20.197200775146484, 22.332910537719727, 24.468618392944336, 26.604328155517578, 28.740036010742188, 30.875743865966797, 33.011451721191406, 35.14716339111328, 37.28287124633789, 39.4185791015625, 41.55428695678711, 43.68999481201172, 45.825706481933594, 47.9614143371582, 50.09712219238281, 52.23283386230469, 54.3685417175293, 56.504249572753906, 58.639957427978516, 60.775665283203125, 62.911373138427734]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 2.0, 7.0, 5.0, 3.0, 12.0, 14.0, 16.0, 13.0, 19.0, 22.0, 32.0, 23.0, 33.0, 22.0, 34.0, 25.0, 37.0, 31.0, 41.0, 49.0, 39.0, 40.0, 51.0, 43.0, 35.0, 37.0, 33.0, 32.0, 32.0, 29.0, 29.0, 21.0, 14.0, 21.0, 20.0, 14.0, 14.0, 9.0, 9.0, 7.0, 3.0, 10.0, 1.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-12.921875, -12.533935546875, -12.14599609375, -11.758056640625, -11.3701171875, -10.982177734375, -10.59423828125, -10.206298828125, -9.818359375, -9.430419921875, -9.04248046875, -8.654541015625, -8.2666015625, -7.878662109375, -7.49072265625, -7.102783203125, -6.71484375, -6.326904296875, -5.93896484375, -5.551025390625, -5.1630859375, -4.775146484375, -4.38720703125, -3.999267578125, -3.611328125, -3.223388671875, -2.83544921875, -2.447509765625, -2.0595703125, -1.671630859375, -1.28369140625, -0.895751953125, -0.5078125, -0.119873046875, 0.26806640625, 0.656005859375, 1.0439453125, 1.431884765625, 1.81982421875, 2.207763671875, 2.595703125, 2.983642578125, 3.37158203125, 3.759521484375, 4.1474609375, 4.535400390625, 4.92333984375, 5.311279296875, 5.69921875, 6.087158203125, 6.47509765625, 6.863037109375, 7.2509765625, 7.638916015625, 8.02685546875, 8.414794921875, 8.802734375, 9.190673828125, 9.57861328125, 9.966552734375, 10.3544921875, 10.742431640625, 11.13037109375, 11.518310546875, 11.90625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 6.0, 10.0, 7.0, 9.0, 12.0, 20.0, 22.0, 35.0, 33.0, 42.0, 51.0, 90.0, 111.0, 184.0, 344.0, 778.0, 2566.0, 14877.0, 671443.0, 3468596.0, 29101.0, 3806.0, 1014.0, 415.0, 215.0, 120.0, 81.0, 55.0, 51.0, 38.0, 30.0, 25.0, 16.0, 15.0, 16.0, 12.0, 11.0, 3.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.8125, -91.6669921875, -88.521484375, -85.3759765625, -82.23046875, -79.0849609375, -75.939453125, -72.7939453125, -69.6484375, -66.5029296875, -63.357421875, -60.2119140625, -57.06640625, -53.9208984375, -50.775390625, -47.6298828125, -44.484375, -41.3388671875, -38.193359375, -35.0478515625, -31.90234375, -28.7568359375, -25.611328125, -22.4658203125, -19.3203125, -16.1748046875, -13.029296875, -9.8837890625, -6.73828125, -3.5927734375, -0.447265625, 2.6982421875, 5.84375, 8.9892578125, 12.134765625, 15.2802734375, 18.42578125, 21.5712890625, 24.716796875, 27.8623046875, 31.0078125, 34.1533203125, 37.298828125, 40.4443359375, 43.58984375, 46.7353515625, 49.880859375, 53.0263671875, 56.171875, 59.3173828125, 62.462890625, 65.6083984375, 68.75390625, 71.8994140625, 75.044921875, 78.1904296875, 81.3359375, 84.4814453125, 87.626953125, 90.7724609375, 93.91796875, 97.0634765625, 100.208984375, 103.3544921875, 106.5]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 5.0, 0.0, 9.0, 10.0, 8.0, 11.0, 25.0, 20.0, 30.0, 39.0, 65.0, 80.0, 105.0, 141.0, 231.0, 395.0, 692.0, 776.0, 505.0, 290.0, 167.0, 129.0, 87.0, 69.0, 47.0, 29.0, 31.0, 19.0, 18.0, 8.0, 5.0, 6.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.34375, -19.595458984375, -18.84716796875, -18.098876953125, -17.3505859375, -16.602294921875, -15.85400390625, -15.105712890625, -14.357421875, -13.609130859375, -12.86083984375, -12.112548828125, -11.3642578125, -10.615966796875, -9.86767578125, -9.119384765625, -8.37109375, -7.622802734375, -6.87451171875, -6.126220703125, -5.3779296875, -4.629638671875, -3.88134765625, -3.133056640625, -2.384765625, -1.636474609375, -0.88818359375, -0.139892578125, 0.6083984375, 1.356689453125, 2.10498046875, 2.853271484375, 3.6015625, 4.349853515625, 5.09814453125, 5.846435546875, 6.5947265625, 7.343017578125, 8.09130859375, 8.839599609375, 9.587890625, 10.336181640625, 11.08447265625, 11.832763671875, 12.5810546875, 13.329345703125, 14.07763671875, 14.825927734375, 15.57421875, 16.322509765625, 17.07080078125, 17.819091796875, 18.5673828125, 19.315673828125, 20.06396484375, 20.812255859375, 21.560546875, 22.308837890625, 23.05712890625, 23.805419921875, 24.5537109375, 25.302001953125, 26.05029296875, 26.798583984375, 27.546875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 3.0, 13.0, 15.0, 15.0, 29.0, 37.0, 59.0, 102.0, 180.0, 378.0, 899.0, 2317.0, 7714.0, 32981.0, 240137.0, 3472915.0, 378698.0, 43446.0, 9624.0, 2768.0, 985.0, 420.0, 225.0, 111.0, 64.0, 36.0, 40.0, 29.0, 20.0, 10.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.75, -61.03466796875, -59.3193359375, -57.60400390625, -55.888671875, -54.17333984375, -52.4580078125, -50.74267578125, -49.02734375, -47.31201171875, -45.5966796875, -43.88134765625, -42.166015625, -40.45068359375, -38.7353515625, -37.02001953125, -35.3046875, -33.58935546875, -31.8740234375, -30.15869140625, -28.443359375, -26.72802734375, -25.0126953125, -23.29736328125, -21.58203125, -19.86669921875, -18.1513671875, -16.43603515625, -14.720703125, -13.00537109375, -11.2900390625, -9.57470703125, -7.859375, -6.14404296875, -4.4287109375, -2.71337890625, -0.998046875, 0.71728515625, 2.4326171875, 4.14794921875, 5.86328125, 7.57861328125, 9.2939453125, 11.00927734375, 12.724609375, 14.43994140625, 16.1552734375, 17.87060546875, 19.5859375, 21.30126953125, 23.0166015625, 24.73193359375, 26.447265625, 28.16259765625, 29.8779296875, 31.59326171875, 33.30859375, 35.02392578125, 36.7392578125, 38.45458984375, 40.169921875, 41.88525390625, 43.6005859375, 45.31591796875, 47.03125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 10.0, 12.0, 11.0, 26.0, 36.0, 40.0, 60.0, 116.0, 103.0, 128.0, 117.0, 93.0, 70.0, 64.0, 36.0, 32.0, 25.0, 14.0, 9.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-95.65469360351562, -92.7312240600586, -89.80774688720703, -86.88427734375, -83.96080017089844, -81.0373306274414, -78.11386108398438, -75.19038391113281, -72.26691436767578, -69.34344482421875, -66.41996765136719, -63.496498107910156, -60.57302474975586, -57.64955139160156, -54.726078033447266, -51.80260467529297, -48.87913131713867, -45.955657958984375, -43.03218460083008, -40.10871124267578, -37.18524169921875, -34.26176834106445, -31.338294982910156, -28.414823532104492, -25.491350173950195, -22.5678768157959, -19.644405364990234, -16.720932006835938, -13.797459602355957, -10.873987197875977, -7.95051383972168, -5.027042388916016, -2.1035690307617188, 0.8199036121368408, 3.7433762550354004, 6.666849136352539, 9.59032154083252, 12.5137939453125, 15.437267303466797, 18.36073875427246, 21.284212112426758, 24.207685470581055, 27.13115692138672, 30.054630279541016, 32.97810363769531, 35.901573181152344, 38.825050354003906, 41.74851989746094, 44.671993255615234, 47.59546661376953, 50.51893997192383, 53.442413330078125, 56.365882873535156, 59.28935623168945, 62.21282958984375, 65.13629913330078, 68.05977630615234, 70.98324584960938, 73.90672302246094, 76.83019256591797, 79.75366973876953, 82.67713928222656, 85.60061645507812, 88.52408599853516, 91.44755554199219]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 10.0, 12.0, 5.0, 10.0, 8.0, 20.0, 11.0, 18.0, 28.0, 9.0, 31.0, 22.0, 34.0, 33.0, 30.0, 33.0, 41.0, 44.0, 38.0, 43.0, 49.0, 39.0, 41.0, 38.0, 33.0, 30.0, 36.0, 36.0, 24.0, 39.0, 28.0, 21.0, 14.0, 23.0, 10.0, 12.0, 11.0, 14.0, 14.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.27718353271484, -73.09468841552734, -70.91220092773438, -68.72970581054688, -66.5472183227539, -64.3647232055664, -62.18223571777344, -59.99974060058594, -57.81725311279297, -55.634761810302734, -53.4522705078125, -51.269779205322266, -49.08728790283203, -46.9047966003418, -44.72230529785156, -42.53981018066406, -40.35731887817383, -38.174827575683594, -35.99233627319336, -33.809844970703125, -31.62735366821289, -29.444862365722656, -27.26236915588379, -25.079877853393555, -22.89738655090332, -20.714895248413086, -18.53240394592285, -16.349910736083984, -14.167420387268066, -11.984929084777832, -9.802436828613281, -7.619945526123047, -5.4374542236328125, -3.254962682723999, -1.0724711418151855, 1.110020637512207, 3.2925119400024414, 5.475003242492676, 7.657495498657227, 9.839986801147461, 12.022478103637695, 14.20496940612793, 16.387460708618164, 18.56995391845703, 20.752445220947266, 22.9349365234375, 25.117427825927734, 27.29991912841797, 29.482410430908203, 31.664901733398438, 33.84739303588867, 36.029884338378906, 38.21237564086914, 40.394866943359375, 42.577362060546875, 44.759849548339844, 46.942344665527344, 49.12483596801758, 51.30732727050781, 53.48981857299805, 55.67230987548828, 57.854801177978516, 60.03729248046875, 62.21978759765625, 64.40227508544922]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 8.0, 8.0, 10.0, 10.0, 11.0, 9.0, 16.0, 21.0, 26.0, 15.0, 21.0, 24.0, 31.0, 32.0, 43.0, 39.0, 39.0, 46.0, 48.0, 50.0, 38.0, 57.0, 35.0, 43.0, 41.0, 33.0, 34.0, 20.0, 33.0, 32.0, 19.0, 15.0, 17.0, 9.0, 6.0, 12.0, 11.0, 5.0, 8.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0], "bins": [-14.7578125, -14.345458984375, -13.93310546875, -13.520751953125, -13.1083984375, -12.696044921875, -12.28369140625, -11.871337890625, -11.458984375, -11.046630859375, -10.63427734375, -10.221923828125, -9.8095703125, -9.397216796875, -8.98486328125, -8.572509765625, -8.16015625, -7.747802734375, -7.33544921875, -6.923095703125, -6.5107421875, -6.098388671875, -5.68603515625, -5.273681640625, -4.861328125, -4.448974609375, -4.03662109375, -3.624267578125, -3.2119140625, -2.799560546875, -2.38720703125, -1.974853515625, -1.5625, -1.150146484375, -0.73779296875, -0.325439453125, 0.0869140625, 0.499267578125, 0.91162109375, 1.323974609375, 1.736328125, 2.148681640625, 2.56103515625, 2.973388671875, 3.3857421875, 3.798095703125, 4.21044921875, 4.622802734375, 5.03515625, 5.447509765625, 5.85986328125, 6.272216796875, 6.6845703125, 7.096923828125, 7.50927734375, 7.921630859375, 8.333984375, 8.746337890625, 9.15869140625, 9.571044921875, 9.9833984375, 10.395751953125, 10.80810546875, 11.220458984375, 11.6328125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 18.0, 18.0, 29.0, 62.0, 72.0, 108.0, 177.0, 264.0, 374.0, 629.0, 1000.0, 1647.0, 2898.0, 4890.0, 8377.0, 15051.0, 27147.0, 50111.0, 93757.0, 171531.0, 250232.0, 188504.0, 105068.0, 56557.0, 30665.0, 16855.0, 9335.0, 5271.0, 3088.0, 1802.0, 1082.0, 649.0, 439.0, 248.0, 198.0, 128.0, 96.0, 49.0, 37.0, 24.0, 15.0, 18.0, 6.0, 10.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.7724609375, -1.719696044921875, -1.66693115234375, -1.614166259765625, -1.5614013671875, -1.508636474609375, -1.45587158203125, -1.403106689453125, -1.350341796875, -1.297576904296875, -1.24481201171875, -1.192047119140625, -1.1392822265625, -1.086517333984375, -1.03375244140625, -0.980987548828125, -0.92822265625, -0.875457763671875, -0.82269287109375, -0.769927978515625, -0.7171630859375, -0.664398193359375, -0.61163330078125, -0.558868408203125, -0.506103515625, -0.453338623046875, -0.40057373046875, -0.347808837890625, -0.2950439453125, -0.242279052734375, -0.18951416015625, -0.136749267578125, -0.083984375, -0.031219482421875, 0.02154541015625, 0.074310302734375, 0.1270751953125, 0.179840087890625, 0.23260498046875, 0.285369873046875, 0.338134765625, 0.390899658203125, 0.44366455078125, 0.496429443359375, 0.5491943359375, 0.601959228515625, 0.65472412109375, 0.707489013671875, 0.76025390625, 0.813018798828125, 0.86578369140625, 0.918548583984375, 0.9713134765625, 1.024078369140625, 1.07684326171875, 1.129608154296875, 1.182373046875, 1.235137939453125, 1.28790283203125, 1.340667724609375, 1.3934326171875, 1.446197509765625, 1.49896240234375, 1.551727294921875, 1.6044921875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 11.0, 7.0, 15.0, 11.0, 15.0, 18.0, 25.0, 21.0, 19.0, 25.0, 27.0, 24.0, 37.0, 32.0, 44.0, 41.0, 38.0, 38.0, 41.0, 1063.0, 36.0, 41.0, 50.0, 40.0, 23.0, 32.0, 28.0, 31.0, 22.0, 27.0, 22.0, 18.0, 31.0, 13.0, 13.0, 8.0, 6.0, 4.0, 8.0, 5.0, 3.0, 2.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.38671875, -7.12567138671875, -6.8646240234375, -6.60357666015625, -6.342529296875, -6.08148193359375, -5.8204345703125, -5.55938720703125, -5.29833984375, -5.03729248046875, -4.7762451171875, -4.51519775390625, -4.254150390625, -3.99310302734375, -3.7320556640625, -3.47100830078125, -3.2099609375, -2.94891357421875, -2.6878662109375, -2.42681884765625, -2.165771484375, -1.90472412109375, -1.6436767578125, -1.38262939453125, -1.12158203125, -0.86053466796875, -0.5994873046875, -0.33843994140625, -0.077392578125, 0.18365478515625, 0.4447021484375, 0.70574951171875, 0.966796875, 1.22784423828125, 1.4888916015625, 1.74993896484375, 2.010986328125, 2.27203369140625, 2.5330810546875, 2.79412841796875, 3.05517578125, 3.31622314453125, 3.5772705078125, 3.83831787109375, 4.099365234375, 4.36041259765625, 4.6214599609375, 4.88250732421875, 5.1435546875, 5.40460205078125, 5.6656494140625, 5.92669677734375, 6.187744140625, 6.44879150390625, 6.7098388671875, 6.97088623046875, 7.23193359375, 7.49298095703125, 7.7540283203125, 8.01507568359375, 8.276123046875, 8.53717041015625, 8.7982177734375, 9.05926513671875, 9.3203125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 4.0, 1.0, 4.0, 4.0, 8.0, 8.0, 9.0, 24.0, 35.0, 65.0, 81.0, 110.0, 163.0, 268.0, 380.0, 573.0, 998.0, 1601.0, 2486.0, 3954.0, 6271.0, 10118.0, 16517.0, 26974.0, 45124.0, 77681.0, 134987.0, 660228.0, 777741.0, 136294.0, 78034.0, 45680.0, 27123.0, 16380.0, 10215.0, 6247.0, 3947.0, 2496.0, 1488.0, 982.0, 624.0, 433.0, 254.0, 198.0, 107.0, 82.0, 48.0, 31.0, 26.0, 11.0, 12.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.73193359375, -0.7083282470703125, -0.684722900390625, -0.6611175537109375, -0.63751220703125, -0.6139068603515625, -0.590301513671875, -0.5666961669921875, -0.5430908203125, -0.5194854736328125, -0.495880126953125, -0.4722747802734375, -0.44866943359375, -0.4250640869140625, -0.401458740234375, -0.3778533935546875, -0.354248046875, -0.3306427001953125, -0.307037353515625, -0.2834320068359375, -0.25982666015625, -0.2362213134765625, -0.212615966796875, -0.1890106201171875, -0.1654052734375, -0.1417999267578125, -0.118194580078125, -0.0945892333984375, -0.07098388671875, -0.0473785400390625, -0.023773193359375, -0.0001678466796875, 0.0234375, 0.0470428466796875, 0.070648193359375, 0.0942535400390625, 0.11785888671875, 0.1414642333984375, 0.165069580078125, 0.1886749267578125, 0.2122802734375, 0.2358856201171875, 0.259490966796875, 0.2830963134765625, 0.30670166015625, 0.3303070068359375, 0.353912353515625, 0.3775177001953125, 0.401123046875, 0.4247283935546875, 0.448333740234375, 0.4719390869140625, 0.49554443359375, 0.5191497802734375, 0.542755126953125, 0.5663604736328125, 0.5899658203125, 0.6135711669921875, 0.637176513671875, 0.6607818603515625, 0.68438720703125, 0.7079925537109375, 0.731597900390625, 0.7552032470703125, 0.77880859375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 5.0, 8.0, 15.0, 23.0, 49.0, 102.0, 197.0, 368.0, 104.0, 49.0, 32.0, 12.0, 8.0, 8.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2442626953125, -0.2341442108154297, -0.22402572631835938, -0.21390724182128906, -0.20378875732421875, -0.19367027282714844, -0.18355178833007812, -0.1734333038330078, -0.1633148193359375, -0.1531963348388672, -0.14307785034179688, -0.13295936584472656, -0.12284088134765625, -0.11272239685058594, -0.10260391235351562, -0.09248542785644531, -0.082366943359375, -0.07224845886230469, -0.062129974365234375, -0.05201148986816406, -0.04189300537109375, -0.03177452087402344, -0.021656036376953125, -0.011537551879882812, -0.0014190673828125, 0.008699417114257812, 0.018817901611328125, 0.028936386108398438, 0.03905487060546875, 0.04917335510253906, 0.059291839599609375, 0.06941032409667969, 0.07952880859375, 0.08964729309082031, 0.09976577758789062, 0.10988426208496094, 0.12000274658203125, 0.13012123107910156, 0.14023971557617188, 0.1503582000732422, 0.1604766845703125, 0.1705951690673828, 0.18071365356445312, 0.19083213806152344, 0.20095062255859375, 0.21106910705566406, 0.22118759155273438, 0.2313060760498047, 0.241424560546875, 0.2515430450439453, 0.2616615295410156, 0.27178001403808594, 0.28189849853515625, 0.29201698303222656, 0.3021354675292969, 0.3122539520263672, 0.3223724365234375, 0.3324909210205078, 0.3426094055175781, 0.35272789001464844, 0.36284637451171875, 0.37296485900878906, 0.3830833435058594, 0.3932018280029297, 0.4033203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 7.0, 14.0, 16.0, 40.0, 74.0, 280.0, 1993.0, 983556.0, 61070.0, 1098.0, 222.0, 74.0, 29.0, 21.0, 9.0, 7.0, 8.0, 2.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.5625, -7.372802734375, -7.18310546875, -6.993408203125, -6.8037109375, -6.614013671875, -6.42431640625, -6.234619140625, -6.044921875, -5.855224609375, -5.66552734375, -5.475830078125, -5.2861328125, -5.096435546875, -4.90673828125, -4.717041015625, -4.52734375, -4.337646484375, -4.14794921875, -3.958251953125, -3.7685546875, -3.578857421875, -3.38916015625, -3.199462890625, -3.009765625, -2.820068359375, -2.63037109375, -2.440673828125, -2.2509765625, -2.061279296875, -1.87158203125, -1.681884765625, -1.4921875, -1.302490234375, -1.11279296875, -0.923095703125, -0.7333984375, -0.543701171875, -0.35400390625, -0.164306640625, 0.025390625, 0.215087890625, 0.40478515625, 0.594482421875, 0.7841796875, 0.973876953125, 1.16357421875, 1.353271484375, 1.54296875, 1.732666015625, 1.92236328125, 2.112060546875, 2.3017578125, 2.491455078125, 2.68115234375, 2.870849609375, 3.060546875, 3.250244140625, 3.43994140625, 3.629638671875, 3.8193359375, 4.009033203125, 4.19873046875, 4.388427734375, 4.578125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 14.0, 29.0, 61.0, 203.0, 483.0, 144.0, 44.0, 23.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3135902881622314, -1.2673454284667969, -1.2211005687713623, -1.1748557090759277, -1.1286108493804932, -1.0823659896850586, -1.036121129989624, -0.9898763298988342, -0.9436314702033997, -0.8973866105079651, -0.8511417508125305, -0.8048969507217407, -0.7586520910263062, -0.7124072313308716, -0.666162371635437, -0.6199175119400024, -0.5736726522445679, -0.5274277925491333, -0.48118293285369873, -0.43493810296058655, -0.388693243265152, -0.3424483835697174, -0.2962035536766052, -0.24995869398117065, -0.20371383428573608, -0.1574689745903015, -0.11122412979602814, -0.06497928500175476, -0.01873442530632019, 0.02751043438911438, 0.07375526428222656, 0.12000012397766113, 0.1662449836730957, 0.21248984336853027, 0.25873470306396484, 0.304979532957077, 0.3512243926525116, 0.39746925234794617, 0.44371408224105835, 0.4899589419364929, 0.5362038016319275, 0.5824486613273621, 0.6286935210227966, 0.6749383211135864, 0.721183180809021, 0.7674280405044556, 0.8136729001998901, 0.8599177598953247, 0.9061626195907593, 0.9524074792861938, 0.9986523389816284, 1.044897198677063, 1.0911420583724976, 1.1373869180679321, 1.1836316585540771, 1.2298765182495117, 1.2761213779449463, 1.3223662376403809, 1.3686110973358154, 1.41485595703125, 1.4611008167266846, 1.5073456764221191, 1.5535905361175537, 1.5998353958129883, 1.6460802555084229]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 6.0, 0.0, 3.0, 3.0, 6.0, 8.0, 6.0, 6.0, 5.0, 10.0, 15.0, 19.0, 15.0, 14.0, 31.0, 29.0, 27.0, 23.0, 33.0, 25.0, 21.0, 32.0, 49.0, 37.0, 39.0, 42.0, 39.0, 36.0, 29.0, 35.0, 34.0, 18.0, 33.0, 39.0, 36.0, 21.0, 22.0, 21.0, 15.0, 15.0, 25.0, 15.0, 10.0, 10.0, 9.0, 10.0, 5.0, 8.0, 7.0, 3.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.2591186761856079, -0.2505349814891815, -0.24195128679275513, -0.23336759209632874, -0.22478389739990234, -0.21620020270347595, -0.20761650800704956, -0.19903281331062317, -0.19044911861419678, -0.18186542391777039, -0.173281729221344, -0.1646980345249176, -0.1561143398284912, -0.14753064513206482, -0.13894695043563843, -0.13036325573921204, -0.12177957594394684, -0.11319588124752045, -0.10461218655109406, -0.09602849185466766, -0.08744479715824127, -0.07886110246181488, -0.07027741521596909, -0.061693720519542694, -0.0531100258231163, -0.04452633112668991, -0.03594263643026352, -0.027358945459127426, -0.018775250762701035, -0.010191556066274643, -0.0016078650951385498, 0.006975829601287842, 0.015559524297714233, 0.024143218994140625, 0.03272691369056702, 0.04131060466170311, 0.0498942993581295, 0.05847799405455589, 0.06706168502569199, 0.07564537972211838, 0.08422907441854477, 0.09281276911497116, 0.10139646381139755, 0.10998015105724335, 0.11856384575366974, 0.12714754045009613, 0.13573123514652252, 0.1443149298429489, 0.1528986245393753, 0.1614823192358017, 0.1700660139322281, 0.17864970862865448, 0.18723340332508087, 0.19581709802150726, 0.20440077781677246, 0.21298447251319885, 0.22156816720962524, 0.23015186190605164, 0.23873555660247803, 0.24731925129890442, 0.2559029459953308, 0.2644866406917572, 0.2730703353881836, 0.28165403008461, 0.2902377247810364]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 8.0, 8.0, 11.0, 10.0, 10.0, 10.0, 15.0, 21.0, 26.0, 15.0, 20.0, 25.0, 34.0, 33.0, 41.0, 37.0, 40.0, 48.0, 46.0, 49.0, 40.0, 55.0, 36.0, 42.0, 42.0, 32.0, 34.0, 20.0, 32.0, 35.0, 17.0, 14.0, 18.0, 9.0, 6.0, 13.0, 10.0, 5.0, 8.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0], "bins": [-14.7421875, -14.330078125, -13.91796875, -13.505859375, -13.09375, -12.681640625, -12.26953125, -11.857421875, -11.4453125, -11.033203125, -10.62109375, -10.208984375, -9.796875, -9.384765625, -8.97265625, -8.560546875, -8.1484375, -7.736328125, -7.32421875, -6.912109375, -6.5, -6.087890625, -5.67578125, -5.263671875, -4.8515625, -4.439453125, -4.02734375, -3.615234375, -3.203125, -2.791015625, -2.37890625, -1.966796875, -1.5546875, -1.142578125, -0.73046875, -0.318359375, 0.09375, 0.505859375, 0.91796875, 1.330078125, 1.7421875, 2.154296875, 2.56640625, 2.978515625, 3.390625, 3.802734375, 4.21484375, 4.626953125, 5.0390625, 5.451171875, 5.86328125, 6.275390625, 6.6875, 7.099609375, 7.51171875, 7.923828125, 8.3359375, 8.748046875, 9.16015625, 9.572265625, 9.984375, 10.396484375, 10.80859375, 11.220703125, 11.6328125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 9.0, 7.0, 15.0, 29.0, 41.0, 35.0, 53.0, 71.0, 105.0, 152.0, 199.0, 271.0, 390.0, 548.0, 779.0, 1238.0, 1770.0, 2956.0, 4960.0, 9263.0, 18445.0, 39176.0, 86474.0, 222359.0, 368469.0, 160423.0, 65899.0, 30623.0, 14424.0, 7611.0, 4115.0, 2545.0, 1588.0, 1056.0, 693.0, 522.0, 347.0, 255.0, 164.0, 146.0, 85.0, 72.0, 51.0, 37.0, 22.0, 13.0, 9.0, 16.0, 16.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-20.703125, -20.04248046875, -19.3818359375, -18.72119140625, -18.060546875, -17.39990234375, -16.7392578125, -16.07861328125, -15.41796875, -14.75732421875, -14.0966796875, -13.43603515625, -12.775390625, -12.11474609375, -11.4541015625, -10.79345703125, -10.1328125, -9.47216796875, -8.8115234375, -8.15087890625, -7.490234375, -6.82958984375, -6.1689453125, -5.50830078125, -4.84765625, -4.18701171875, -3.5263671875, -2.86572265625, -2.205078125, -1.54443359375, -0.8837890625, -0.22314453125, 0.4375, 1.09814453125, 1.7587890625, 2.41943359375, 3.080078125, 3.74072265625, 4.4013671875, 5.06201171875, 5.72265625, 6.38330078125, 7.0439453125, 7.70458984375, 8.365234375, 9.02587890625, 9.6865234375, 10.34716796875, 11.0078125, 11.66845703125, 12.3291015625, 12.98974609375, 13.650390625, 14.31103515625, 14.9716796875, 15.63232421875, 16.29296875, 16.95361328125, 17.6142578125, 18.27490234375, 18.935546875, 19.59619140625, 20.2568359375, 20.91748046875, 21.578125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 2.0, 2.0, 6.0, 10.0, 13.0, 9.0, 16.0, 18.0, 30.0, 34.0, 21.0, 42.0, 38.0, 48.0, 39.0, 66.0, 118.0, 215.0, 1358.0, 321.0, 175.0, 95.0, 57.0, 43.0, 34.0, 43.0, 33.0, 28.0, 26.0, 19.0, 16.0, 15.0, 9.0, 10.0, 8.0, 4.0, 9.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-34.71875, -33.6904296875, -32.662109375, -31.6337890625, -30.60546875, -29.5771484375, -28.548828125, -27.5205078125, -26.4921875, -25.4638671875, -24.435546875, -23.4072265625, -22.37890625, -21.3505859375, -20.322265625, -19.2939453125, -18.265625, -17.2373046875, -16.208984375, -15.1806640625, -14.15234375, -13.1240234375, -12.095703125, -11.0673828125, -10.0390625, -9.0107421875, -7.982421875, -6.9541015625, -5.92578125, -4.8974609375, -3.869140625, -2.8408203125, -1.8125, -0.7841796875, 0.244140625, 1.2724609375, 2.30078125, 3.3291015625, 4.357421875, 5.3857421875, 6.4140625, 7.4423828125, 8.470703125, 9.4990234375, 10.52734375, 11.5556640625, 12.583984375, 13.6123046875, 14.640625, 15.6689453125, 16.697265625, 17.7255859375, 18.75390625, 19.7822265625, 20.810546875, 21.8388671875, 22.8671875, 23.8955078125, 24.923828125, 25.9521484375, 26.98046875, 28.0087890625, 29.037109375, 30.0654296875, 31.09375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 9.0, 4.0, 10.0, 13.0, 29.0, 25.0, 56.0, 62.0, 95.0, 123.0, 191.0, 288.0, 469.0, 927.0, 4099.0, 193104.0, 2929448.0, 13701.0, 1390.0, 585.0, 348.0, 221.0, 150.0, 101.0, 58.0, 54.0, 25.0, 32.0, 26.0, 13.0, 11.0, 7.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.6875, -84.0654296875, -80.443359375, -76.8212890625, -73.19921875, -69.5771484375, -65.955078125, -62.3330078125, -58.7109375, -55.0888671875, -51.466796875, -47.8447265625, -44.22265625, -40.6005859375, -36.978515625, -33.3564453125, -29.734375, -26.1123046875, -22.490234375, -18.8681640625, -15.24609375, -11.6240234375, -8.001953125, -4.3798828125, -0.7578125, 2.8642578125, 6.486328125, 10.1083984375, 13.73046875, 17.3525390625, 20.974609375, 24.5966796875, 28.21875, 31.8408203125, 35.462890625, 39.0849609375, 42.70703125, 46.3291015625, 49.951171875, 53.5732421875, 57.1953125, 60.8173828125, 64.439453125, 68.0615234375, 71.68359375, 75.3056640625, 78.927734375, 82.5498046875, 86.171875, 89.7939453125, 93.416015625, 97.0380859375, 100.66015625, 104.2822265625, 107.904296875, 111.5263671875, 115.1484375, 118.7705078125, 122.392578125, 126.0146484375, 129.63671875, 133.2587890625, 136.880859375, 140.5029296875, 144.125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 13.0, 37.0, 107.0, 209.0, 296.0, 208.0, 88.0, 36.0, 11.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-242.4510498046875, -235.21420288085938, -227.9773712158203, -220.7405242919922, -213.50367736816406, -206.266845703125, -199.02999877929688, -191.79315185546875, -184.55630493164062, -177.3194580078125, -170.08262634277344, -162.8457794189453, -155.6089324951172, -148.37210083007812, -141.13525390625, -133.89840698242188, -126.66156768798828, -119.42472839355469, -112.18788146972656, -104.95104217529297, -97.71419525146484, -90.47735595703125, -83.24050903320312, -76.00366973876953, -68.76683044433594, -61.52998733520508, -54.29314422607422, -47.056304931640625, -39.8194580078125, -32.582618713378906, -25.345775604248047, -18.108932495117188, -10.872085571289062, -3.6352429389953613, 3.60159969329834, 10.838441848754883, 18.075284957885742, 25.31212615966797, 32.54896926879883, 39.78581237792969, 47.02265548706055, 54.259498596191406, 61.496341705322266, 68.73318481445312, 75.97002410888672, 83.20686340332031, 90.44371032714844, 97.68055725097656, 104.91739654541016, 112.15423583984375, 119.39108276367188, 126.62792205810547, 133.86476135253906, 141.1016082763672, 148.3384552001953, 155.57528686523438, 162.8121337890625, 170.04898071289062, 177.2858123779297, 184.5226593017578, 191.75950622558594, 198.996337890625, 206.23318481445312, 213.47003173828125, 220.70687866210938]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 3.0, 6.0, 4.0, 7.0, 11.0, 14.0, 14.0, 13.0, 16.0, 23.0, 25.0, 24.0, 33.0, 30.0, 34.0, 37.0, 45.0, 38.0, 37.0, 29.0, 41.0, 42.0, 40.0, 38.0, 35.0, 41.0, 39.0, 29.0, 36.0, 33.0, 17.0, 20.0, 18.0, 23.0, 23.0, 17.0, 16.0, 12.0, 9.0, 5.0, 6.0, 2.0, 5.0, 4.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-85.57408142089844, -82.92086791992188, -80.26764678955078, -77.61443328857422, -74.96121215820312, -72.30799865722656, -69.65477752685547, -67.0015640258789, -64.34834289550781, -61.695125579833984, -59.041908264160156, -56.38869094848633, -53.7354736328125, -51.08226013183594, -48.42904281616211, -45.77582550048828, -43.12261199951172, -40.46939468383789, -37.81617736816406, -35.162960052490234, -32.509742736816406, -29.85652732849121, -27.203311920166016, -24.550094604492188, -21.89687728881836, -19.24365997314453, -16.590442657470703, -13.937227249145508, -11.28400993347168, -8.630792617797852, -5.97757625579834, -3.324359893798828, -0.671142578125, 1.98207426071167, 4.63529109954834, 7.28850793838501, 9.94172477722168, 12.594942092895508, 15.24815845489502, 17.90137481689453, 20.55459213256836, 23.207809448242188, 25.861026763916016, 28.51424217224121, 31.16745948791504, 33.8206787109375, 36.47389221191406, 39.12710952758789, 41.78032684326172, 44.43354415893555, 47.086761474609375, 49.7399787902832, 52.39319610595703, 55.046409606933594, 57.69962692260742, 60.35284423828125, 63.00606155395508, 65.6592788696289, 68.31249237060547, 70.96571350097656, 73.61892700195312, 76.27214813232422, 78.92536163330078, 81.57858276367188, 84.23179626464844]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 5.0, 7.0, 1.0, 8.0, 12.0, 10.0, 17.0, 10.0, 13.0, 17.0, 17.0, 28.0, 24.0, 34.0, 38.0, 40.0, 44.0, 46.0, 44.0, 38.0, 51.0, 52.0, 37.0, 40.0, 37.0, 31.0, 49.0, 41.0, 29.0, 22.0, 34.0, 16.0, 12.0, 13.0, 18.0, 10.0, 16.0, 8.0, 7.0, 9.0, 11.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-14.9296875, -14.5035400390625, -14.077392578125, -13.6512451171875, -13.22509765625, -12.7989501953125, -12.372802734375, -11.9466552734375, -11.5205078125, -11.0943603515625, -10.668212890625, -10.2420654296875, -9.81591796875, -9.3897705078125, -8.963623046875, -8.5374755859375, -8.111328125, -7.6851806640625, -7.259033203125, -6.8328857421875, -6.40673828125, -5.9805908203125, -5.554443359375, -5.1282958984375, -4.7021484375, -4.2760009765625, -3.849853515625, -3.4237060546875, -2.99755859375, -2.5714111328125, -2.145263671875, -1.7191162109375, -1.29296875, -0.8668212890625, -0.440673828125, -0.0145263671875, 0.41162109375, 0.8377685546875, 1.263916015625, 1.6900634765625, 2.1162109375, 2.5423583984375, 2.968505859375, 3.3946533203125, 3.82080078125, 4.2469482421875, 4.673095703125, 5.0992431640625, 5.525390625, 5.9515380859375, 6.377685546875, 6.8038330078125, 7.22998046875, 7.6561279296875, 8.082275390625, 8.5084228515625, 8.9345703125, 9.3607177734375, 9.786865234375, 10.2130126953125, 10.63916015625, 11.0653076171875, 11.491455078125, 11.9176025390625, 12.34375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 6.0, 11.0, 10.0, 11.0, 23.0, 25.0, 35.0, 43.0, 68.0, 94.0, 126.0, 206.0, 274.0, 416.0, 657.0, 1188.0, 2258.0, 4591.0, 11600.0, 39929.0, 254809.0, 1912177.0, 1686555.0, 221339.0, 37438.0, 10778.0, 4426.0, 2084.0, 1149.0, 670.0, 405.0, 251.0, 169.0, 134.0, 86.0, 69.0, 46.0, 39.0, 24.0, 20.0, 16.0, 12.0, 4.0, 8.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-29.25, -28.3349609375, -27.419921875, -26.5048828125, -25.58984375, -24.6748046875, -23.759765625, -22.8447265625, -21.9296875, -21.0146484375, -20.099609375, -19.1845703125, -18.26953125, -17.3544921875, -16.439453125, -15.5244140625, -14.609375, -13.6943359375, -12.779296875, -11.8642578125, -10.94921875, -10.0341796875, -9.119140625, -8.2041015625, -7.2890625, -6.3740234375, -5.458984375, -4.5439453125, -3.62890625, -2.7138671875, -1.798828125, -0.8837890625, 0.03125, 0.9462890625, 1.861328125, 2.7763671875, 3.69140625, 4.6064453125, 5.521484375, 6.4365234375, 7.3515625, 8.2666015625, 9.181640625, 10.0966796875, 11.01171875, 11.9267578125, 12.841796875, 13.7568359375, 14.671875, 15.5869140625, 16.501953125, 17.4169921875, 18.33203125, 19.2470703125, 20.162109375, 21.0771484375, 21.9921875, 22.9072265625, 23.822265625, 24.7373046875, 25.65234375, 26.5673828125, 27.482421875, 28.3974609375, 29.3125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 9.0, 16.0, 19.0, 11.0, 23.0, 33.0, 56.0, 58.0, 74.0, 96.0, 146.0, 198.0, 306.0, 357.0, 510.0, 540.0, 416.0, 301.0, 217.0, 188.0, 98.0, 105.0, 64.0, 52.0, 39.0, 39.0, 24.0, 25.0, 14.0, 9.0, 6.0, 4.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.984375, -17.3212890625, -16.658203125, -15.9951171875, -15.33203125, -14.6689453125, -14.005859375, -13.3427734375, -12.6796875, -12.0166015625, -11.353515625, -10.6904296875, -10.02734375, -9.3642578125, -8.701171875, -8.0380859375, -7.375, -6.7119140625, -6.048828125, -5.3857421875, -4.72265625, -4.0595703125, -3.396484375, -2.7333984375, -2.0703125, -1.4072265625, -0.744140625, -0.0810546875, 0.58203125, 1.2451171875, 1.908203125, 2.5712890625, 3.234375, 3.8974609375, 4.560546875, 5.2236328125, 5.88671875, 6.5498046875, 7.212890625, 7.8759765625, 8.5390625, 9.2021484375, 9.865234375, 10.5283203125, 11.19140625, 11.8544921875, 12.517578125, 13.1806640625, 13.84375, 14.5068359375, 15.169921875, 15.8330078125, 16.49609375, 17.1591796875, 17.822265625, 18.4853515625, 19.1484375, 19.8115234375, 20.474609375, 21.1376953125, 21.80078125, 22.4638671875, 23.126953125, 23.7900390625, 24.453125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 1.0, 9.0, 10.0, 13.0, 20.0, 36.0, 31.0, 52.0, 81.0, 162.0, 175.0, 350.0, 571.0, 1058.0, 2198.0, 5119.0, 14840.0, 52404.0, 252844.0, 2135960.0, 1475340.0, 190293.0, 41773.0, 12232.0, 4528.0, 1870.0, 942.0, 464.0, 328.0, 184.0, 126.0, 78.0, 60.0, 38.0, 20.0, 22.0, 13.0, 14.0, 6.0, 3.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.15625, -32.1787109375, -31.201171875, -30.2236328125, -29.24609375, -28.2685546875, -27.291015625, -26.3134765625, -25.3359375, -24.3583984375, -23.380859375, -22.4033203125, -21.42578125, -20.4482421875, -19.470703125, -18.4931640625, -17.515625, -16.5380859375, -15.560546875, -14.5830078125, -13.60546875, -12.6279296875, -11.650390625, -10.6728515625, -9.6953125, -8.7177734375, -7.740234375, -6.7626953125, -5.78515625, -4.8076171875, -3.830078125, -2.8525390625, -1.875, -0.8974609375, 0.080078125, 1.0576171875, 2.03515625, 3.0126953125, 3.990234375, 4.9677734375, 5.9453125, 6.9228515625, 7.900390625, 8.8779296875, 9.85546875, 10.8330078125, 11.810546875, 12.7880859375, 13.765625, 14.7431640625, 15.720703125, 16.6982421875, 17.67578125, 18.6533203125, 19.630859375, 20.6083984375, 21.5859375, 22.5634765625, 23.541015625, 24.5185546875, 25.49609375, 26.4736328125, 27.451171875, 28.4287109375, 29.40625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 31.0, 187.0, 531.0, 234.0, 24.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-264.2575988769531, -248.2565155029297, -232.2554473876953, -216.25436401367188, -200.2532958984375, -184.25221252441406, -168.25112915039062, -152.25006103515625, -136.2489776611328, -120.2479019165039, -104.246826171875, -88.24574279785156, -72.24466705322266, -56.24359130859375, -40.24250793457031, -24.241432189941406, -8.2403564453125, 7.760721206665039, 23.761798858642578, 39.76287841796875, 55.763954162597656, 71.76502990722656, 87.76611328125, 103.7671890258789, 119.76826477050781, 135.76934814453125, 151.77041625976562, 167.77149963378906, 183.7725830078125, 199.77365112304688, 215.7747344970703, 231.77581787109375, 247.77691650390625, 263.7779846191406, 279.7790832519531, 295.7801513671875, 311.7812194824219, 327.78228759765625, 343.78338623046875, 359.7844543457031, 375.7855224609375, 391.7865905761719, 407.7876892089844, 423.78875732421875, 439.7898254394531, 455.7908935546875, 471.7919921875, 487.7930603027344, 503.7941589355469, 519.7952270507812, 535.7963256835938, 551.79736328125, 567.7984619140625, 583.799560546875, 599.8006591796875, 615.8016967773438, 631.8027954101562, 647.8038940429688, 663.804931640625, 679.8060302734375, 695.80712890625, 711.8081665039062, 727.8092651367188, 743.8103637695312, 759.8114013671875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 9.0, 4.0, 7.0, 6.0, 5.0, 5.0, 7.0, 9.0, 11.0, 9.0, 12.0, 16.0, 22.0, 28.0, 25.0, 32.0, 22.0, 33.0, 33.0, 30.0, 29.0, 37.0, 36.0, 36.0, 36.0, 38.0, 38.0, 42.0, 30.0, 39.0, 28.0, 27.0, 29.0, 30.0, 17.0, 20.0, 22.0, 18.0, 23.0, 12.0, 12.0, 14.0, 11.0, 10.0, 8.0, 10.0, 2.0, 7.0, 7.0, 1.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-62.77647399902344, -60.68628692626953, -58.596099853515625, -56.50591278076172, -54.41572189331055, -52.32553482055664, -50.235347747802734, -48.14516067504883, -46.054969787597656, -43.96478271484375, -41.874595642089844, -39.78440856933594, -37.694217681884766, -35.60403060913086, -33.51384353637695, -31.423656463623047, -29.33346939086914, -27.243282318115234, -25.153093338012695, -23.06290626525879, -20.97271728515625, -18.882530212402344, -16.792343139648438, -14.702155113220215, -12.611967086791992, -10.52177906036377, -8.431591033935547, -6.341403961181641, -4.251215934753418, -2.1610279083251953, -0.07084083557128906, 2.0193471908569336, 4.109535217285156, 6.199723243713379, 8.289911270141602, 10.380098342895508, 12.47028636932373, 14.560474395751953, 16.65066146850586, 18.740848541259766, 20.831037521362305, 22.92122459411621, 25.01141357421875, 27.101600646972656, 29.191787719726562, 31.2819766998291, 33.372161865234375, 35.46235275268555, 37.55253982543945, 39.64272689819336, 41.732913970947266, 43.82310485839844, 45.913291931152344, 48.00347900390625, 50.093666076660156, 52.18385314941406, 54.27404022216797, 56.364227294921875, 58.45441436767578, 60.54460144042969, 62.63479232788086, 64.7249755859375, 66.81517028808594, 68.90535736083984, 70.99554443359375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 6.0, 8.0, 9.0, 9.0, 9.0, 12.0, 14.0, 22.0, 15.0, 26.0, 38.0, 32.0, 41.0, 31.0, 33.0, 50.0, 36.0, 40.0, 48.0, 40.0, 40.0, 41.0, 32.0, 43.0, 33.0, 38.0, 22.0, 32.0, 31.0, 32.0, 27.0, 15.0, 18.0, 15.0, 14.0, 11.0, 9.0, 7.0, 5.0, 5.0, 5.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9765625, -11.58544921875, -11.1943359375, -10.80322265625, -10.412109375, -10.02099609375, -9.6298828125, -9.23876953125, -8.84765625, -8.45654296875, -8.0654296875, -7.67431640625, -7.283203125, -6.89208984375, -6.5009765625, -6.10986328125, -5.71875, -5.32763671875, -4.9365234375, -4.54541015625, -4.154296875, -3.76318359375, -3.3720703125, -2.98095703125, -2.58984375, -2.19873046875, -1.8076171875, -1.41650390625, -1.025390625, -0.63427734375, -0.2431640625, 0.14794921875, 0.5390625, 0.93017578125, 1.3212890625, 1.71240234375, 2.103515625, 2.49462890625, 2.8857421875, 3.27685546875, 3.66796875, 4.05908203125, 4.4501953125, 4.84130859375, 5.232421875, 5.62353515625, 6.0146484375, 6.40576171875, 6.796875, 7.18798828125, 7.5791015625, 7.97021484375, 8.361328125, 8.75244140625, 9.1435546875, 9.53466796875, 9.92578125, 10.31689453125, 10.7080078125, 11.09912109375, 11.490234375, 11.88134765625, 12.2724609375, 12.66357421875, 13.0546875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 5.0, 3.0, 11.0, 14.0, 21.0, 30.0, 33.0, 60.0, 82.0, 99.0, 183.0, 234.0, 397.0, 545.0, 885.0, 1410.0, 2253.0, 3573.0, 6066.0, 10013.0, 17485.0, 30418.0, 54965.0, 99215.0, 176363.0, 239062.0, 176027.0, 100136.0, 55128.0, 30617.0, 17365.0, 9996.0, 6090.0, 3554.0, 2230.0, 1393.0, 881.0, 580.0, 363.0, 250.0, 149.0, 115.0, 85.0, 57.0, 36.0, 20.0, 23.0, 14.0, 14.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2333984375, -1.19158935546875, -1.1497802734375, -1.10797119140625, -1.066162109375, -1.02435302734375, -0.9825439453125, -0.94073486328125, -0.89892578125, -0.85711669921875, -0.8153076171875, -0.77349853515625, -0.731689453125, -0.68988037109375, -0.6480712890625, -0.60626220703125, -0.564453125, -0.52264404296875, -0.4808349609375, -0.43902587890625, -0.397216796875, -0.35540771484375, -0.3135986328125, -0.27178955078125, -0.22998046875, -0.18817138671875, -0.1463623046875, -0.10455322265625, -0.062744140625, -0.02093505859375, 0.0208740234375, 0.06268310546875, 0.1044921875, 0.14630126953125, 0.1881103515625, 0.22991943359375, 0.271728515625, 0.31353759765625, 0.3553466796875, 0.39715576171875, 0.43896484375, 0.48077392578125, 0.5225830078125, 0.56439208984375, 0.606201171875, 0.64801025390625, 0.6898193359375, 0.73162841796875, 0.7734375, 0.81524658203125, 0.8570556640625, 0.89886474609375, 0.940673828125, 0.98248291015625, 1.0242919921875, 1.06610107421875, 1.10791015625, 1.14971923828125, 1.1915283203125, 1.23333740234375, 1.275146484375, 1.31695556640625, 1.3587646484375, 1.40057373046875, 1.4423828125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [5.0, 2.0, 0.0, 3.0, 7.0, 4.0, 10.0, 10.0, 10.0, 16.0, 9.0, 17.0, 20.0, 19.0, 21.0, 21.0, 29.0, 36.0, 44.0, 27.0, 35.0, 46.0, 48.0, 26.0, 1066.0, 39.0, 48.0, 42.0, 51.0, 49.0, 39.0, 31.0, 24.0, 28.0, 27.0, 15.0, 23.0, 17.0, 21.0, 10.0, 6.0, 10.0, 12.0, 3.0, 9.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.66015625, -6.39324951171875, -6.1263427734375, -5.85943603515625, -5.592529296875, -5.32562255859375, -5.0587158203125, -4.79180908203125, -4.52490234375, -4.25799560546875, -3.9910888671875, -3.72418212890625, -3.457275390625, -3.19036865234375, -2.9234619140625, -2.65655517578125, -2.3896484375, -2.12274169921875, -1.8558349609375, -1.58892822265625, -1.322021484375, -1.05511474609375, -0.7882080078125, -0.52130126953125, -0.25439453125, 0.01251220703125, 0.2794189453125, 0.54632568359375, 0.813232421875, 1.08013916015625, 1.3470458984375, 1.61395263671875, 1.880859375, 2.14776611328125, 2.4146728515625, 2.68157958984375, 2.948486328125, 3.21539306640625, 3.4822998046875, 3.74920654296875, 4.01611328125, 4.28302001953125, 4.5499267578125, 4.81683349609375, 5.083740234375, 5.35064697265625, 5.6175537109375, 5.88446044921875, 6.1513671875, 6.41827392578125, 6.6851806640625, 6.95208740234375, 7.218994140625, 7.48590087890625, 7.7528076171875, 8.01971435546875, 8.28662109375, 8.55352783203125, 8.8204345703125, 9.08734130859375, 9.354248046875, 9.62115478515625, 9.8880615234375, 10.15496826171875, 10.421875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 11.0, 17.0, 11.0, 28.0, 29.0, 59.0, 60.0, 95.0, 177.0, 244.0, 360.0, 538.0, 796.0, 1195.0, 1909.0, 2888.0, 4402.0, 6902.0, 10528.0, 16433.0, 26225.0, 43269.0, 71527.0, 123039.0, 294848.0, 1143718.0, 138739.0, 80740.0, 47715.0, 29115.0, 18343.0, 11645.0, 7387.0, 4685.0, 3249.0, 2073.0, 1353.0, 923.0, 610.0, 379.0, 291.0, 197.0, 112.0, 83.0, 53.0, 38.0, 34.0, 17.0, 18.0, 13.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.64306640625, -0.6230392456054688, -0.6030120849609375, -0.5829849243164062, -0.562957763671875, -0.5429306030273438, -0.5229034423828125, -0.5028762817382812, -0.48284912109375, -0.46282196044921875, -0.4427947998046875, -0.42276763916015625, -0.402740478515625, -0.38271331787109375, -0.3626861572265625, -0.34265899658203125, -0.3226318359375, -0.30260467529296875, -0.2825775146484375, -0.26255035400390625, -0.242523193359375, -0.22249603271484375, -0.2024688720703125, -0.18244171142578125, -0.16241455078125, -0.14238739013671875, -0.1223602294921875, -0.10233306884765625, -0.082305908203125, -0.06227874755859375, -0.0422515869140625, -0.02222442626953125, -0.002197265625, 0.01782989501953125, 0.0378570556640625, 0.05788421630859375, 0.077911376953125, 0.09793853759765625, 0.1179656982421875, 0.13799285888671875, 0.15802001953125, 0.17804718017578125, 0.1980743408203125, 0.21810150146484375, 0.238128662109375, 0.25815582275390625, 0.2781829833984375, 0.29821014404296875, 0.3182373046875, 0.33826446533203125, 0.3582916259765625, 0.37831878662109375, 0.398345947265625, 0.41837310791015625, 0.4384002685546875, 0.45842742919921875, 0.47845458984375, 0.49848175048828125, 0.5185089111328125, 0.5385360717773438, 0.558563232421875, 0.5785903930664062, 0.5986175537109375, 0.6186447143554688, 0.638671875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 2.0, 6.0, 5.0, 9.0, 9.0, 8.0, 19.0, 31.0, 39.0, 40.0, 100.0, 142.0, 187.0, 128.0, 74.0, 38.0, 36.0, 18.0, 12.0, 17.0, 9.0, 10.0, 12.0, 6.0, 4.0, 6.0, 7.0, 2.0, 0.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07232666015625, -0.07021903991699219, -0.06811141967773438, -0.06600379943847656, -0.06389617919921875, -0.06178855895996094, -0.059680938720703125, -0.05757331848144531, -0.0554656982421875, -0.05335807800292969, -0.051250457763671875, -0.04914283752441406, -0.04703521728515625, -0.04492759704589844, -0.042819976806640625, -0.04071235656738281, -0.038604736328125, -0.03649711608886719, -0.034389495849609375, -0.03228187561035156, -0.03017425537109375, -0.028066635131835938, -0.025959014892578125, -0.023851394653320312, -0.0217437744140625, -0.019636154174804688, -0.017528533935546875, -0.015420913696289062, -0.01331329345703125, -0.011205673217773438, -0.009098052978515625, -0.0069904327392578125, -0.0048828125, -0.0027751922607421875, -0.000667572021484375, 0.0014400482177734375, 0.00354766845703125, 0.0056552886962890625, 0.007762908935546875, 0.009870529174804688, 0.0119781494140625, 0.014085769653320312, 0.016193389892578125, 0.018301010131835938, 0.02040863037109375, 0.022516250610351562, 0.024623870849609375, 0.026731491088867188, 0.028839111328125, 0.030946731567382812, 0.033054351806640625, 0.03516197204589844, 0.03726959228515625, 0.03937721252441406, 0.041484832763671875, 0.04359245300292969, 0.0457000732421875, 0.04780769348144531, 0.049915313720703125, 0.05202293395996094, 0.05413055419921875, 0.05623817443847656, 0.058345794677734375, 0.06045341491699219, 0.06256103515625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 10.0, 3.0, 7.0, 1.0, 9.0, 8.0, 6.0, 10.0, 8.0, 15.0, 19.0, 24.0, 25.0, 57.0, 48.0, 95.0, 139.0, 306.0, 839.0, 2932.0, 19867.0, 966673.0, 50682.0, 4648.0, 1210.0, 415.0, 161.0, 98.0, 63.0, 34.0, 35.0, 25.0, 20.0, 8.0, 12.0, 7.0, 8.0, 6.0, 7.0, 4.0, 4.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.05859375, -1.02288818359375, -0.9871826171875, -0.95147705078125, -0.915771484375, -0.88006591796875, -0.8443603515625, -0.80865478515625, -0.77294921875, -0.73724365234375, -0.7015380859375, -0.66583251953125, -0.630126953125, -0.59442138671875, -0.5587158203125, -0.52301025390625, -0.4873046875, -0.45159912109375, -0.4158935546875, -0.38018798828125, -0.344482421875, -0.30877685546875, -0.2730712890625, -0.23736572265625, -0.20166015625, -0.16595458984375, -0.1302490234375, -0.09454345703125, -0.058837890625, -0.02313232421875, 0.0125732421875, 0.04827880859375, 0.083984375, 0.11968994140625, 0.1553955078125, 0.19110107421875, 0.226806640625, 0.26251220703125, 0.2982177734375, 0.33392333984375, 0.36962890625, 0.40533447265625, 0.4410400390625, 0.47674560546875, 0.512451171875, 0.54815673828125, 0.5838623046875, 0.61956787109375, 0.6552734375, 0.69097900390625, 0.7266845703125, 0.76239013671875, 0.798095703125, 0.83380126953125, 0.8695068359375, 0.90521240234375, 0.94091796875, 0.97662353515625, 1.0123291015625, 1.04803466796875, 1.083740234375, 1.11944580078125, 1.1551513671875, 1.19085693359375, 1.2265625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 10.0, 20.0, 48.0, 149.0, 433.0, 226.0, 77.0, 32.0, 9.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9330242872238159, -0.9146406650543213, -0.8962571024894714, -0.8778734803199768, -0.859489917755127, -0.8411062955856323, -0.8227227330207825, -0.8043391108512878, -0.785955548286438, -0.7675719261169434, -0.7491883635520935, -0.7308047413825989, -0.712421178817749, -0.6940375566482544, -0.6756539940834045, -0.6572703719139099, -0.6388868093490601, -0.6205031871795654, -0.6021196246147156, -0.583736002445221, -0.5653524398803711, -0.5469688177108765, -0.5285852551460266, -0.510201632976532, -0.49181801080703735, -0.4734344184398651, -0.45505082607269287, -0.43666723370552063, -0.4182836413383484, -0.39990004897117615, -0.3815164566040039, -0.3631328344345093, -0.3447492718696594, -0.3263656795024872, -0.30798208713531494, -0.2895984947681427, -0.27121490240097046, -0.2528313100337982, -0.23444770276546478, -0.21606411039829254, -0.1976805329322815, -0.17929694056510925, -0.160913348197937, -0.14252975583076477, -0.12414615601301193, -0.10576256364583969, -0.08737896382808685, -0.06899537146091461, -0.05061177909374237, -0.03222818672657013, -0.01384459063410759, 0.00453900545835495, 0.02292259782552719, 0.04130619019269943, 0.05968979001045227, 0.07807338237762451, 0.09645697474479675, 0.114840567111969, 0.13322415947914124, 0.15160775184631348, 0.16999134421348572, 0.18837493658065796, 0.2067585438489914, 0.22514213621616364, 0.24352572858333588]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 7.0, 2.0, 9.0, 10.0, 11.0, 13.0, 21.0, 26.0, 19.0, 25.0, 27.0, 16.0, 40.0, 35.0, 43.0, 30.0, 29.0, 40.0, 26.0, 51.0, 45.0, 42.0, 48.0, 46.0, 33.0, 43.0, 25.0, 31.0, 38.0, 29.0, 26.0, 15.0, 24.0, 23.0, 13.0, 13.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05482608079910278, -0.05288701131939888, -0.05094794183969498, -0.049008868634700775, -0.04706979915499687, -0.04513072967529297, -0.04319165647029877, -0.041252586990594864, -0.03931351751089096, -0.03737444803118706, -0.035435378551483154, -0.03349630534648895, -0.03155723586678505, -0.029618166387081146, -0.027679095044732094, -0.02574002370238304, -0.023800954222679138, -0.021861884742975235, -0.019922813400626183, -0.01798374205827713, -0.016044672578573227, -0.014105602167546749, -0.012166531756520271, -0.010227461345493793, -0.008288390934467316, -0.006349320523440838, -0.00441025011241436, -0.0024711797013878822, -0.0005321092903614044, 0.0014069611206650734, 0.003346031531691551, 0.005285101942718029, 0.007224172353744507, 0.009163242764770985, 0.011102313175797462, 0.01304138358682394, 0.014980453997850418, 0.01691952347755432, 0.018858594819903374, 0.020797666162252426, 0.02273673564195633, 0.024675805121660233, 0.026614876464009285, 0.028553947806358337, 0.03049301728606224, 0.032432086765766144, 0.034371159970760345, 0.03631022945046425, 0.03824929893016815, 0.040188368409872055, 0.04212743788957596, 0.04406651109457016, 0.04600558057427406, 0.047944650053977966, 0.04988372325897217, 0.05182279273867607, 0.053761862218379974, 0.05570093169808388, 0.05764000117778778, 0.05957907438278198, 0.061518143862485886, 0.06345721334218979, 0.06539628654718399, 0.0673353523015976, 0.0692744255065918]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 6.0, 8.0, 9.0, 9.0, 9.0, 12.0, 14.0, 22.0, 18.0, 23.0, 38.0, 32.0, 41.0, 31.0, 33.0, 51.0, 36.0, 41.0, 47.0, 39.0, 40.0, 42.0, 31.0, 43.0, 33.0, 38.0, 23.0, 31.0, 31.0, 32.0, 28.0, 14.0, 18.0, 15.0, 14.0, 11.0, 9.0, 7.0, 5.0, 5.0, 5.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9765625, -11.5853271484375, -11.194091796875, -10.8028564453125, -10.41162109375, -10.0203857421875, -9.629150390625, -9.2379150390625, -8.8466796875, -8.4554443359375, -8.064208984375, -7.6729736328125, -7.28173828125, -6.8905029296875, -6.499267578125, -6.1080322265625, -5.716796875, -5.3255615234375, -4.934326171875, -4.5430908203125, -4.15185546875, -3.7606201171875, -3.369384765625, -2.9781494140625, -2.5869140625, -2.1956787109375, -1.804443359375, -1.4132080078125, -1.02197265625, -0.6307373046875, -0.239501953125, 0.1517333984375, 0.54296875, 0.9342041015625, 1.325439453125, 1.7166748046875, 2.10791015625, 2.4991455078125, 2.890380859375, 3.2816162109375, 3.6728515625, 4.0640869140625, 4.455322265625, 4.8465576171875, 5.23779296875, 5.6290283203125, 6.020263671875, 6.4114990234375, 6.802734375, 7.1939697265625, 7.585205078125, 7.9764404296875, 8.36767578125, 8.7589111328125, 9.150146484375, 9.5413818359375, 9.9326171875, 10.3238525390625, 10.715087890625, 11.1063232421875, 11.49755859375, 11.8887939453125, 12.280029296875, 12.6712646484375, 13.0625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 10.0, 4.0, 17.0, 22.0, 23.0, 33.0, 44.0, 68.0, 89.0, 119.0, 151.0, 240.0, 331.0, 474.0, 680.0, 1044.0, 1727.0, 2910.0, 5432.0, 11494.0, 27993.0, 85445.0, 327636.0, 413140.0, 107337.0, 33857.0, 13288.0, 6123.0, 3224.0, 1817.0, 1233.0, 799.0, 507.0, 396.0, 246.0, 151.0, 121.0, 100.0, 56.0, 47.0, 35.0, 26.0, 19.0, 12.0, 12.0, 7.0, 3.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-24.625, -23.880859375, -23.13671875, -22.392578125, -21.6484375, -20.904296875, -20.16015625, -19.416015625, -18.671875, -17.927734375, -17.18359375, -16.439453125, -15.6953125, -14.951171875, -14.20703125, -13.462890625, -12.71875, -11.974609375, -11.23046875, -10.486328125, -9.7421875, -8.998046875, -8.25390625, -7.509765625, -6.765625, -6.021484375, -5.27734375, -4.533203125, -3.7890625, -3.044921875, -2.30078125, -1.556640625, -0.8125, -0.068359375, 0.67578125, 1.419921875, 2.1640625, 2.908203125, 3.65234375, 4.396484375, 5.140625, 5.884765625, 6.62890625, 7.373046875, 8.1171875, 8.861328125, 9.60546875, 10.349609375, 11.09375, 11.837890625, 12.58203125, 13.326171875, 14.0703125, 14.814453125, 15.55859375, 16.302734375, 17.046875, 17.791015625, 18.53515625, 19.279296875, 20.0234375, 20.767578125, 21.51171875, 22.255859375, 23.0]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 6.0, 4.0, 5.0, 11.0, 7.0, 14.0, 15.0, 14.0, 19.0, 21.0, 30.0, 32.0, 42.0, 38.0, 36.0, 62.0, 95.0, 127.0, 204.0, 1422.0, 269.0, 122.0, 82.0, 68.0, 58.0, 37.0, 44.0, 27.0, 26.0, 25.0, 15.0, 17.0, 16.0, 12.0, 5.0, 8.0, 5.0, 4.0, 8.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.3125, -28.35205078125, -27.3916015625, -26.43115234375, -25.470703125, -24.51025390625, -23.5498046875, -22.58935546875, -21.62890625, -20.66845703125, -19.7080078125, -18.74755859375, -17.787109375, -16.82666015625, -15.8662109375, -14.90576171875, -13.9453125, -12.98486328125, -12.0244140625, -11.06396484375, -10.103515625, -9.14306640625, -8.1826171875, -7.22216796875, -6.26171875, -5.30126953125, -4.3408203125, -3.38037109375, -2.419921875, -1.45947265625, -0.4990234375, 0.46142578125, 1.421875, 2.38232421875, 3.3427734375, 4.30322265625, 5.263671875, 6.22412109375, 7.1845703125, 8.14501953125, 9.10546875, 10.06591796875, 11.0263671875, 11.98681640625, 12.947265625, 13.90771484375, 14.8681640625, 15.82861328125, 16.7890625, 17.74951171875, 18.7099609375, 19.67041015625, 20.630859375, 21.59130859375, 22.5517578125, 23.51220703125, 24.47265625, 25.43310546875, 26.3935546875, 27.35400390625, 28.314453125, 29.27490234375, 30.2353515625, 31.19580078125, 32.15625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 10.0, 11.0, 13.0, 14.0, 19.0, 33.0, 70.0, 120.0, 207.0, 393.0, 694.0, 1805.0, 28312.0, 3098305.0, 12875.0, 1422.0, 615.0, 324.0, 170.0, 105.0, 74.0, 41.0, 19.0, 14.0, 11.0, 9.0, 7.0, 6.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-142.875, -138.72265625, -134.5703125, -130.41796875, -126.265625, -122.11328125, -117.9609375, -113.80859375, -109.65625, -105.50390625, -101.3515625, -97.19921875, -93.046875, -88.89453125, -84.7421875, -80.58984375, -76.4375, -72.28515625, -68.1328125, -63.98046875, -59.828125, -55.67578125, -51.5234375, -47.37109375, -43.21875, -39.06640625, -34.9140625, -30.76171875, -26.609375, -22.45703125, -18.3046875, -14.15234375, -10.0, -5.84765625, -1.6953125, 2.45703125, 6.609375, 10.76171875, 14.9140625, 19.06640625, 23.21875, 27.37109375, 31.5234375, 35.67578125, 39.828125, 43.98046875, 48.1328125, 52.28515625, 56.4375, 60.58984375, 64.7421875, 68.89453125, 73.046875, 77.19921875, 81.3515625, 85.50390625, 89.65625, 93.80859375, 97.9609375, 102.11328125, 106.265625, 110.41796875, 114.5703125, 118.72265625, 122.875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 135.0, 559.0, 288.0, 26.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-315.3527526855469, -298.56707763671875, -281.78143310546875, -264.9957580566406, -248.21009826660156, -231.4244384765625, -214.63876342773438, -197.8531036376953, -181.06744384765625, -164.2817840576172, -147.49612426757812, -130.71044921875, -113.92478942871094, -97.13912963867188, -80.35346221923828, -63.56779479980469, -46.782135009765625, -29.996471405029297, -13.210807800292969, 3.5748558044433594, 20.360519409179688, 37.14617919921875, 53.931846618652344, 70.71751403808594, 87.503173828125, 104.28883361816406, 121.07450103759766, 137.86016845703125, 154.6458282470703, 171.43148803710938, 188.2171630859375, 205.00282287597656, 221.78851318359375, 238.5741729736328, 255.35983276367188, 272.1455078125, 288.93115234375, 305.7168273925781, 322.50250244140625, 339.28814697265625, 356.0738220214844, 372.8594970703125, 389.6451416015625, 406.4308166503906, 423.21649169921875, 440.00213623046875, 456.7878112792969, 473.573486328125, 490.359130859375, 507.1448059082031, 523.9304809570312, 540.7161254882812, 557.5017700195312, 574.2874755859375, 591.0731201171875, 607.8587646484375, 624.6444091796875, 641.4300537109375, 658.2157592773438, 675.0014038085938, 691.7870483398438, 708.57275390625, 725.3583984375, 742.14404296875, 758.9297485351562]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 6.0, 8.0, 6.0, 11.0, 7.0, 14.0, 8.0, 19.0, 24.0, 27.0, 23.0, 28.0, 35.0, 37.0, 38.0, 36.0, 40.0, 53.0, 57.0, 47.0, 44.0, 37.0, 40.0, 48.0, 42.0, 40.0, 43.0, 27.0, 28.0, 27.0, 17.0, 17.0, 19.0, 14.0, 14.0, 13.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-96.4081802368164, -93.58419799804688, -90.76020812988281, -87.93622589111328, -85.11224365234375, -82.28825378417969, -79.46427154541016, -76.64028930664062, -73.81629943847656, -70.99231719970703, -68.16832733154297, -65.34434509277344, -62.520362854003906, -59.69637680053711, -56.87239074707031, -54.04840850830078, -51.22442626953125, -48.40044021606445, -45.57645797729492, -42.752471923828125, -39.928489685058594, -37.1045036315918, -34.280517578125, -31.456533432006836, -28.632549285888672, -25.808565139770508, -22.984580993652344, -20.160594940185547, -17.336610794067383, -14.512626647949219, -11.688640594482422, -8.864656448364258, -6.040679931640625, -3.2166953086853027, -0.39271068572998047, 2.4312744140625, 5.255258560180664, 8.079242706298828, 10.903228759765625, 13.727212905883789, 16.551197052001953, 19.375181198120117, 22.19916534423828, 25.023151397705078, 27.847135543823242, 30.671119689941406, 33.4951057434082, 36.319091796875, 39.14307403564453, 41.96706008911133, 44.79104232788086, 47.615028381347656, 50.43901062011719, 53.262996673583984, 56.08698272705078, 58.91096496582031, 61.73495101928711, 64.5589370727539, 67.38291931152344, 70.2069091796875, 73.03089141845703, 75.85487365722656, 78.67886352539062, 81.50284576416016, 84.32682800292969]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 7.0, 8.0, 10.0, 10.0, 13.0, 19.0, 15.0, 15.0, 26.0, 17.0, 21.0, 25.0, 31.0, 27.0, 17.0, 34.0, 42.0, 46.0, 47.0, 29.0, 45.0, 31.0, 39.0, 32.0, 22.0, 40.0, 32.0, 29.0, 23.0, 26.0, 31.0, 20.0, 20.0, 17.0, 28.0, 11.0, 20.0, 11.0, 7.0, 9.0, 10.0, 7.0, 9.0, 4.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-11.4296875, -11.063232421875, -10.69677734375, -10.330322265625, -9.9638671875, -9.597412109375, -9.23095703125, -8.864501953125, -8.498046875, -8.131591796875, -7.76513671875, -7.398681640625, -7.0322265625, -6.665771484375, -6.29931640625, -5.932861328125, -5.56640625, -5.199951171875, -4.83349609375, -4.467041015625, -4.1005859375, -3.734130859375, -3.36767578125, -3.001220703125, -2.634765625, -2.268310546875, -1.90185546875, -1.535400390625, -1.1689453125, -0.802490234375, -0.43603515625, -0.069580078125, 0.296875, 0.663330078125, 1.02978515625, 1.396240234375, 1.7626953125, 2.129150390625, 2.49560546875, 2.862060546875, 3.228515625, 3.594970703125, 3.96142578125, 4.327880859375, 4.6943359375, 5.060791015625, 5.42724609375, 5.793701171875, 6.16015625, 6.526611328125, 6.89306640625, 7.259521484375, 7.6259765625, 7.992431640625, 8.35888671875, 8.725341796875, 9.091796875, 9.458251953125, 9.82470703125, 10.191162109375, 10.5576171875, 10.924072265625, 11.29052734375, 11.656982421875, 12.0234375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 7.0, 2.0, 3.0, 9.0, 9.0, 10.0, 23.0, 27.0, 43.0, 52.0, 80.0, 105.0, 126.0, 212.0, 252.0, 392.0, 552.0, 859.0, 1344.0, 2325.0, 4645.0, 11164.0, 37799.0, 234563.0, 1713534.0, 1869484.0, 253496.0, 40475.0, 11468.0, 4675.0, 2340.0, 1363.0, 890.0, 541.0, 391.0, 279.0, 225.0, 152.0, 96.0, 82.0, 53.0, 55.0, 25.0, 22.0, 17.0, 12.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.40625, -25.4638671875, -24.521484375, -23.5791015625, -22.63671875, -21.6943359375, -20.751953125, -19.8095703125, -18.8671875, -17.9248046875, -16.982421875, -16.0400390625, -15.09765625, -14.1552734375, -13.212890625, -12.2705078125, -11.328125, -10.3857421875, -9.443359375, -8.5009765625, -7.55859375, -6.6162109375, -5.673828125, -4.7314453125, -3.7890625, -2.8466796875, -1.904296875, -0.9619140625, -0.01953125, 0.9228515625, 1.865234375, 2.8076171875, 3.75, 4.6923828125, 5.634765625, 6.5771484375, 7.51953125, 8.4619140625, 9.404296875, 10.3466796875, 11.2890625, 12.2314453125, 13.173828125, 14.1162109375, 15.05859375, 16.0009765625, 16.943359375, 17.8857421875, 18.828125, 19.7705078125, 20.712890625, 21.6552734375, 22.59765625, 23.5400390625, 24.482421875, 25.4248046875, 26.3671875, 27.3095703125, 28.251953125, 29.1943359375, 30.13671875, 31.0791015625, 32.021484375, 32.9638671875, 33.90625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 7.0, 5.0, 5.0, 5.0, 12.0, 9.0, 34.0, 48.0, 76.0, 86.0, 140.0, 193.0, 287.0, 397.0, 526.0, 635.0, 526.0, 321.0, 246.0, 185.0, 98.0, 74.0, 41.0, 43.0, 26.0, 15.0, 15.0, 8.0, 5.0, 4.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.40625, -23.576171875, -22.74609375, -21.916015625, -21.0859375, -20.255859375, -19.42578125, -18.595703125, -17.765625, -16.935546875, -16.10546875, -15.275390625, -14.4453125, -13.615234375, -12.78515625, -11.955078125, -11.125, -10.294921875, -9.46484375, -8.634765625, -7.8046875, -6.974609375, -6.14453125, -5.314453125, -4.484375, -3.654296875, -2.82421875, -1.994140625, -1.1640625, -0.333984375, 0.49609375, 1.326171875, 2.15625, 2.986328125, 3.81640625, 4.646484375, 5.4765625, 6.306640625, 7.13671875, 7.966796875, 8.796875, 9.626953125, 10.45703125, 11.287109375, 12.1171875, 12.947265625, 13.77734375, 14.607421875, 15.4375, 16.267578125, 17.09765625, 17.927734375, 18.7578125, 19.587890625, 20.41796875, 21.248046875, 22.078125, 22.908203125, 23.73828125, 24.568359375, 25.3984375, 26.228515625, 27.05859375, 27.888671875, 28.71875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 5.0, 2.0, 6.0, 12.0, 15.0, 24.0, 39.0, 67.0, 90.0, 168.0, 277.0, 586.0, 1398.0, 4496.0, 23831.0, 344274.0, 3500460.0, 290177.0, 21427.0, 4167.0, 1509.0, 556.0, 275.0, 172.0, 95.0, 52.0, 32.0, 21.0, 17.0, 9.0, 5.0, 4.0, 3.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-54.4375, -52.8583984375, -51.279296875, -49.7001953125, -48.12109375, -46.5419921875, -44.962890625, -43.3837890625, -41.8046875, -40.2255859375, -38.646484375, -37.0673828125, -35.48828125, -33.9091796875, -32.330078125, -30.7509765625, -29.171875, -27.5927734375, -26.013671875, -24.4345703125, -22.85546875, -21.2763671875, -19.697265625, -18.1181640625, -16.5390625, -14.9599609375, -13.380859375, -11.8017578125, -10.22265625, -8.6435546875, -7.064453125, -5.4853515625, -3.90625, -2.3271484375, -0.748046875, 0.8310546875, 2.41015625, 3.9892578125, 5.568359375, 7.1474609375, 8.7265625, 10.3056640625, 11.884765625, 13.4638671875, 15.04296875, 16.6220703125, 18.201171875, 19.7802734375, 21.359375, 22.9384765625, 24.517578125, 26.0966796875, 27.67578125, 29.2548828125, 30.833984375, 32.4130859375, 33.9921875, 35.5712890625, 37.150390625, 38.7294921875, 40.30859375, 41.8876953125, 43.466796875, 45.0458984375, 46.625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 21.0, 103.0, 343.0, 351.0, 156.0, 30.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-475.1687316894531, -462.69586181640625, -450.2230224609375, -437.7501525878906, -425.27728271484375, -412.804443359375, -400.3315734863281, -387.85870361328125, -375.3858642578125, -362.9129943847656, -350.4401550292969, -337.96728515625, -325.49444580078125, -313.0215759277344, -300.5487060546875, -288.07586669921875, -275.6029968261719, -263.130126953125, -250.65728759765625, -238.18441772460938, -225.71156311035156, -213.23870849609375, -200.76583862304688, -188.29298400878906, -175.82012939453125, -163.34727478027344, -150.87442016601562, -138.40155029296875, -125.92869567871094, -113.45584106445312, -100.98297882080078, -88.51011657714844, -76.0372314453125, -63.56437301635742, -51.091514587402344, -38.618656158447266, -26.145797729492188, -13.67293930053711, -1.2000808715820312, 11.272781372070312, 23.745635986328125, 36.2184944152832, 48.69135284423828, 61.16421127319336, 73.63706970214844, 86.10992431640625, 98.5827865600586, 111.05564880371094, 123.52850341796875, 136.00135803222656, 148.47421264648438, 160.94708251953125, 173.41993713378906, 185.89279174804688, 198.36566162109375, 210.83851623535156, 223.31137084960938, 235.7842254638672, 248.257080078125, 260.7299499511719, 273.20281982421875, 285.6756591796875, 298.1485290527344, 310.62139892578125, 323.09423828125]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 4.0, 6.0, 7.0, 6.0, 9.0, 15.0, 12.0, 17.0, 24.0, 20.0, 34.0, 27.0, 36.0, 40.0, 47.0, 56.0, 53.0, 38.0, 57.0, 57.0, 42.0, 42.0, 49.0, 48.0, 30.0, 36.0, 26.0, 27.0, 36.0, 19.0, 22.0, 11.0, 10.0, 14.0, 8.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-95.26493835449219, -92.54150390625, -89.81807708740234, -87.09464263916016, -84.37120819091797, -81.64778137207031, -78.92434692382812, -76.20091247558594, -73.47747802734375, -70.75404357910156, -68.0306167602539, -65.30718231201172, -62.58374786376953, -59.86031723022461, -57.13688659667969, -54.4134521484375, -51.690025329589844, -48.96659469604492, -46.243160247802734, -43.51972961425781, -40.796295166015625, -38.0728645324707, -35.34943389892578, -32.625999450683594, -29.902568817138672, -27.179136276245117, -24.455703735351562, -21.73227310180664, -19.008840560913086, -16.28540802001953, -13.56197738647461, -10.838544845581055, -8.115119934082031, -5.391687870025635, -2.6682558059692383, 0.05517578125, 2.7786083221435547, 5.502040863037109, 8.225471496582031, 10.948904037475586, 13.67233657836914, 16.395769119262695, 19.11920166015625, 21.842632293701172, 24.566064834594727, 27.28949737548828, 30.012928009033203, 32.736358642578125, 35.45979309082031, 38.183223724365234, 40.90665817260742, 43.630088806152344, 46.35352325439453, 49.07695388793945, 51.800384521484375, 54.52381896972656, 57.247249603271484, 59.970680236816406, 62.694114685058594, 65.41754150390625, 68.14097595214844, 70.86441040039062, 73.58784484863281, 76.31127166748047, 79.03470611572266]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 6.0, 4.0, 4.0, 14.0, 6.0, 7.0, 6.0, 17.0, 9.0, 14.0, 19.0, 16.0, 21.0, 25.0, 24.0, 31.0, 32.0, 36.0, 37.0, 31.0, 33.0, 42.0, 44.0, 42.0, 37.0, 31.0, 31.0, 32.0, 31.0, 30.0, 40.0, 27.0, 28.0, 16.0, 15.0, 24.0, 22.0, 19.0, 14.0, 13.0, 14.0, 7.0, 8.0, 11.0, 7.0, 4.0, 9.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.125, -9.7969970703125, -9.468994140625, -9.1409912109375, -8.81298828125, -8.4849853515625, -8.156982421875, -7.8289794921875, -7.5009765625, -7.1729736328125, -6.844970703125, -6.5169677734375, -6.18896484375, -5.8609619140625, -5.532958984375, -5.2049560546875, -4.876953125, -4.5489501953125, -4.220947265625, -3.8929443359375, -3.56494140625, -3.2369384765625, -2.908935546875, -2.5809326171875, -2.2529296875, -1.9249267578125, -1.596923828125, -1.2689208984375, -0.94091796875, -0.6129150390625, -0.284912109375, 0.0430908203125, 0.37109375, 0.6990966796875, 1.027099609375, 1.3551025390625, 1.68310546875, 2.0111083984375, 2.339111328125, 2.6671142578125, 2.9951171875, 3.3231201171875, 3.651123046875, 3.9791259765625, 4.30712890625, 4.6351318359375, 4.963134765625, 5.2911376953125, 5.619140625, 5.9471435546875, 6.275146484375, 6.6031494140625, 6.93115234375, 7.2591552734375, 7.587158203125, 7.9151611328125, 8.2431640625, 8.5711669921875, 8.899169921875, 9.2271728515625, 9.55517578125, 9.8831787109375, 10.211181640625, 10.5391845703125, 10.8671875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 9.0, 11.0, 14.0, 24.0, 32.0, 39.0, 49.0, 88.0, 122.0, 211.0, 280.0, 438.0, 719.0, 1179.0, 1823.0, 3113.0, 5480.0, 9730.0, 17814.0, 34040.0, 66705.0, 137368.0, 255473.0, 247001.0, 131038.0, 63567.0, 32512.0, 17084.0, 9478.0, 5210.0, 3003.0, 1691.0, 1227.0, 682.0, 424.0, 286.0, 194.0, 141.0, 74.0, 62.0, 50.0, 23.0, 17.0, 14.0, 7.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4775390625, -1.4298248291015625, -1.382110595703125, -1.3343963623046875, -1.28668212890625, -1.2389678955078125, -1.191253662109375, -1.1435394287109375, -1.0958251953125, -1.0481109619140625, -1.000396728515625, -0.9526824951171875, -0.90496826171875, -0.8572540283203125, -0.809539794921875, -0.7618255615234375, -0.714111328125, -0.6663970947265625, -0.618682861328125, -0.5709686279296875, -0.52325439453125, -0.4755401611328125, -0.427825927734375, -0.3801116943359375, -0.3323974609375, -0.2846832275390625, -0.236968994140625, -0.1892547607421875, -0.14154052734375, -0.0938262939453125, -0.046112060546875, 0.0016021728515625, 0.04931640625, 0.0970306396484375, 0.144744873046875, 0.1924591064453125, 0.24017333984375, 0.2878875732421875, 0.335601806640625, 0.3833160400390625, 0.4310302734375, 0.4787445068359375, 0.526458740234375, 0.5741729736328125, 0.62188720703125, 0.6696014404296875, 0.717315673828125, 0.7650299072265625, 0.812744140625, 0.8604583740234375, 0.908172607421875, 0.9558868408203125, 1.00360107421875, 1.0513153076171875, 1.099029541015625, 1.1467437744140625, 1.1944580078125, 1.2421722412109375, 1.289886474609375, 1.3376007080078125, 1.38531494140625, 1.4330291748046875, 1.480743408203125, 1.5284576416015625, 1.576171875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 8.0, 5.0, 18.0, 19.0, 26.0, 30.0, 35.0, 24.0, 37.0, 29.0, 51.0, 51.0, 40.0, 51.0, 43.0, 1067.0, 47.0, 45.0, 53.0, 38.0, 50.0, 28.0, 36.0, 38.0, 24.0, 23.0, 24.0, 12.0, 17.0, 10.0, 11.0, 8.0, 6.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4609375, -10.1593017578125, -9.857666015625, -9.5560302734375, -9.25439453125, -8.9527587890625, -8.651123046875, -8.3494873046875, -8.0478515625, -7.7462158203125, -7.444580078125, -7.1429443359375, -6.84130859375, -6.5396728515625, -6.238037109375, -5.9364013671875, -5.634765625, -5.3331298828125, -5.031494140625, -4.7298583984375, -4.42822265625, -4.1265869140625, -3.824951171875, -3.5233154296875, -3.2216796875, -2.9200439453125, -2.618408203125, -2.3167724609375, -2.01513671875, -1.7135009765625, -1.411865234375, -1.1102294921875, -0.80859375, -0.5069580078125, -0.205322265625, 0.0963134765625, 0.39794921875, 0.6995849609375, 1.001220703125, 1.3028564453125, 1.6044921875, 1.9061279296875, 2.207763671875, 2.5093994140625, 2.81103515625, 3.1126708984375, 3.414306640625, 3.7159423828125, 4.017578125, 4.3192138671875, 4.620849609375, 4.9224853515625, 5.22412109375, 5.5257568359375, 5.827392578125, 6.1290283203125, 6.4306640625, 6.7322998046875, 7.033935546875, 7.3355712890625, 7.63720703125, 7.9388427734375, 8.240478515625, 8.5421142578125, 8.84375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 6.0, 7.0, 3.0, 17.0, 17.0, 27.0, 42.0, 77.0, 113.0, 138.0, 206.0, 303.0, 448.0, 752.0, 1047.0, 1562.0, 2496.0, 3943.0, 6366.0, 10113.0, 16593.0, 27673.0, 46345.0, 81239.0, 142735.0, 1113394.0, 331973.0, 128759.0, 72851.0, 42393.0, 25007.0, 15179.0, 9166.0, 5790.0, 3640.0, 2288.0, 1568.0, 937.0, 629.0, 434.0, 256.0, 200.0, 153.0, 80.0, 59.0, 36.0, 24.0, 17.0, 23.0, 10.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.64111328125, -0.6189346313476562, -0.5967559814453125, -0.5745773315429688, -0.552398681640625, -0.5302200317382812, -0.5080413818359375, -0.48586273193359375, -0.46368408203125, -0.44150543212890625, -0.4193267822265625, -0.39714813232421875, -0.374969482421875, -0.35279083251953125, -0.3306121826171875, -0.30843353271484375, -0.2862548828125, -0.26407623291015625, -0.2418975830078125, -0.21971893310546875, -0.197540283203125, -0.17536163330078125, -0.1531829833984375, -0.13100433349609375, -0.10882568359375, -0.08664703369140625, -0.0644683837890625, -0.04228973388671875, -0.020111083984375, 0.00206756591796875, 0.0242462158203125, 0.04642486572265625, 0.068603515625, 0.09078216552734375, 0.1129608154296875, 0.13513946533203125, 0.157318115234375, 0.17949676513671875, 0.2016754150390625, 0.22385406494140625, 0.24603271484375, 0.26821136474609375, 0.2903900146484375, 0.31256866455078125, 0.334747314453125, 0.35692596435546875, 0.3791046142578125, 0.40128326416015625, 0.4234619140625, 0.44564056396484375, 0.4678192138671875, 0.48999786376953125, 0.512176513671875, 0.5343551635742188, 0.5565338134765625, 0.5787124633789062, 0.60089111328125, 0.6230697631835938, 0.6452484130859375, 0.6674270629882812, 0.689605712890625, 0.7117843627929688, 0.7339630126953125, 0.7561416625976562, 0.7783203125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 6.0, 9.0, 5.0, 11.0, 22.0, 22.0, 35.0, 43.0, 52.0, 72.0, 173.0, 189.0, 93.0, 50.0, 44.0, 39.0, 30.0, 13.0, 17.0, 12.0, 14.0, 8.0, 6.0, 5.0, 4.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09820556640625, -0.09540462493896484, -0.09260368347167969, -0.08980274200439453, -0.08700180053710938, -0.08420085906982422, -0.08139991760253906, -0.0785989761352539, -0.07579803466796875, -0.0729970932006836, -0.07019615173339844, -0.06739521026611328, -0.06459426879882812, -0.06179332733154297, -0.05899238586425781, -0.056191444396972656, -0.0533905029296875, -0.050589561462402344, -0.04778861999511719, -0.04498767852783203, -0.042186737060546875, -0.03938579559326172, -0.03658485412597656, -0.033783912658691406, -0.03098297119140625, -0.028182029724121094, -0.025381088256835938, -0.02258014678955078, -0.019779205322265625, -0.01697826385498047, -0.014177322387695312, -0.011376380920410156, -0.008575439453125, -0.005774497985839844, -0.0029735565185546875, -0.00017261505126953125, 0.002628326416015625, 0.005429267883300781, 0.008230209350585938, 0.011031150817871094, 0.01383209228515625, 0.016633033752441406, 0.019433975219726562, 0.02223491668701172, 0.025035858154296875, 0.02783679962158203, 0.030637741088867188, 0.033438682556152344, 0.0362396240234375, 0.039040565490722656, 0.04184150695800781, 0.04464244842529297, 0.047443389892578125, 0.05024433135986328, 0.05304527282714844, 0.055846214294433594, 0.05864715576171875, 0.061448097229003906, 0.06424903869628906, 0.06704998016357422, 0.06985092163085938, 0.07265186309814453, 0.07545280456542969, 0.07825374603271484, 0.0810546875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 10.0, 13.0, 12.0, 21.0, 34.0, 26.0, 45.0, 59.0, 68.0, 116.0, 184.0, 340.0, 1528.0, 27429.0, 1004232.0, 12554.0, 1059.0, 296.0, 153.0, 109.0, 61.0, 64.0, 27.0, 26.0, 25.0, 14.0, 12.0, 11.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.30078125, -1.25653076171875, -1.2122802734375, -1.16802978515625, -1.123779296875, -1.07952880859375, -1.0352783203125, -0.99102783203125, -0.94677734375, -0.90252685546875, -0.8582763671875, -0.81402587890625, -0.769775390625, -0.72552490234375, -0.6812744140625, -0.63702392578125, -0.5927734375, -0.54852294921875, -0.5042724609375, -0.46002197265625, -0.415771484375, -0.37152099609375, -0.3272705078125, -0.28302001953125, -0.23876953125, -0.19451904296875, -0.1502685546875, -0.10601806640625, -0.061767578125, -0.01751708984375, 0.0267333984375, 0.07098388671875, 0.115234375, 0.15948486328125, 0.2037353515625, 0.24798583984375, 0.292236328125, 0.33648681640625, 0.3807373046875, 0.42498779296875, 0.46923828125, 0.51348876953125, 0.5577392578125, 0.60198974609375, 0.646240234375, 0.69049072265625, 0.7347412109375, 0.77899169921875, 0.8232421875, 0.86749267578125, 0.9117431640625, 0.95599365234375, 1.000244140625, 1.04449462890625, 1.0887451171875, 1.13299560546875, 1.17724609375, 1.22149658203125, 1.2657470703125, 1.30999755859375, 1.354248046875, 1.39849853515625, 1.4427490234375, 1.48699951171875, 1.53125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 22.0, 153.0, 786.0, 47.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1769012212753296, -1.1405539512634277, -1.1042068004608154, -1.0678595304489136, -1.0315123796463013, -0.9951651096343994, -0.9588178992271423, -0.9224706888198853, -0.8861234784126282, -0.8497762680053711, -0.813429057598114, -0.7770818471908569, -0.7407345771789551, -0.7043874263763428, -0.6680401563644409, -0.6316929459571838, -0.5953457355499268, -0.5589985251426697, -0.5226513147354126, -0.48630407452583313, -0.44995686411857605, -0.41360965371131897, -0.3772624135017395, -0.3409152030944824, -0.30456799268722534, -0.26822078227996826, -0.23187355697155, -0.1955263316631317, -0.15917912125587463, -0.12283191084861755, -0.08648468554019928, -0.050137460231781006, -0.013790130615234375, 0.022557087242603302, 0.05890430510044098, 0.09525152295827866, 0.13159874081611633, 0.1679459512233734, 0.2042931765317917, 0.24064040184020996, 0.27698761224746704, 0.3133348226547241, 0.3496820330619812, 0.38602927327156067, 0.42237648367881775, 0.45872369408607483, 0.4950709342956543, 0.5314181447029114, 0.5677653551101685, 0.6041125655174255, 0.6404597759246826, 0.6768069863319397, 0.7131541967391968, 0.7495014667510986, 0.7858486771583557, 0.8221958875656128, 0.8585430979728699, 0.894890308380127, 0.931237518787384, 0.9675847291946411, 1.003931999206543, 1.0402791500091553, 1.0766264200210571, 1.112973690032959, 1.1493208408355713]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 8.0, 4.0, 5.0, 9.0, 11.0, 17.0, 13.0, 10.0, 29.0, 19.0, 19.0, 38.0, 23.0, 33.0, 38.0, 53.0, 52.0, 27.0, 38.0, 46.0, 43.0, 28.0, 49.0, 30.0, 41.0, 33.0, 34.0, 32.0, 37.0, 29.0, 22.0, 16.0, 22.0, 14.0, 13.0, 11.0, 12.0, 12.0, 11.0, 7.0, 3.0, 1.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.13943535089492798, -0.13538265228271484, -0.13132993876934052, -0.1272772252559662, -0.12322452664375305, -0.11917182058095932, -0.11511911451816559, -0.11106640845537186, -0.10701370239257812, -0.1029609963297844, -0.09890829026699066, -0.09485558420419693, -0.0908028781414032, -0.08675017207860947, -0.08269746601581573, -0.078644759953022, -0.07459205389022827, -0.07053934782743454, -0.06648664176464081, -0.062433935701847076, -0.058381229639053345, -0.05432852357625961, -0.05027581751346588, -0.04622311145067215, -0.04217040538787842, -0.038117699325084686, -0.034064993262290955, -0.030012287199497223, -0.02595958113670349, -0.02190687507390976, -0.017854169011116028, -0.013801462948322296, -0.009748756885528564, -0.005696050822734833, -0.001643344759941101, 0.0024093613028526306, 0.006462067365646362, 0.010514773428440094, 0.014567479491233826, 0.018620185554027557, 0.02267289161682129, 0.02672559767961502, 0.030778303742408752, 0.034831009805202484, 0.038883715867996216, 0.04293642193078995, 0.04698912799358368, 0.05104183405637741, 0.05509454011917114, 0.059147246181964874, 0.0631999522447586, 0.06725265830755234, 0.07130536437034607, 0.0753580704331398, 0.07941077649593353, 0.08346348255872726, 0.087516188621521, 0.09156889468431473, 0.09562160074710846, 0.09967430680990219, 0.10372701287269592, 0.10777971893548965, 0.11183242499828339, 0.11588513106107712, 0.11993783712387085]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 4.0, 14.0, 6.0, 7.0, 6.0, 17.0, 9.0, 16.0, 17.0, 17.0, 21.0, 24.0, 24.0, 33.0, 30.0, 36.0, 36.0, 32.0, 34.0, 42.0, 41.0, 44.0, 37.0, 30.0, 32.0, 32.0, 30.0, 30.0, 40.0, 28.0, 26.0, 17.0, 16.0, 23.0, 21.0, 20.0, 15.0, 12.0, 15.0, 7.0, 7.0, 12.0, 7.0, 4.0, 9.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-10.1171875, -9.78955078125, -9.4619140625, -9.13427734375, -8.806640625, -8.47900390625, -8.1513671875, -7.82373046875, -7.49609375, -7.16845703125, -6.8408203125, -6.51318359375, -6.185546875, -5.85791015625, -5.5302734375, -5.20263671875, -4.875, -4.54736328125, -4.2197265625, -3.89208984375, -3.564453125, -3.23681640625, -2.9091796875, -2.58154296875, -2.25390625, -1.92626953125, -1.5986328125, -1.27099609375, -0.943359375, -0.61572265625, -0.2880859375, 0.03955078125, 0.3671875, 0.69482421875, 1.0224609375, 1.35009765625, 1.677734375, 2.00537109375, 2.3330078125, 2.66064453125, 2.98828125, 3.31591796875, 3.6435546875, 3.97119140625, 4.298828125, 4.62646484375, 4.9541015625, 5.28173828125, 5.609375, 5.93701171875, 6.2646484375, 6.59228515625, 6.919921875, 7.24755859375, 7.5751953125, 7.90283203125, 8.23046875, 8.55810546875, 8.8857421875, 9.21337890625, 9.541015625, 9.86865234375, 10.1962890625, 10.52392578125, 10.8515625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 9.0, 6.0, 16.0, 19.0, 16.0, 18.0, 42.0, 31.0, 51.0, 54.0, 78.0, 92.0, 122.0, 156.0, 197.0, 261.0, 334.0, 501.0, 631.0, 1064.0, 1780.0, 3064.0, 5737.0, 12099.0, 28024.0, 74291.0, 218728.0, 384708.0, 198432.0, 67692.0, 25554.0, 11223.0, 5393.0, 2881.0, 1610.0, 1049.0, 655.0, 474.0, 327.0, 260.0, 214.0, 142.0, 130.0, 75.0, 71.0, 48.0, 50.0, 38.0, 38.0, 19.0, 22.0, 13.0, 7.0, 10.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-13.1484375, -12.7166748046875, -12.284912109375, -11.8531494140625, -11.42138671875, -10.9896240234375, -10.557861328125, -10.1260986328125, -9.6943359375, -9.2625732421875, -8.830810546875, -8.3990478515625, -7.96728515625, -7.5355224609375, -7.103759765625, -6.6719970703125, -6.240234375, -5.8084716796875, -5.376708984375, -4.9449462890625, -4.51318359375, -4.0814208984375, -3.649658203125, -3.2178955078125, -2.7861328125, -2.3543701171875, -1.922607421875, -1.4908447265625, -1.05908203125, -0.6273193359375, -0.195556640625, 0.2362060546875, 0.66796875, 1.0997314453125, 1.531494140625, 1.9632568359375, 2.39501953125, 2.8267822265625, 3.258544921875, 3.6903076171875, 4.1220703125, 4.5538330078125, 4.985595703125, 5.4173583984375, 5.84912109375, 6.2808837890625, 6.712646484375, 7.1444091796875, 7.576171875, 8.0079345703125, 8.439697265625, 8.8714599609375, 9.30322265625, 9.7349853515625, 10.166748046875, 10.5985107421875, 11.0302734375, 11.4620361328125, 11.893798828125, 12.3255615234375, 12.75732421875, 13.1890869140625, 13.620849609375, 14.0526123046875, 14.484375]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 3.0, 9.0, 5.0, 11.0, 12.0, 16.0, 17.0, 15.0, 25.0, 29.0, 31.0, 44.0, 40.0, 51.0, 74.0, 118.0, 178.0, 1436.0, 339.0, 164.0, 92.0, 57.0, 49.0, 33.0, 34.0, 27.0, 26.0, 16.0, 19.0, 10.0, 14.0, 5.0, 9.0, 10.0, 4.0, 3.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-37.75, -36.568359375, -35.38671875, -34.205078125, -33.0234375, -31.841796875, -30.66015625, -29.478515625, -28.296875, -27.115234375, -25.93359375, -24.751953125, -23.5703125, -22.388671875, -21.20703125, -20.025390625, -18.84375, -17.662109375, -16.48046875, -15.298828125, -14.1171875, -12.935546875, -11.75390625, -10.572265625, -9.390625, -8.208984375, -7.02734375, -5.845703125, -4.6640625, -3.482421875, -2.30078125, -1.119140625, 0.0625, 1.244140625, 2.42578125, 3.607421875, 4.7890625, 5.970703125, 7.15234375, 8.333984375, 9.515625, 10.697265625, 11.87890625, 13.060546875, 14.2421875, 15.423828125, 16.60546875, 17.787109375, 18.96875, 20.150390625, 21.33203125, 22.513671875, 23.6953125, 24.876953125, 26.05859375, 27.240234375, 28.421875, 29.603515625, 30.78515625, 31.966796875, 33.1484375, 34.330078125, 35.51171875, 36.693359375, 37.875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 7.0, 5.0, 6.0, 9.0, 9.0, 15.0, 22.0, 30.0, 41.0, 48.0, 70.0, 102.0, 137.0, 250.0, 537.0, 1411.0, 10688.0, 2814923.0, 310744.0, 4426.0, 1018.0, 421.0, 247.0, 155.0, 111.0, 53.0, 51.0, 43.0, 26.0, 22.0, 16.0, 15.0, 9.0, 5.0, 5.0, 5.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.8125, -69.4052734375, -66.998046875, -64.5908203125, -62.18359375, -59.7763671875, -57.369140625, -54.9619140625, -52.5546875, -50.1474609375, -47.740234375, -45.3330078125, -42.92578125, -40.5185546875, -38.111328125, -35.7041015625, -33.296875, -30.8896484375, -28.482421875, -26.0751953125, -23.66796875, -21.2607421875, -18.853515625, -16.4462890625, -14.0390625, -11.6318359375, -9.224609375, -6.8173828125, -4.41015625, -2.0029296875, 0.404296875, 2.8115234375, 5.21875, 7.6259765625, 10.033203125, 12.4404296875, 14.84765625, 17.2548828125, 19.662109375, 22.0693359375, 24.4765625, 26.8837890625, 29.291015625, 31.6982421875, 34.10546875, 36.5126953125, 38.919921875, 41.3271484375, 43.734375, 46.1416015625, 48.548828125, 50.9560546875, 53.36328125, 55.7705078125, 58.177734375, 60.5849609375, 62.9921875, 65.3994140625, 67.806640625, 70.2138671875, 72.62109375, 75.0283203125, 77.435546875, 79.8427734375, 82.25]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 11.0, 149.0, 591.0, 240.0, 19.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-664.5567626953125, -649.9706420898438, -635.384521484375, -620.7984008789062, -606.2122802734375, -591.626220703125, -577.0400390625, -562.4539794921875, -547.8678588867188, -533.28173828125, -518.6956176757812, -504.1094970703125, -489.5234069824219, -474.9372863769531, -460.3511657714844, -445.7650451660156, -431.1789245605469, -416.5928039550781, -402.0066833496094, -387.42059326171875, -372.83447265625, -358.24835205078125, -343.6622314453125, -329.07611083984375, -314.489990234375, -299.90386962890625, -285.3177490234375, -270.73162841796875, -256.1455383300781, -241.55941772460938, -226.97329711914062, -212.38717651367188, -197.80108642578125, -183.2149658203125, -168.6288604736328, -154.04273986816406, -139.45663452148438, -124.87051391601562, -110.28439331054688, -95.69828033447266, -81.11216735839844, -66.52605438232422, -51.939937591552734, -37.35382080078125, -22.76770782470703, -8.181594848632812, 6.4045257568359375, 20.990638732910156, 35.576751708984375, 50.162864685058594, 64.74897766113281, 79.33509826660156, 93.92121124267578, 108.50732421875, 123.09344482421875, 137.6795654296875, 152.2656707763672, 166.85179138183594, 181.43789672851562, 196.02401733398438, 210.61013793945312, 225.1962432861328, 239.78236389160156, 254.36846923828125, 268.95458984375]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 8.0, 19.0, 23.0, 21.0, 56.0, 49.0, 54.0, 70.0, 78.0, 81.0, 72.0, 93.0, 64.0, 59.0, 65.0, 59.0, 35.0, 32.0, 27.0, 15.0, 8.0, 2.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.67172241210938, -166.9735870361328, -162.2754669189453, -157.57733154296875, -152.87921142578125, -148.1810760498047, -143.48294067382812, -138.78482055664062, -134.08668518066406, -129.3885498046875, -124.6904296875, -119.99229431152344, -115.2941665649414, -110.59603881835938, -105.89790344238281, -101.19977569580078, -96.50164794921875, -91.80352020263672, -87.10539245605469, -82.40725708007812, -77.7091293334961, -73.01100158691406, -68.3128662109375, -63.61473846435547, -58.91661071777344, -54.218482971191406, -49.52035140991211, -44.82221984863281, -40.12409210205078, -35.42596435546875, -30.727832794189453, -26.029701232910156, -21.331573486328125, -16.63344383239746, -11.935314178466797, -7.237184524536133, -2.5390548706054688, 2.1590747833251953, 6.857204437255859, 11.555335998535156, 16.253463745117188, 20.95159339904785, 25.649723052978516, 30.34785270690918, 35.045982360839844, 39.744110107421875, 44.44224166870117, 49.14037322998047, 53.8385009765625, 58.53662872314453, 63.23476028442383, 67.93289184570312, 72.63101959228516, 77.32914733886719, 82.02728271484375, 86.72541046142578, 91.42353820800781, 96.12166595458984, 100.81979370117188, 105.51792907714844, 110.21605682373047, 114.9141845703125, 119.61231994628906, 124.3104476928711, 129.00857543945312]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 0.0, 4.0, 4.0, 6.0, 8.0, 3.0, 5.0, 5.0, 6.0, 10.0, 15.0, 10.0, 16.0, 12.0, 18.0, 21.0, 22.0, 14.0, 30.0, 23.0, 34.0, 45.0, 26.0, 35.0, 34.0, 39.0, 40.0, 38.0, 41.0, 33.0, 25.0, 37.0, 41.0, 31.0, 32.0, 35.0, 20.0, 26.0, 21.0, 21.0, 16.0, 17.0, 15.0, 11.0, 14.0, 6.0, 13.0, 4.0, 6.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 5.0], "bins": [-12.0078125, -11.62744140625, -11.2470703125, -10.86669921875, -10.486328125, -10.10595703125, -9.7255859375, -9.34521484375, -8.96484375, -8.58447265625, -8.2041015625, -7.82373046875, -7.443359375, -7.06298828125, -6.6826171875, -6.30224609375, -5.921875, -5.54150390625, -5.1611328125, -4.78076171875, -4.400390625, -4.02001953125, -3.6396484375, -3.25927734375, -2.87890625, -2.49853515625, -2.1181640625, -1.73779296875, -1.357421875, -0.97705078125, -0.5966796875, -0.21630859375, 0.1640625, 0.54443359375, 0.9248046875, 1.30517578125, 1.685546875, 2.06591796875, 2.4462890625, 2.82666015625, 3.20703125, 3.58740234375, 3.9677734375, 4.34814453125, 4.728515625, 5.10888671875, 5.4892578125, 5.86962890625, 6.25, 6.63037109375, 7.0107421875, 7.39111328125, 7.771484375, 8.15185546875, 8.5322265625, 8.91259765625, 9.29296875, 9.67333984375, 10.0537109375, 10.43408203125, 10.814453125, 11.19482421875, 11.5751953125, 11.95556640625, 12.3359375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 7.0, 14.0, 9.0, 8.0, 24.0, 24.0, 35.0, 48.0, 56.0, 96.0, 133.0, 186.0, 274.0, 455.0, 796.0, 1664.0, 5070.0, 24122.0, 244108.0, 3251272.0, 610847.0, 42574.0, 7584.0, 2260.0, 981.0, 539.0, 357.0, 219.0, 154.0, 119.0, 62.0, 53.0, 35.0, 28.0, 18.0, 14.0, 8.0, 9.0, 4.0, 7.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.0625, -70.890625, -68.71875, -66.546875, -64.375, -62.203125, -60.03125, -57.859375, -55.6875, -53.515625, -51.34375, -49.171875, -47.0, -44.828125, -42.65625, -40.484375, -38.3125, -36.140625, -33.96875, -31.796875, -29.625, -27.453125, -25.28125, -23.109375, -20.9375, -18.765625, -16.59375, -14.421875, -12.25, -10.078125, -7.90625, -5.734375, -3.5625, -1.390625, 0.78125, 2.953125, 5.125, 7.296875, 9.46875, 11.640625, 13.8125, 15.984375, 18.15625, 20.328125, 22.5, 24.671875, 26.84375, 29.015625, 31.1875, 33.359375, 35.53125, 37.703125, 39.875, 42.046875, 44.21875, 46.390625, 48.5625, 50.734375, 52.90625, 55.078125, 57.25, 59.421875, 61.59375, 63.765625, 65.9375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 7.0, 11.0, 18.0, 27.0, 51.0, 51.0, 82.0, 94.0, 134.0, 197.0, 310.0, 410.0, 498.0, 519.0, 429.0, 327.0, 246.0, 179.0, 130.0, 102.0, 72.0, 58.0, 38.0, 24.0, 15.0, 11.0, 10.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-36.90625, -35.91455078125, -34.9228515625, -33.93115234375, -32.939453125, -31.94775390625, -30.9560546875, -29.96435546875, -28.97265625, -27.98095703125, -26.9892578125, -25.99755859375, -25.005859375, -24.01416015625, -23.0224609375, -22.03076171875, -21.0390625, -20.04736328125, -19.0556640625, -18.06396484375, -17.072265625, -16.08056640625, -15.0888671875, -14.09716796875, -13.10546875, -12.11376953125, -11.1220703125, -10.13037109375, -9.138671875, -8.14697265625, -7.1552734375, -6.16357421875, -5.171875, -4.18017578125, -3.1884765625, -2.19677734375, -1.205078125, -0.21337890625, 0.7783203125, 1.77001953125, 2.76171875, 3.75341796875, 4.7451171875, 5.73681640625, 6.728515625, 7.72021484375, 8.7119140625, 9.70361328125, 10.6953125, 11.68701171875, 12.6787109375, 13.67041015625, 14.662109375, 15.65380859375, 16.6455078125, 17.63720703125, 18.62890625, 19.62060546875, 20.6123046875, 21.60400390625, 22.595703125, 23.58740234375, 24.5791015625, 25.57080078125, 26.5625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 6.0, 8.0, 4.0, 4.0, 7.0, 11.0, 17.0, 12.0, 22.0, 50.0, 81.0, 162.0, 446.0, 1307.0, 4690.0, 28094.0, 262241.0, 2967154.0, 847359.0, 69353.0, 9826.0, 2148.0, 687.0, 303.0, 124.0, 55.0, 34.0, 24.0, 19.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-62.15625, -60.55078125, -58.9453125, -57.33984375, -55.734375, -54.12890625, -52.5234375, -50.91796875, -49.3125, -47.70703125, -46.1015625, -44.49609375, -42.890625, -41.28515625, -39.6796875, -38.07421875, -36.46875, -34.86328125, -33.2578125, -31.65234375, -30.046875, -28.44140625, -26.8359375, -25.23046875, -23.625, -22.01953125, -20.4140625, -18.80859375, -17.203125, -15.59765625, -13.9921875, -12.38671875, -10.78125, -9.17578125, -7.5703125, -5.96484375, -4.359375, -2.75390625, -1.1484375, 0.45703125, 2.0625, 3.66796875, 5.2734375, 6.87890625, 8.484375, 10.08984375, 11.6953125, 13.30078125, 14.90625, 16.51171875, 18.1171875, 19.72265625, 21.328125, 22.93359375, 24.5390625, 26.14453125, 27.75, 29.35546875, 30.9609375, 32.56640625, 34.171875, 35.77734375, 37.3828125, 38.98828125, 40.59375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 10.0, 9.0, 3.0, 13.0, 17.0, 23.0, 17.0, 30.0, 31.0, 46.0, 38.0, 55.0, 64.0, 60.0, 72.0, 55.0, 66.0, 62.0, 66.0, 54.0, 40.0, 33.0, 22.0, 27.0, 24.0, 18.0, 12.0, 6.0, 12.0, 9.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-194.50086975097656, -189.0660858154297, -183.63128662109375, -178.19650268554688, -172.76171875, -167.32693481445312, -161.8921356201172, -156.4573516845703, -151.02255249023438, -145.5877685546875, -140.15296936035156, -134.7181854248047, -129.2834014892578, -123.8486099243164, -118.413818359375, -112.97903442382812, -107.54425048828125, -102.10945892333984, -96.67467498779297, -91.23988342285156, -85.80509948730469, -80.37030792236328, -74.93551635742188, -69.500732421875, -64.0659408569336, -58.63115310668945, -53.19636535644531, -47.761573791503906, -42.326786041259766, -36.891998291015625, -31.45720672607422, -26.022418975830078, -20.587646484375, -15.152857780456543, -9.718069076538086, -4.2832794189453125, 1.1515083312988281, 6.586296081542969, 12.021087646484375, 17.455875396728516, 22.890663146972656, 28.325450897216797, 33.76023864746094, 39.195030212402344, 44.629817962646484, 50.064605712890625, 55.49939727783203, 60.93418502807617, 66.36897277832031, 71.80376434326172, 77.2385482788086, 82.67333984375, 88.10812377929688, 93.54291534423828, 98.97770690917969, 104.41249084472656, 109.84728240966797, 115.28207397460938, 120.71685791015625, 126.15164947509766, 131.58644104003906, 137.02122497558594, 142.45602416992188, 147.89080810546875, 153.32559204101562]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 7.0, 7.0, 6.0, 12.0, 7.0, 8.0, 11.0, 20.0, 21.0, 21.0, 28.0, 25.0, 29.0, 35.0, 46.0, 34.0, 33.0, 49.0, 39.0, 39.0, 49.0, 49.0, 46.0, 39.0, 32.0, 35.0, 37.0, 30.0, 32.0, 23.0, 21.0, 15.0, 22.0, 15.0, 7.0, 13.0, 10.0, 10.0, 8.0, 13.0, 4.0, 4.0, 5.0, 6.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.61731719970703, -123.5925064086914, -119.56768798828125, -115.54287719726562, -111.51805877685547, -107.49324798583984, -103.46842956542969, -99.44361877441406, -95.41880798339844, -91.39399719238281, -87.36917877197266, -83.34436798095703, -79.31954956054688, -75.29473876953125, -71.26992797851562, -67.24510955810547, -63.22029113769531, -59.19547653198242, -55.17066192626953, -51.145851135253906, -47.12103271484375, -43.096221923828125, -39.071407318115234, -35.046592712402344, -31.021778106689453, -26.996963500976562, -22.972148895263672, -18.947336196899414, -14.922521591186523, -10.897706985473633, -6.872894287109375, -2.8480796813964844, 1.176727294921875, 5.201541423797607, 9.22635555267334, 13.251169204711914, 17.275983810424805, 21.300798416137695, 25.325611114501953, 29.350425720214844, 33.375240325927734, 37.400054931640625, 41.424869537353516, 45.449684143066406, 49.47449493408203, 53.49931335449219, 57.52412414550781, 61.5489387512207, 65.5737533569336, 69.59856414794922, 73.62338256835938, 77.648193359375, 81.67301177978516, 85.69782257080078, 89.72264099121094, 93.74745178222656, 97.77226257324219, 101.79707336425781, 105.82189178466797, 109.8467025756836, 113.87152099609375, 117.89633178710938, 121.921142578125, 125.94596099853516, 129.9707794189453]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 5.0, 5.0, 14.0, 13.0, 18.0, 25.0, 7.0, 27.0, 26.0, 28.0, 27.0, 26.0, 42.0, 27.0, 47.0, 44.0, 52.0, 40.0, 35.0, 40.0, 47.0, 41.0, 49.0, 37.0, 36.0, 35.0, 26.0, 23.0, 21.0, 18.0, 13.0, 15.0, 16.0, 8.0, 10.0, 8.0, 14.0, 6.0, 7.0, 3.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-202.125, -195.068359375, -188.01171875, -180.955078125, -173.8984375, -166.841796875, -159.78515625, -152.728515625, -145.671875, -138.615234375, -131.55859375, -124.501953125, -117.4453125, -110.388671875, -103.33203125, -96.275390625, -89.21875, -82.162109375, -75.10546875, -68.048828125, -60.9921875, -53.935546875, -46.87890625, -39.822265625, -32.765625, -25.708984375, -18.65234375, -11.595703125, -4.5390625, 2.517578125, 9.57421875, 16.630859375, 23.6875, 30.744140625, 37.80078125, 44.857421875, 51.9140625, 58.970703125, 66.02734375, 73.083984375, 80.140625, 87.197265625, 94.25390625, 101.310546875, 108.3671875, 115.423828125, 122.48046875, 129.537109375, 136.59375, 143.650390625, 150.70703125, 157.763671875, 164.8203125, 171.876953125, 178.93359375, 185.990234375, 193.046875, 200.103515625, 207.16015625, 214.216796875, 221.2734375, 228.330078125, 235.38671875, 242.443359375, 249.5]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 13.0, 12.0, 30.0, 44.0, 60.0, 84.0, 139.0, 227.0, 349.0, 515.0, 829.0, 1346.0, 1945.0, 3136.0, 4732.0, 7234.0, 10783.0, 16071.0, 25148.0, 38240.0, 58354.0, 87557.0, 129884.0, 169065.0, 157689.0, 113964.0, 76129.0, 49929.0, 32625.0, 21411.0, 14012.0, 9158.0, 6083.0, 4029.0, 2691.0, 1808.0, 1137.0, 769.0, 513.0, 287.0, 177.0, 137.0, 81.0, 51.0, 32.0, 19.0, 10.0, 7.0, 7.0, 5.0, 3.0, 0.0, 0.0, 2.0], "bins": [-10.5234375, -10.2122802734375, -9.901123046875, -9.5899658203125, -9.27880859375, -8.9676513671875, -8.656494140625, -8.3453369140625, -8.0341796875, -7.7230224609375, -7.411865234375, -7.1007080078125, -6.78955078125, -6.4783935546875, -6.167236328125, -5.8560791015625, -5.544921875, -5.2337646484375, -4.922607421875, -4.6114501953125, -4.30029296875, -3.9891357421875, -3.677978515625, -3.3668212890625, -3.0556640625, -2.7445068359375, -2.433349609375, -2.1221923828125, -1.81103515625, -1.4998779296875, -1.188720703125, -0.8775634765625, -0.56640625, -0.2552490234375, 0.055908203125, 0.3670654296875, 0.67822265625, 0.9893798828125, 1.300537109375, 1.6116943359375, 1.9228515625, 2.2340087890625, 2.545166015625, 2.8563232421875, 3.16748046875, 3.4786376953125, 3.789794921875, 4.1009521484375, 4.412109375, 4.7232666015625, 5.034423828125, 5.3455810546875, 5.65673828125, 5.9678955078125, 6.279052734375, 6.5902099609375, 6.9013671875, 7.2125244140625, 7.523681640625, 7.8348388671875, 8.14599609375, 8.4571533203125, 8.768310546875, 9.0794677734375, 9.390625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 8.0, 8.0, 4.0, 5.0, 11.0, 20.0, 13.0, 9.0, 25.0, 23.0, 20.0, 23.0, 25.0, 18.0, 21.0, 36.0, 30.0, 37.0, 27.0, 33.0, 35.0, 37.0, 1061.0, 33.0, 40.0, 34.0, 30.0, 37.0, 31.0, 39.0, 29.0, 19.0, 28.0, 22.0, 17.0, 19.0, 28.0, 16.0, 18.0, 12.0, 6.0, 9.0, 3.0, 10.0, 2.0, 3.0, 6.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-122.1875, -118.1787109375, -114.169921875, -110.1611328125, -106.15234375, -102.1435546875, -98.134765625, -94.1259765625, -90.1171875, -86.1083984375, -82.099609375, -78.0908203125, -74.08203125, -70.0732421875, -66.064453125, -62.0556640625, -58.046875, -54.0380859375, -50.029296875, -46.0205078125, -42.01171875, -38.0029296875, -33.994140625, -29.9853515625, -25.9765625, -21.9677734375, -17.958984375, -13.9501953125, -9.94140625, -5.9326171875, -1.923828125, 2.0849609375, 6.09375, 10.1025390625, 14.111328125, 18.1201171875, 22.12890625, 26.1376953125, 30.146484375, 34.1552734375, 38.1640625, 42.1728515625, 46.181640625, 50.1904296875, 54.19921875, 58.2080078125, 62.216796875, 66.2255859375, 70.234375, 74.2431640625, 78.251953125, 82.2607421875, 86.26953125, 90.2783203125, 94.287109375, 98.2958984375, 102.3046875, 106.3134765625, 110.322265625, 114.3310546875, 118.33984375, 122.3486328125, 126.357421875, 130.3662109375, 134.375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 9.0, 8.0, 8.0, 16.0, 25.0, 49.0, 73.0, 111.0, 163.0, 229.0, 332.0, 532.0, 841.0, 1219.0, 1817.0, 2857.0, 4403.0, 6877.0, 10676.0, 17414.0, 28020.0, 46223.0, 75079.0, 117245.0, 167190.0, 1229433.0, 140743.0, 92970.0, 57786.0, 35689.0, 21793.0, 13430.0, 8399.0, 5364.0, 3471.0, 2252.0, 1511.0, 997.0, 645.0, 451.0, 259.0, 179.0, 134.0, 86.0, 47.0, 33.0, 18.0, 15.0, 7.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1328125, -7.8724365234375, -7.612060546875, -7.3516845703125, -7.09130859375, -6.8309326171875, -6.570556640625, -6.3101806640625, -6.0498046875, -5.7894287109375, -5.529052734375, -5.2686767578125, -5.00830078125, -4.7479248046875, -4.487548828125, -4.2271728515625, -3.966796875, -3.7064208984375, -3.446044921875, -3.1856689453125, -2.92529296875, -2.6649169921875, -2.404541015625, -2.1441650390625, -1.8837890625, -1.6234130859375, -1.363037109375, -1.1026611328125, -0.84228515625, -0.5819091796875, -0.321533203125, -0.0611572265625, 0.19921875, 0.4595947265625, 0.719970703125, 0.9803466796875, 1.24072265625, 1.5010986328125, 1.761474609375, 2.0218505859375, 2.2822265625, 2.5426025390625, 2.802978515625, 3.0633544921875, 3.32373046875, 3.5841064453125, 3.844482421875, 4.1048583984375, 4.365234375, 4.6256103515625, 4.885986328125, 5.1463623046875, 5.40673828125, 5.6671142578125, 5.927490234375, 6.1878662109375, 6.4482421875, 6.7086181640625, 6.968994140625, 7.2293701171875, 7.48974609375, 7.7501220703125, 8.010498046875, 8.2708740234375, 8.53125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 5.0, 5.0, 2.0, 10.0, 8.0, 9.0, 8.0, 11.0, 14.0, 25.0, 16.0, 31.0, 47.0, 40.0, 35.0, 41.0, 54.0, 46.0, 43.0, 49.0, 39.0, 43.0, 37.0, 32.0, 36.0, 40.0, 44.0, 31.0, 44.0, 29.0, 23.0, 13.0, 17.0, 16.0, 6.0, 12.0, 7.0, 8.0, 13.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.080322265625, -0.07778644561767578, -0.07525062561035156, -0.07271480560302734, -0.07017898559570312, -0.0676431655883789, -0.06510734558105469, -0.06257152557373047, -0.06003570556640625, -0.05749988555908203, -0.05496406555175781, -0.052428245544433594, -0.049892425537109375, -0.047356605529785156, -0.04482078552246094, -0.04228496551513672, -0.0397491455078125, -0.03721332550048828, -0.03467750549316406, -0.032141685485839844, -0.029605865478515625, -0.027070045471191406, -0.024534225463867188, -0.02199840545654297, -0.01946258544921875, -0.01692676544189453, -0.014390945434570312, -0.011855125427246094, -0.009319305419921875, -0.006783485412597656, -0.0042476654052734375, -0.0017118453979492188, 0.000823974609375, 0.0033597946166992188, 0.0058956146240234375, 0.008431434631347656, 0.010967254638671875, 0.013503074645996094, 0.016038894653320312, 0.01857471466064453, 0.02111053466796875, 0.02364635467529297, 0.026182174682617188, 0.028717994689941406, 0.031253814697265625, 0.033789634704589844, 0.03632545471191406, 0.03886127471923828, 0.0413970947265625, 0.04393291473388672, 0.04646873474121094, 0.049004554748535156, 0.051540374755859375, 0.054076194763183594, 0.05661201477050781, 0.05914783477783203, 0.06168365478515625, 0.06421947479248047, 0.06675529479980469, 0.0692911148071289, 0.07182693481445312, 0.07436275482177734, 0.07689857482910156, 0.07943439483642578, 0.08197021484375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 8.0, 8.0, 5.0, 17.0, 31.0, 39.0, 43.0, 80.0, 108.0, 184.0, 270.0, 448.0, 828.0, 1381.0, 2764.0, 5610.0, 12385.0, 28610.0, 68096.0, 167438.0, 359454.0, 234856.0, 94404.0, 39158.0, 17017.0, 7488.0, 3513.0, 1813.0, 968.0, 560.0, 357.0, 193.0, 139.0, 93.0, 55.0, 36.0, 37.0, 30.0, 10.0, 4.0, 6.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.442626953125, -0.42865753173828125, -0.4146881103515625, -0.40071868896484375, -0.386749267578125, -0.37277984619140625, -0.3588104248046875, -0.34484100341796875, -0.33087158203125, -0.31690216064453125, -0.3029327392578125, -0.28896331787109375, -0.274993896484375, -0.26102447509765625, -0.2470550537109375, -0.23308563232421875, -0.2191162109375, -0.20514678955078125, -0.1911773681640625, -0.17720794677734375, -0.163238525390625, -0.14926910400390625, -0.1352996826171875, -0.12133026123046875, -0.10736083984375, -0.09339141845703125, -0.0794219970703125, -0.06545257568359375, -0.051483154296875, -0.03751373291015625, -0.0235443115234375, -0.00957489013671875, 0.00439453125, 0.01836395263671875, 0.0323333740234375, 0.04630279541015625, 0.060272216796875, 0.07424163818359375, 0.0882110595703125, 0.10218048095703125, 0.11614990234375, 0.13011932373046875, 0.1440887451171875, 0.15805816650390625, 0.172027587890625, 0.18599700927734375, 0.1999664306640625, 0.21393585205078125, 0.2279052734375, 0.24187469482421875, 0.2558441162109375, 0.26981353759765625, 0.283782958984375, 0.29775238037109375, 0.3117218017578125, 0.32569122314453125, 0.33966064453125, 0.35363006591796875, 0.3675994873046875, 0.38156890869140625, 0.395538330078125, 0.40950775146484375, 0.4234771728515625, 0.43744659423828125, 0.451416015625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 9.0, 6.0, 12.0, 4.0, 12.0, 10.0, 16.0, 9.0, 18.0, 20.0, 47.0, 82.0, 78.0, 122.0, 118.0, 127.0, 90.0, 72.0, 42.0, 32.0, 20.0, 14.0, 17.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.536999523639679, -0.5258423686027527, -0.5146851539611816, -0.5035279989242554, -0.4923708438873291, -0.48121365904808044, -0.4700564742088318, -0.4588993191719055, -0.44774213433265686, -0.4365849494934082, -0.42542779445648193, -0.4142706096172333, -0.4031134247779846, -0.39195626974105835, -0.3807990849018097, -0.36964190006256104, -0.35848474502563477, -0.3473275601863861, -0.33617040514945984, -0.3250132203102112, -0.3138560652732849, -0.30269888043403625, -0.2915416955947876, -0.28038454055786133, -0.26922735571861267, -0.258070170879364, -0.24691301584243774, -0.2357558310031891, -0.22459866106510162, -0.21344149112701416, -0.2022843062877655, -0.19112713634967804, -0.1799699366092682, -0.16881276667118073, -0.15765559673309326, -0.1464984118938446, -0.13534124195575714, -0.12418407201766968, -0.11302689462900162, -0.10186971724033356, -0.0907125473022461, -0.07955537736415863, -0.06839819997549057, -0.05724102631211281, -0.046083852648735046, -0.034926678985357285, -0.023769505321979523, -0.012612327933311462, -0.001455157995223999, 0.009702015668153763, 0.020859189331531525, 0.032016362994909286, 0.04317353665828705, 0.05433071032166481, 0.06548788398504257, 0.07664506137371063, 0.0878022313117981, 0.09895940124988556, 0.11011657863855362, 0.12127375602722168, 0.13243092596530914, 0.1435880959033966, 0.15474528074264526, 0.16590245068073273, 0.1770596206188202]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 8.0, 1.0, 8.0, 7.0, 11.0, 13.0, 12.0, 10.0, 16.0, 14.0, 14.0, 20.0, 24.0, 27.0, 23.0, 36.0, 26.0, 30.0, 27.0, 37.0, 39.0, 30.0, 28.0, 23.0, 43.0, 31.0, 29.0, 27.0, 34.0, 28.0, 40.0, 24.0, 33.0, 16.0, 26.0, 21.0, 28.0, 28.0, 18.0, 17.0, 12.0, 15.0, 11.0, 13.0, 13.0, 6.0, 4.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.21002990007400513, -0.20393536984920502, -0.1978408396244049, -0.1917463093996048, -0.1856517791748047, -0.17955724895000458, -0.17346271872520447, -0.16736818850040436, -0.16127365827560425, -0.15517912805080414, -0.14908459782600403, -0.14299006760120392, -0.1368955373764038, -0.1308010071516037, -0.12470647692680359, -0.11861194670200348, -0.11251741647720337, -0.10642288625240326, -0.10032835602760315, -0.09423382580280304, -0.08813929557800293, -0.08204476535320282, -0.07595023512840271, -0.0698557049036026, -0.06376117467880249, -0.05766664445400238, -0.05157211422920227, -0.04547758400440216, -0.03938305377960205, -0.03328852355480194, -0.02719399333000183, -0.02109946310520172, -0.015004932880401611, -0.008910402655601501, -0.0028158724308013916, 0.0032786577939987183, 0.009373188018798828, 0.015467718243598938, 0.021562248468399048, 0.027656778693199158, 0.03375130891799927, 0.03984583914279938, 0.04594036936759949, 0.0520348995923996, 0.05812942981719971, 0.06422396004199982, 0.07031849026679993, 0.07641302049160004, 0.08250755071640015, 0.08860208094120026, 0.09469661116600037, 0.10079114139080048, 0.10688567161560059, 0.1129802018404007, 0.1190747320652008, 0.12516926229000092, 0.13126379251480103, 0.13735832273960114, 0.14345285296440125, 0.14954738318920135, 0.15564191341400146, 0.16173644363880157, 0.16783097386360168, 0.1739255040884018, 0.1800200343132019]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 6.0, 10.0, 10.0, 13.0, 20.0, 22.0, 11.0, 30.0, 20.0, 30.0, 29.0, 22.0, 46.0, 25.0, 47.0, 50.0, 47.0, 40.0, 32.0, 41.0, 49.0, 38.0, 50.0, 38.0, 36.0, 31.0, 27.0, 27.0, 18.0, 16.0, 13.0, 15.0, 16.0, 10.0, 9.0, 8.0, 13.0, 6.0, 7.0, 3.0, 1.0, 5.0, 2.0, 0.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-200.375, -193.35546875, -186.3359375, -179.31640625, -172.296875, -165.27734375, -158.2578125, -151.23828125, -144.21875, -137.19921875, -130.1796875, -123.16015625, -116.140625, -109.12109375, -102.1015625, -95.08203125, -88.0625, -81.04296875, -74.0234375, -67.00390625, -59.984375, -52.96484375, -45.9453125, -38.92578125, -31.90625, -24.88671875, -17.8671875, -10.84765625, -3.828125, 3.19140625, 10.2109375, 17.23046875, 24.25, 31.26953125, 38.2890625, 45.30859375, 52.328125, 59.34765625, 66.3671875, 73.38671875, 80.40625, 87.42578125, 94.4453125, 101.46484375, 108.484375, 115.50390625, 122.5234375, 129.54296875, 136.5625, 143.58203125, 150.6015625, 157.62109375, 164.640625, 171.66015625, 178.6796875, 185.69921875, 192.71875, 199.73828125, 206.7578125, 213.77734375, 220.796875, 227.81640625, 234.8359375, 241.85546875, 248.875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 3.0, 7.0, 6.0, 12.0, 15.0, 17.0, 29.0, 36.0, 38.0, 57.0, 78.0, 80.0, 129.0, 178.0, 301.0, 571.0, 1321.0, 4206.0, 19155.0, 132343.0, 592062.0, 252899.0, 35036.0, 6377.0, 1758.0, 706.0, 361.0, 235.0, 142.0, 89.0, 67.0, 40.0, 47.0, 29.0, 32.0, 15.0, 15.0, 9.0, 14.0, 12.0, 7.0, 3.0, 2.0, 2.0, 8.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.3125, -37.94091796875, -36.5693359375, -35.19775390625, -33.826171875, -32.45458984375, -31.0830078125, -29.71142578125, -28.33984375, -26.96826171875, -25.5966796875, -24.22509765625, -22.853515625, -21.48193359375, -20.1103515625, -18.73876953125, -17.3671875, -15.99560546875, -14.6240234375, -13.25244140625, -11.880859375, -10.50927734375, -9.1376953125, -7.76611328125, -6.39453125, -5.02294921875, -3.6513671875, -2.27978515625, -0.908203125, 0.46337890625, 1.8349609375, 3.20654296875, 4.578125, 5.94970703125, 7.3212890625, 8.69287109375, 10.064453125, 11.43603515625, 12.8076171875, 14.17919921875, 15.55078125, 16.92236328125, 18.2939453125, 19.66552734375, 21.037109375, 22.40869140625, 23.7802734375, 25.15185546875, 26.5234375, 27.89501953125, 29.2666015625, 30.63818359375, 32.009765625, 33.38134765625, 34.7529296875, 36.12451171875, 37.49609375, 38.86767578125, 40.2392578125, 41.61083984375, 42.982421875, 44.35400390625, 45.7255859375, 47.09716796875, 48.46875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 6.0, 16.0, 10.0, 15.0, 13.0, 20.0, 23.0, 44.0, 45.0, 51.0, 69.0, 68.0, 72.0, 2109.0, 77.0, 80.0, 49.0, 57.0, 45.0, 42.0, 44.0, 29.0, 18.0, 17.0, 7.0, 8.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-581.5, -566.46484375, -551.4296875, -536.39453125, -521.359375, -506.32421875, -491.2890625, -476.25390625, -461.21875, -446.18359375, -431.1484375, -416.11328125, -401.078125, -386.04296875, -371.0078125, -355.97265625, -340.9375, -325.90234375, -310.8671875, -295.83203125, -280.796875, -265.76171875, -250.7265625, -235.69140625, -220.65625, -205.62109375, -190.5859375, -175.55078125, -160.515625, -145.48046875, -130.4453125, -115.41015625, -100.375, -85.33984375, -70.3046875, -55.26953125, -40.234375, -25.19921875, -10.1640625, 4.87109375, 19.90625, 34.94140625, 49.9765625, 65.01171875, 80.046875, 95.08203125, 110.1171875, 125.15234375, 140.1875, 155.22265625, 170.2578125, 185.29296875, 200.328125, 215.36328125, 230.3984375, 245.43359375, 260.46875, 275.50390625, 290.5390625, 305.57421875, 320.609375, 335.64453125, 350.6796875, 365.71484375, 380.75]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 4.0, 4.0, 8.0, 11.0, 13.0, 15.0, 27.0, 43.0, 57.0, 117.0, 172.0, 340.0, 706.0, 1646.0, 6081.0, 57493.0, 2732776.0, 319892.0, 20664.0, 3363.0, 1145.0, 464.0, 255.0, 152.0, 96.0, 54.0, 34.0, 23.0, 17.0, 15.0, 8.0, 5.0, 2.0, 1.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.34375, -44.83935546875, -43.3349609375, -41.83056640625, -40.326171875, -38.82177734375, -37.3173828125, -35.81298828125, -34.30859375, -32.80419921875, -31.2998046875, -29.79541015625, -28.291015625, -26.78662109375, -25.2822265625, -23.77783203125, -22.2734375, -20.76904296875, -19.2646484375, -17.76025390625, -16.255859375, -14.75146484375, -13.2470703125, -11.74267578125, -10.23828125, -8.73388671875, -7.2294921875, -5.72509765625, -4.220703125, -2.71630859375, -1.2119140625, 0.29248046875, 1.796875, 3.30126953125, 4.8056640625, 6.31005859375, 7.814453125, 9.31884765625, 10.8232421875, 12.32763671875, 13.83203125, 15.33642578125, 16.8408203125, 18.34521484375, 19.849609375, 21.35400390625, 22.8583984375, 24.36279296875, 25.8671875, 27.37158203125, 28.8759765625, 30.38037109375, 31.884765625, 33.38916015625, 34.8935546875, 36.39794921875, 37.90234375, 39.40673828125, 40.9111328125, 42.41552734375, 43.919921875, 45.42431640625, 46.9287109375, 48.43310546875, 49.9375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 8.0, 13.0, 24.0, 34.0, 62.0, 162.0, 215.0, 210.0, 123.0, 58.0, 25.0, 19.0, 17.0, 9.0, 6.0, 9.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-657.27001953125, -634.3551635742188, -611.4402465820312, -588.525390625, -565.6104736328125, -542.6956176757812, -519.78076171875, -496.8658752441406, -473.95098876953125, -451.0361022949219, -428.1212158203125, -405.20635986328125, -382.2914733886719, -359.3765869140625, -336.46173095703125, -313.5468444824219, -290.6319580078125, -267.7170715332031, -244.8022003173828, -221.8873291015625, -198.97244262695312, -176.05755615234375, -153.14268493652344, -130.22781372070312, -107.31292724609375, -84.3980484008789, -61.48316955566406, -38.56829071044922, -15.653411865234375, 7.261466979980469, 30.176345825195312, 53.091217041015625, 76.00604248046875, 98.9209213256836, 121.83580017089844, 144.75067138671875, 167.66555786132812, 190.5804443359375, 213.4953155517578, 236.41018676757812, 259.3250732421875, 282.2399597167969, 305.15484619140625, 328.0697021484375, 350.9845886230469, 373.89947509765625, 396.8143310546875, 419.7292175292969, 442.64410400390625, 465.5589904785156, 488.473876953125, 511.38873291015625, 534.3035888671875, 557.218505859375, 580.1333618164062, 603.0482177734375, 625.963134765625, 648.8779907226562, 671.7929077148438, 694.707763671875, 717.6226806640625, 740.5375366210938, 763.452392578125, 786.3673095703125, 809.2821655273438]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 3.0, 3.0, 5.0, 4.0, 8.0, 5.0, 13.0, 12.0, 15.0, 18.0, 18.0, 17.0, 25.0, 30.0, 25.0, 40.0, 45.0, 33.0, 32.0, 30.0, 35.0, 47.0, 45.0, 30.0, 42.0, 37.0, 34.0, 31.0, 35.0, 33.0, 30.0, 30.0, 31.0, 16.0, 12.0, 11.0, 15.0, 20.0, 14.0, 9.0, 13.0, 10.0, 8.0, 7.0, 12.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0], "bins": [-464.2268371582031, -450.50079345703125, -436.7747497558594, -423.0487060546875, -409.3226623535156, -395.59661865234375, -381.87060546875, -368.14453125, -354.41851806640625, -340.6924743652344, -326.9664306640625, -313.2403869628906, -299.51434326171875, -285.7882995605469, -272.062255859375, -258.33624267578125, -244.61016845703125, -230.88412475585938, -217.1580810546875, -203.43203735351562, -189.70599365234375, -175.97994995117188, -162.25392150878906, -148.5278778076172, -134.8018341064453, -121.07579040527344, -107.34974670410156, -93.62371063232422, -79.89766693115234, -66.17162322998047, -52.445587158203125, -38.71954345703125, -24.9935302734375, -11.267488479614258, 2.4585533142089844, 16.184593200683594, 29.91063690185547, 43.636680603027344, 57.36271667480469, 71.08876037597656, 84.81480407714844, 98.54084777832031, 112.26689147949219, 125.99292755126953, 139.71896362304688, 153.44500732421875, 167.17105102539062, 180.8970947265625, 194.62313842773438, 208.34918212890625, 222.07522583007812, 235.80126953125, 249.52731323242188, 263.25335693359375, 276.9793701171875, 290.7054443359375, 304.43145751953125, 318.1575012207031, 331.883544921875, 345.6095886230469, 359.33563232421875, 373.0616760253906, 386.7877197265625, 400.51373291015625, 414.23980712890625]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 9.0, 17.0, 19.0, 16.0, 20.0, 34.0, 44.0, 62.0, 73.0, 87.0, 114.0, 132.0, 164.0, 187.0, 234.0, 295.0, 392.0, 572.0, 878.0, 1570.0, 3181.0, 6687.0, 1019128.0, 6599.0, 3154.0, 1617.0, 860.0, 539.0, 383.0, 293.0, 229.0, 166.0, 170.0, 145.0, 103.0, 80.0, 60.0, 57.0, 39.0, 33.0, 23.0, 9.0, 18.0, 13.0, 16.0, 9.0, 1.0, 9.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-95.81563568115234, -92.77223205566406, -89.72882843017578, -86.6854248046875, -83.64202117919922, -80.59861755371094, -77.55521392822266, -74.51181030273438, -71.4684066772461, -68.42500305175781, -65.38159942626953, -62.33819580078125, -59.29479217529297, -56.25138854980469, -53.207984924316406, -50.164581298828125, -47.12118148803711, -44.07777786254883, -41.03437423706055, -37.990970611572266, -34.947566986083984, -31.904163360595703, -28.860761642456055, -25.817358016967773, -22.773954391479492, -19.73055076599121, -16.68714714050293, -13.643744468688965, -10.600340843200684, -7.556937217712402, -4.5135345458984375, -1.4701309204101562, 1.573272705078125, 4.616676330566406, 7.660079479217529, 10.703482627868652, 13.746886253356934, 16.79029083251953, 19.83369255065918, 22.87709617614746, 25.920499801635742, 28.963903427124023, 32.00730514526367, 35.05070877075195, 38.094112396240234, 41.137516021728516, 44.1809196472168, 47.22432327270508, 50.26772689819336, 53.31113052368164, 56.35453414916992, 59.3979377746582, 62.441341400146484, 65.4847412109375, 68.52814483642578, 71.57154846191406, 74.61495208740234, 77.65835571289062, 80.7017593383789, 83.74516296386719, 86.78856658935547, 89.83197021484375, 92.87537384033203, 95.91877746582031, 98.9621810913086]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 13.0, 18.0, 38.0, 81.0, 204.0, 23650.0, 51438904.0, 151.0, 43.0, 24.0, 22.0, 11.0, 7.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1442.74267578125, -1352.977294921875, -1263.2119140625, -1173.446533203125, -1083.6812744140625, -993.9158935546875, -904.1505126953125, -814.3851928710938, -724.6198120117188, -634.8544311523438, -545.089111328125, -455.32373046875, -365.5583801269531, -275.79302978515625, -186.02764892578125, -96.2623291015625, -6.4969482421875, 83.2684097290039, 173.0337677001953, 262.79913330078125, 352.5644836425781, 442.329833984375, 532.09521484375, 621.8605346679688, 711.6259155273438, 801.3912963867188, 891.1566162109375, 980.9219970703125, 1070.6873779296875, 1160.45263671875, 1250.218017578125, 1339.9833984375, 1429.748779296875, 1519.51416015625, 1609.279541015625, 1699.044921875, 1788.8101806640625, 1878.5755615234375, 1968.3409423828125, 2058.106201171875, 2147.87158203125, 2237.636962890625, 2327.40234375, 2417.167724609375, 2506.93310546875, 2596.6982421875, 2686.4638671875, 2776.22900390625, 2865.99462890625, 2955.760009765625, 3045.525390625, 3135.290771484375, 3225.05615234375, 3314.8212890625, 3404.5869140625, 3494.35205078125, 3584.117431640625, 3673.8828125, 3763.648193359375, 3853.41357421875, 3943.178955078125, 4032.9443359375, 4122.70947265625, 4212.47509765625, 4302.240234375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 10.0, 6.0, 8.0, 7.0, 14.0, 24.0, 38.0, 61.0, 96.0, 123.0, 180.0, 288.0, 510.0, 825.0, 1243.0, 1867.0, 2953.0, 4557.0, 7005.0, 11123.0, 17339.0, 27194.0, 44026.0, 70579.0, 113621.0, 180721.0, 280320.0, 411455.0, 3328278.0, 767803.0, 362849.0, 243711.0, 153860.0, 96928.0, 59570.0, 37102.0, 23400.0, 14909.0, 9447.0, 6230.0, 3964.0, 2530.0, 1568.0, 1042.0, 701.0, 459.0, 315.0, 216.0, 143.0, 84.0, 53.0, 36.0, 28.0, 12.0, 10.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.125, -2.05377197265625, -1.9825439453125, -1.91131591796875, -1.840087890625, -1.76885986328125, -1.6976318359375, -1.62640380859375, -1.55517578125, -1.48394775390625, -1.4127197265625, -1.34149169921875, -1.270263671875, -1.19903564453125, -1.1278076171875, -1.05657958984375, -0.9853515625, -0.91412353515625, -0.8428955078125, -0.77166748046875, -0.700439453125, -0.62921142578125, -0.5579833984375, -0.48675537109375, -0.41552734375, -0.34429931640625, -0.2730712890625, -0.20184326171875, -0.130615234375, -0.05938720703125, 0.0118408203125, 0.08306884765625, 0.154296875, 0.22552490234375, 0.2967529296875, 0.36798095703125, 0.439208984375, 0.51043701171875, 0.5816650390625, 0.65289306640625, 0.72412109375, 0.79534912109375, 0.8665771484375, 0.93780517578125, 1.009033203125, 1.08026123046875, 1.1514892578125, 1.22271728515625, 1.2939453125, 1.36517333984375, 1.4364013671875, 1.50762939453125, 1.578857421875, 1.65008544921875, 1.7213134765625, 1.79254150390625, 1.86376953125, 1.93499755859375, 2.0062255859375, 2.07745361328125, 2.148681640625, 2.21990966796875, 2.2911376953125, 2.36236572265625, 2.43359375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 9.0, 4.0, 3.0, 6.0, 11.0, 9.0, 11.0, 17.0, 26.0, 23.0, 28.0, 23.0, 31.0, 28.0, 40.0, 41.0, 48.0, 54.0, 48.0, 73.0, 1031.0, 54.0, 41.0, 49.0, 31.0, 39.0, 37.0, 34.0, 26.0, 23.0, 21.0, 14.0, 21.0, 12.0, 13.0, 9.0, 9.0, 7.0, 6.0, 8.0, 4.0, 1.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-60.25, -58.32958984375, -56.4091796875, -54.48876953125, -52.568359375, -50.64794921875, -48.7275390625, -46.80712890625, -44.88671875, -42.96630859375, -41.0458984375, -39.12548828125, -37.205078125, -35.28466796875, -33.3642578125, -31.44384765625, -29.5234375, -27.60302734375, -25.6826171875, -23.76220703125, -21.841796875, -19.92138671875, -18.0009765625, -16.08056640625, -14.16015625, -12.23974609375, -10.3193359375, -8.39892578125, -6.478515625, -4.55810546875, -2.6376953125, -0.71728515625, 1.203125, 3.12353515625, 5.0439453125, 6.96435546875, 8.884765625, 10.80517578125, 12.7255859375, 14.64599609375, 16.56640625, 18.48681640625, 20.4072265625, 22.32763671875, 24.248046875, 26.16845703125, 28.0888671875, 30.00927734375, 31.9296875, 33.85009765625, 35.7705078125, 37.69091796875, 39.611328125, 41.53173828125, 43.4521484375, 45.37255859375, 47.29296875, 49.21337890625, 51.1337890625, 53.05419921875, 54.974609375, 56.89501953125, 58.8154296875, 60.73583984375, 62.65625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 3.0, 16.0, 25.0, 22.0, 43.0, 83.0, 97.0, 172.0, 251.0, 442.0, 695.0, 1101.0, 1666.0, 2532.0, 4058.0, 6341.0, 9935.0, 15322.0, 24697.0, 38299.0, 60766.0, 95421.0, 148210.0, 222687.0, 319264.0, 467347.0, 3515863.0, 437152.0, 310837.0, 215159.0, 141451.0, 91593.0, 57698.0, 36633.0, 23601.0, 15198.0, 9602.0, 6113.0, 3918.0, 2620.0, 1733.0, 1069.0, 666.0, 371.0, 252.0, 142.0, 106.0, 58.0, 38.0, 29.0, 18.0, 5.0, 14.0, 6.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.6826171875, -1.6273651123046875, -1.572113037109375, -1.5168609619140625, -1.46160888671875, -1.4063568115234375, -1.351104736328125, -1.2958526611328125, -1.2406005859375, -1.1853485107421875, -1.130096435546875, -1.0748443603515625, -1.01959228515625, -0.9643402099609375, -0.909088134765625, -0.8538360595703125, -0.798583984375, -0.7433319091796875, -0.688079833984375, -0.6328277587890625, -0.57757568359375, -0.5223236083984375, -0.467071533203125, -0.4118194580078125, -0.3565673828125, -0.3013153076171875, -0.246063232421875, -0.1908111572265625, -0.13555908203125, -0.0803070068359375, -0.025054931640625, 0.0301971435546875, 0.08544921875, 0.1407012939453125, 0.195953369140625, 0.2512054443359375, 0.30645751953125, 0.3617095947265625, 0.416961669921875, 0.4722137451171875, 0.5274658203125, 0.5827178955078125, 0.637969970703125, 0.6932220458984375, 0.74847412109375, 0.8037261962890625, 0.858978271484375, 0.9142303466796875, 0.969482421875, 1.0247344970703125, 1.079986572265625, 1.1352386474609375, 1.19049072265625, 1.2457427978515625, 1.300994873046875, 1.3562469482421875, 1.4114990234375, 1.4667510986328125, 1.522003173828125, 1.5772552490234375, 1.63250732421875, 1.6877593994140625, 1.743011474609375, 1.7982635498046875, 1.853515625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 7.0, 2.0, 11.0, 11.0, 5.0, 9.0, 11.0, 16.0, 11.0, 20.0, 14.0, 23.0, 31.0, 30.0, 28.0, 25.0, 42.0, 45.0, 38.0, 50.0, 36.0, 42.0, 1037.0, 55.0, 50.0, 33.0, 45.0, 34.0, 28.0, 32.0, 28.0, 24.0, 22.0, 22.0, 25.0, 12.0, 17.0, 12.0, 12.0, 13.0, 6.0, 6.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.75, -43.28662109375, -41.8232421875, -40.35986328125, -38.896484375, -37.43310546875, -35.9697265625, -34.50634765625, -33.04296875, -31.57958984375, -30.1162109375, -28.65283203125, -27.189453125, -25.72607421875, -24.2626953125, -22.79931640625, -21.3359375, -19.87255859375, -18.4091796875, -16.94580078125, -15.482421875, -14.01904296875, -12.5556640625, -11.09228515625, -9.62890625, -8.16552734375, -6.7021484375, -5.23876953125, -3.775390625, -2.31201171875, -0.8486328125, 0.61474609375, 2.078125, 3.54150390625, 5.0048828125, 6.46826171875, 7.931640625, 9.39501953125, 10.8583984375, 12.32177734375, 13.78515625, 15.24853515625, 16.7119140625, 18.17529296875, 19.638671875, 21.10205078125, 22.5654296875, 24.02880859375, 25.4921875, 26.95556640625, 28.4189453125, 29.88232421875, 31.345703125, 32.80908203125, 34.2724609375, 35.73583984375, 37.19921875, 38.66259765625, 40.1259765625, 41.58935546875, 43.052734375, 44.51611328125, 45.9794921875, 47.44287109375, 48.90625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 5.0, 4.0, 7.0, 19.0, 8.0, 16.0, 34.0, 31.0, 54.0, 52.0, 74.0, 87.0, 122.0, 197.0, 299.0, 540.0, 864.0, 1750.0, 4314.0, 13810.0, 69257.0, 5911839.0, 237554.0, 35492.0, 8691.0, 2964.0, 1346.0, 644.0, 440.0, 274.0, 193.0, 120.0, 78.0, 80.0, 62.0, 39.0, 20.0, 12.0, 15.0, 9.0, 4.0, 1.0, 7.0, 6.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-17.890625, -17.4046630859375, -16.918701171875, -16.4327392578125, -15.94677734375, -15.4608154296875, -14.974853515625, -14.4888916015625, -14.0029296875, -13.5169677734375, -13.031005859375, -12.5450439453125, -12.05908203125, -11.5731201171875, -11.087158203125, -10.6011962890625, -10.115234375, -9.6292724609375, -9.143310546875, -8.6573486328125, -8.17138671875, -7.6854248046875, -7.199462890625, -6.7135009765625, -6.2275390625, -5.7415771484375, -5.255615234375, -4.7696533203125, -4.28369140625, -3.7977294921875, -3.311767578125, -2.8258056640625, -2.33984375, -1.8538818359375, -1.367919921875, -0.8819580078125, -0.39599609375, 0.0899658203125, 0.575927734375, 1.0618896484375, 1.5478515625, 2.0338134765625, 2.519775390625, 3.0057373046875, 3.49169921875, 3.9776611328125, 4.463623046875, 4.9495849609375, 5.435546875, 5.9215087890625, 6.407470703125, 6.8934326171875, 7.37939453125, 7.8653564453125, 8.351318359375, 8.8372802734375, 9.3232421875, 9.8092041015625, 10.295166015625, 10.7811279296875, 11.26708984375, 11.7530517578125, 12.239013671875, 12.7249755859375, 13.2109375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 8.0, 9.0, 11.0, 10.0, 20.0, 7.0, 15.0, 20.0, 13.0, 27.0, 25.0, 34.0, 26.0, 27.0, 41.0, 34.0, 49.0, 36.0, 48.0, 1030.0, 78.0, 44.0, 49.0, 47.0, 43.0, 26.0, 39.0, 28.0, 29.0, 21.0, 28.0, 28.0, 16.0, 24.0, 6.0, 10.0, 3.0, 5.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.96875, -39.59033203125, -38.2119140625, -36.83349609375, -35.455078125, -34.07666015625, -32.6982421875, -31.31982421875, -29.94140625, -28.56298828125, -27.1845703125, -25.80615234375, -24.427734375, -23.04931640625, -21.6708984375, -20.29248046875, -18.9140625, -17.53564453125, -16.1572265625, -14.77880859375, -13.400390625, -12.02197265625, -10.6435546875, -9.26513671875, -7.88671875, -6.50830078125, -5.1298828125, -3.75146484375, -2.373046875, -0.99462890625, 0.3837890625, 1.76220703125, 3.140625, 4.51904296875, 5.8974609375, 7.27587890625, 8.654296875, 10.03271484375, 11.4111328125, 12.78955078125, 14.16796875, 15.54638671875, 16.9248046875, 18.30322265625, 19.681640625, 21.06005859375, 22.4384765625, 23.81689453125, 25.1953125, 26.57373046875, 27.9521484375, 29.33056640625, 30.708984375, 32.08740234375, 33.4658203125, 34.84423828125, 36.22265625, 37.60107421875, 38.9794921875, 40.35791015625, 41.736328125, 43.11474609375, 44.4931640625, 45.87158203125, 47.25]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 9.0, 22.0, 138.0, 746.0, 67.0, 17.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-671.114990234375, -658.53173828125, -645.9484252929688, -633.3651123046875, -620.7818603515625, -608.1986083984375, -595.6152954101562, -583.031982421875, -570.44873046875, -557.865478515625, -545.2821655273438, -532.6988525390625, -520.1156005859375, -507.5323181152344, -494.94903564453125, -482.3657531738281, -469.782470703125, -457.1991882324219, -444.61590576171875, -432.0326232910156, -419.4493408203125, -406.8660583496094, -394.28277587890625, -381.6994934082031, -369.1162109375, -356.5329284667969, -343.94964599609375, -331.3663635253906, -318.7830810546875, -306.1997985839844, -293.61651611328125, -281.0332336425781, -268.449951171875, -255.86666870117188, -243.28338623046875, -230.70010375976562, -218.1168212890625, -205.53353881835938, -192.95025634765625, -180.36697387695312, -167.78367614746094, -155.2003936767578, -142.6171112060547, -130.03382873535156, -117.45054626464844, -104.86726379394531, -92.28398132324219, -79.70069885253906, -67.11741638183594, -54.53413391113281, -41.95085144042969, -29.367568969726562, -16.784286499023438, -4.2010040283203125, 8.382278442382812, 20.965560913085938, 33.54884338378906, 46.13212585449219, 58.71540832519531, 71.29869079589844, 83.88197326660156, 96.46525573730469, 109.04853820800781, 121.63182067871094, 134.21510314941406]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 12.0, 19.0, 20.0, 19.0, 22.0, 36.0, 45.0, 41.0, 48.0, 46.0, 56.0, 63.0, 39.0, 51.0, 64.0, 51.0, 54.0, 46.0, 47.0, 39.0, 32.0, 22.0, 28.0, 20.0, 20.0, 9.0, 10.0, 12.0, 5.0, 2.0, 3.0, 6.0, 4.0, 0.0, 4.0], "bins": [-152.04510498046875, -148.44219970703125, -144.8393096923828, -141.2364044189453, -137.63351440429688, -134.03060913085938, -130.42770385742188, -126.82481384277344, -123.22190856933594, -119.61901092529297, -116.01611328125, -112.4132080078125, -108.81031036376953, -105.20741271972656, -101.6045150756836, -98.00161743164062, -94.39871215820312, -90.79581451416016, -87.19291687011719, -83.59001159667969, -79.98711395263672, -76.38421630859375, -72.78131866455078, -69.17842102050781, -65.57552337646484, -61.972625732421875, -58.36972427368164, -54.76682662963867, -51.16392517089844, -47.56102752685547, -43.9581298828125, -40.355228424072266, -36.75232696533203, -33.14942932128906, -29.546527862548828, -25.94363021850586, -22.340728759765625, -18.737831115722656, -15.134931564331055, -11.532032012939453, -7.929132461547852, -4.32623291015625, -0.7233338356018066, 2.8795652389526367, 6.482464790344238, 10.085363388061523, 13.688262939453125, 17.291162490844727, 20.894062042236328, 24.49696159362793, 28.09986114501953, 31.7027587890625, 35.305660247802734, 38.9085578918457, 42.51145935058594, 46.114356994628906, 49.717254638671875, 53.320152282714844, 56.92305374145508, 60.52595138549805, 64.12885284423828, 67.73175048828125, 71.33464813232422, 74.93754577636719, 78.54045104980469]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 5.0, 6.0, 6.0, 12.0, 15.0, 22.0, 29.0, 39.0, 55.0, 88.0, 87.0, 125.0, 181.0, 322.0, 512.0, 979.0, 1934.0, 5563.0, 51609.0, 4041125.0, 78853.0, 7920.0, 2417.0, 1055.0, 557.0, 305.0, 136.0, 105.0, 64.0, 45.0, 42.0, 9.0, 7.0, 17.0, 5.0, 3.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.403076171875, -0.3917388916015625, -0.380401611328125, -0.3690643310546875, -0.35772705078125, -0.3463897705078125, -0.335052490234375, -0.3237152099609375, -0.3123779296875, -0.3010406494140625, -0.289703369140625, -0.2783660888671875, -0.26702880859375, -0.2556915283203125, -0.244354248046875, -0.2330169677734375, -0.2216796875, -0.2103424072265625, -0.199005126953125, -0.1876678466796875, -0.17633056640625, -0.1649932861328125, -0.153656005859375, -0.1423187255859375, -0.1309814453125, -0.1196441650390625, -0.108306884765625, -0.0969696044921875, -0.08563232421875, -0.0742950439453125, -0.062957763671875, -0.0516204833984375, -0.040283203125, -0.0289459228515625, -0.017608642578125, -0.0062713623046875, 0.00506591796875, 0.0164031982421875, 0.027740478515625, 0.0390777587890625, 0.0504150390625, 0.0617523193359375, 0.073089599609375, 0.0844268798828125, 0.09576416015625, 0.1071014404296875, 0.118438720703125, 0.1297760009765625, 0.14111328125, 0.1524505615234375, 0.163787841796875, 0.1751251220703125, 0.18646240234375, 0.1977996826171875, 0.209136962890625, 0.2204742431640625, 0.2318115234375, 0.2431488037109375, 0.254486083984375, 0.2658233642578125, 0.27716064453125, 0.2884979248046875, 0.299835205078125, 0.3111724853515625, 0.322509765625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 1.0, 5.0, 5.0, 2.0, 7.0, 13.0, 9.0, 14.0, 12.0, 13.0, 148.0, 648.0, 18.0, 10.0, 20.0, 9.0, 12.0, 6.0, 7.0, 6.0, 3.0, 6.0, 0.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.283203125, -0.2753429412841797, -0.2674827575683594, -0.25962257385253906, -0.25176239013671875, -0.24390220642089844, -0.23604202270507812, -0.2281818389892578, -0.2203216552734375, -0.2124614715576172, -0.20460128784179688, -0.19674110412597656, -0.18888092041015625, -0.18102073669433594, -0.17316055297851562, -0.1653003692626953, -0.157440185546875, -0.1495800018310547, -0.14171981811523438, -0.13385963439941406, -0.12599945068359375, -0.11813926696777344, -0.11027908325195312, -0.10241889953613281, -0.0945587158203125, -0.08669853210449219, -0.07883834838867188, -0.07097816467285156, -0.06311798095703125, -0.05525779724121094, -0.047397613525390625, -0.03953742980957031, -0.03167724609375, -0.023817062377929688, -0.015956878662109375, -0.008096694946289062, -0.00023651123046875, 0.0076236724853515625, 0.015483856201171875, 0.023344039916992188, 0.0312042236328125, 0.03906440734863281, 0.046924591064453125, 0.05478477478027344, 0.06264495849609375, 0.07050514221191406, 0.07836532592773438, 0.08622550964355469, 0.094085693359375, 0.10194587707519531, 0.10980606079101562, 0.11766624450683594, 0.12552642822265625, 0.13338661193847656, 0.14124679565429688, 0.1491069793701172, 0.1569671630859375, 0.1648273468017578, 0.17268753051757812, 0.18054771423339844, 0.18840789794921875, 0.19626808166503906, 0.20412826538085938, 0.2119884490966797, 0.2198486328125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 9.0, 6.0, 13.0, 14.0, 18.0, 15.0, 43.0, 38.0, 63.0, 92.0, 126.0, 225.0, 371.0, 741.0, 1474.0, 3397.0, 10685.0, 58401.0, 3940914.0, 153768.0, 16145.0, 4424.0, 1736.0, 733.0, 335.0, 216.0, 89.0, 63.0, 33.0, 28.0, 18.0, 9.0, 13.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.461669921875, -0.447540283203125, -0.43341064453125, -0.419281005859375, -0.4051513671875, -0.391021728515625, -0.37689208984375, -0.362762451171875, -0.3486328125, -0.334503173828125, -0.32037353515625, -0.306243896484375, -0.2921142578125, -0.277984619140625, -0.26385498046875, -0.249725341796875, -0.235595703125, -0.221466064453125, -0.20733642578125, -0.193206787109375, -0.1790771484375, -0.164947509765625, -0.15081787109375, -0.136688232421875, -0.12255859375, -0.108428955078125, -0.09429931640625, -0.080169677734375, -0.0660400390625, -0.051910400390625, -0.03778076171875, -0.023651123046875, -0.009521484375, 0.004608154296875, 0.01873779296875, 0.032867431640625, 0.0469970703125, 0.061126708984375, 0.07525634765625, 0.089385986328125, 0.103515625, 0.117645263671875, 0.13177490234375, 0.145904541015625, 0.1600341796875, 0.174163818359375, 0.18829345703125, 0.202423095703125, 0.216552734375, 0.230682373046875, 0.24481201171875, 0.258941650390625, 0.2730712890625, 0.287200927734375, 0.30133056640625, 0.315460205078125, 0.32958984375, 0.343719482421875, 0.35784912109375, 0.371978759765625, 0.3861083984375, 0.400238037109375, 0.41436767578125, 0.428497314453125, 0.442626953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 6.0, 8.0, 12.0, 13.0, 22.0, 22.0, 35.0, 51.0, 119.0, 428.0, 2087.0, 891.0, 201.0, 54.0, 36.0, 23.0, 16.0, 13.0, 9.0, 5.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.323486328125, -0.31572723388671875, -0.3079681396484375, -0.30020904541015625, -0.292449951171875, -0.28469085693359375, -0.2769317626953125, -0.26917266845703125, -0.26141357421875, -0.25365447998046875, -0.2458953857421875, -0.23813629150390625, -0.230377197265625, -0.22261810302734375, -0.2148590087890625, -0.20709991455078125, -0.1993408203125, -0.19158172607421875, -0.1838226318359375, -0.17606353759765625, -0.168304443359375, -0.16054534912109375, -0.1527862548828125, -0.14502716064453125, -0.13726806640625, -0.12950897216796875, -0.1217498779296875, -0.11399078369140625, -0.106231689453125, -0.09847259521484375, -0.0907135009765625, -0.08295440673828125, -0.0751953125, -0.06743621826171875, -0.0596771240234375, -0.05191802978515625, -0.044158935546875, -0.03639984130859375, -0.0286407470703125, -0.02088165283203125, -0.01312255859375, -0.00536346435546875, 0.0023956298828125, 0.01015472412109375, 0.017913818359375, 0.02567291259765625, 0.0334320068359375, 0.04119110107421875, 0.0489501953125, 0.05670928955078125, 0.0644683837890625, 0.07222747802734375, 0.079986572265625, 0.08774566650390625, 0.0955047607421875, 0.10326385498046875, 0.11102294921875, 0.11878204345703125, 0.1265411376953125, 0.13430023193359375, 0.142059326171875, 0.14981842041015625, 0.1575775146484375, 0.16533660888671875, 0.173095703125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 10.0, 22.0, 80.0, 282.0, 448.0, 110.0, 21.0, 6.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3055990934371948, -1.2664577960968018, -1.2273164987564087, -1.1881752014160156, -1.1490339040756226, -1.1098926067352295, -1.0707513093948364, -1.0316100120544434, -0.9924687147140503, -0.9533274173736572, -0.9141861200332642, -0.8750448226928711, -0.835903525352478, -0.796762228012085, -0.7576209306716919, -0.7184796333312988, -0.6793383359909058, -0.6401970386505127, -0.6010557413101196, -0.5619144439697266, -0.5227731466293335, -0.48363184928894043, -0.44449055194854736, -0.4053492546081543, -0.36620795726776123, -0.32706665992736816, -0.2879253625869751, -0.24878406524658203, -0.20964276790618896, -0.1705014705657959, -0.13136017322540283, -0.09221887588500977, -0.05307745933532715, -0.013936161994934082, 0.025205135345458984, 0.06434643268585205, 0.10348773002624512, 0.14262902736663818, 0.18177032470703125, 0.22091162204742432, 0.2600529193878174, 0.29919421672821045, 0.3383355140686035, 0.3774768114089966, 0.41661810874938965, 0.4557594060897827, 0.4949007034301758, 0.5340420007705688, 0.5731832981109619, 0.612324595451355, 0.651465892791748, 0.6906071901321411, 0.7297484874725342, 0.7688897848129272, 0.8080310821533203, 0.8471723794937134, 0.8863136768341064, 0.9254549741744995, 0.9645962715148926, 1.0037375688552856, 1.0428788661956787, 1.0820201635360718, 1.1211614608764648, 1.160302758216858, 1.199444055557251]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 6.0, 11.0, 17.0, 25.0, 25.0, 29.0, 44.0, 48.0, 43.0, 51.0, 67.0, 69.0, 70.0, 66.0, 79.0, 72.0, 58.0, 37.0, 35.0, 27.0, 29.0, 26.0, 16.0, 10.0, 8.0, 7.0, 3.0, 3.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6217141151428223, -0.5980504751205444, -0.5743868350982666, -0.5507232546806335, -0.5270596146583557, -0.5033959746360779, -0.47973233461380005, -0.4560687243938446, -0.43240511417388916, -0.40874147415161133, -0.3850778639316559, -0.36141422390937805, -0.3377506136894226, -0.3140869736671448, -0.29042333364486694, -0.2667597234249115, -0.24309608340263367, -0.21943245828151703, -0.1957688331604004, -0.17210519313812256, -0.14844158291816711, -0.12477795034646988, -0.10111431777477264, -0.077450692653656, -0.05378706753253937, -0.03012344054877758, -0.006459813565015793, 0.017203815281391144, 0.04086744040250778, 0.06453106552362442, 0.08819469809532166, 0.1118583232164383, 0.13552194833755493, 0.15918557345867157, 0.1828491985797882, 0.20651283860206604, 0.23017644882202148, 0.2538400888442993, 0.27750372886657715, 0.3011673390865326, 0.32483094930648804, 0.34849458932876587, 0.3721581995487213, 0.39582183957099915, 0.4194854497909546, 0.4431490898132324, 0.46681272983551025, 0.4904763400554657, 0.5141400098800659, 0.5378036499023438, 0.5614672899246216, 0.5851308703422546, 0.6087945103645325, 0.6324581503868103, 0.6561217904090881, 0.6797853708267212, 0.703449010848999, 0.7271126508712769, 0.7507762908935547, 0.7744398713111877, 0.7981035113334656, 0.8217671513557434, 0.8454307913780212, 0.8690943717956543, 0.8927580118179321]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 9.0, 9.0, 15.0, 13.0, 23.0, 33.0, 34.0, 59.0, 85.0, 107.0, 168.0, 219.0, 318.0, 516.0, 719.0, 1047.0, 1613.0, 2559.0, 4126.0, 7082.0, 14318.0, 33588.0, 885583.0, 53723.0, 19386.0, 9263.0, 5119.0, 3016.0, 1934.0, 1214.0, 815.0, 534.0, 381.0, 274.0, 182.0, 131.0, 95.0, 68.0, 55.0, 33.0, 24.0, 13.0, 19.0, 7.0, 6.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.095703125, -1.058807373046875, -1.02191162109375, -0.985015869140625, -0.9481201171875, -0.911224365234375, -0.87432861328125, -0.837432861328125, -0.800537109375, -0.763641357421875, -0.72674560546875, -0.689849853515625, -0.6529541015625, -0.616058349609375, -0.57916259765625, -0.542266845703125, -0.50537109375, -0.468475341796875, -0.43157958984375, -0.394683837890625, -0.3577880859375, -0.320892333984375, -0.28399658203125, -0.247100830078125, -0.210205078125, -0.173309326171875, -0.13641357421875, -0.099517822265625, -0.0626220703125, -0.025726318359375, 0.01116943359375, 0.048065185546875, 0.0849609375, 0.121856689453125, 0.15875244140625, 0.195648193359375, 0.2325439453125, 0.269439697265625, 0.30633544921875, 0.343231201171875, 0.380126953125, 0.417022705078125, 0.45391845703125, 0.490814208984375, 0.5277099609375, 0.564605712890625, 0.60150146484375, 0.638397216796875, 0.67529296875, 0.712188720703125, 0.74908447265625, 0.785980224609375, 0.8228759765625, 0.859771728515625, 0.89666748046875, 0.933563232421875, 0.970458984375, 1.007354736328125, 1.04425048828125, 1.081146240234375, 1.1180419921875, 1.154937744140625, 1.19183349609375, 1.228729248046875, 1.265625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 3.0, 2.0, 4.0, 0.0, 5.0, 1.0, 6.0, 4.0, 3.0, 9.0, 11.0, 11.0, 14.0, 11.0, 18.0, 593.0, 201.0, 15.0, 14.0, 14.0, 11.0, 14.0, 4.0, 7.0, 3.0, 6.0, 4.0, 0.0, 6.0, 3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.277587890625, -0.26983642578125, -0.2620849609375, -0.25433349609375, -0.24658203125, -0.23883056640625, -0.2310791015625, -0.22332763671875, -0.215576171875, -0.20782470703125, -0.2000732421875, -0.19232177734375, -0.1845703125, -0.17681884765625, -0.1690673828125, -0.16131591796875, -0.153564453125, -0.14581298828125, -0.1380615234375, -0.13031005859375, -0.12255859375, -0.11480712890625, -0.1070556640625, -0.09930419921875, -0.091552734375, -0.08380126953125, -0.0760498046875, -0.06829833984375, -0.060546875, -0.05279541015625, -0.0450439453125, -0.03729248046875, -0.029541015625, -0.02178955078125, -0.0140380859375, -0.00628662109375, 0.00146484375, 0.00921630859375, 0.0169677734375, 0.02471923828125, 0.032470703125, 0.04022216796875, 0.0479736328125, 0.05572509765625, 0.0634765625, 0.07122802734375, 0.0789794921875, 0.08673095703125, 0.094482421875, 0.10223388671875, 0.1099853515625, 0.11773681640625, 0.12548828125, 0.13323974609375, 0.1409912109375, 0.14874267578125, 0.156494140625, 0.16424560546875, 0.1719970703125, 0.17974853515625, 0.1875, 0.19525146484375, 0.2030029296875, 0.21075439453125, 0.218505859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 7.0, 7.0, 7.0, 5.0, 6.0, 10.0, 18.0, 21.0, 32.0, 24.0, 39.0, 60.0, 59.0, 97.0, 125.0, 152.0, 226.0, 350.0, 501.0, 906.0, 1562.0, 3143.0, 6368.0, 14731.0, 38512.0, 128966.0, 482791.0, 261562.0, 66057.0, 22770.0, 9490.0, 4484.0, 2116.0, 1172.0, 702.0, 440.0, 264.0, 181.0, 150.0, 98.0, 72.0, 70.0, 29.0, 31.0, 41.0, 22.0, 20.0, 18.0, 17.0, 9.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.50439453125, -0.48743438720703125, -0.4704742431640625, -0.45351409912109375, -0.436553955078125, -0.41959381103515625, -0.4026336669921875, -0.38567352294921875, -0.36871337890625, -0.35175323486328125, -0.3347930908203125, -0.31783294677734375, -0.300872802734375, -0.28391265869140625, -0.2669525146484375, -0.24999237060546875, -0.2330322265625, -0.21607208251953125, -0.1991119384765625, -0.18215179443359375, -0.165191650390625, -0.14823150634765625, -0.1312713623046875, -0.11431121826171875, -0.09735107421875, -0.08039093017578125, -0.0634307861328125, -0.04647064208984375, -0.029510498046875, -0.01255035400390625, 0.0044097900390625, 0.02136993408203125, 0.038330078125, 0.05529022216796875, 0.0722503662109375, 0.08921051025390625, 0.106170654296875, 0.12313079833984375, 0.1400909423828125, 0.15705108642578125, 0.17401123046875, 0.19097137451171875, 0.2079315185546875, 0.22489166259765625, 0.241851806640625, 0.25881195068359375, 0.2757720947265625, 0.29273223876953125, 0.3096923828125, 0.32665252685546875, 0.3436126708984375, 0.36057281494140625, 0.377532958984375, 0.39449310302734375, 0.4114532470703125, 0.42841339111328125, 0.44537353515625, 0.46233367919921875, 0.4792938232421875, 0.49625396728515625, 0.513214111328125, 0.5301742553710938, 0.5471343994140625, 0.5640945434570312, 0.5810546875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 8.0, 3.0, 4.0, 10.0, 11.0, 10.0, 16.0, 16.0, 15.0, 25.0, 21.0, 29.0, 29.0, 30.0, 34.0, 42.0, 38.0, 31.0, 40.0, 32.0, 27.0, 32.0, 34.0, 37.0, 44.0, 38.0, 31.0, 28.0, 34.0, 30.0, 30.0, 24.0, 28.0, 16.0, 24.0, 21.0, 7.0, 13.0, 9.0, 8.0, 5.0, 9.0, 9.0, 4.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.69775390625, -0.6742095947265625, -0.650665283203125, -0.6271209716796875, -0.60357666015625, -0.5800323486328125, -0.556488037109375, -0.5329437255859375, -0.5093994140625, -0.4858551025390625, -0.462310791015625, -0.4387664794921875, -0.41522216796875, -0.3916778564453125, -0.368133544921875, -0.3445892333984375, -0.321044921875, -0.2975006103515625, -0.273956298828125, -0.2504119873046875, -0.22686767578125, -0.2033233642578125, -0.179779052734375, -0.1562347412109375, -0.1326904296875, -0.1091461181640625, -0.085601806640625, -0.0620574951171875, -0.03851318359375, -0.0149688720703125, 0.008575439453125, 0.0321197509765625, 0.0556640625, 0.0792083740234375, 0.102752685546875, 0.1262969970703125, 0.14984130859375, 0.1733856201171875, 0.196929931640625, 0.2204742431640625, 0.2440185546875, 0.2675628662109375, 0.291107177734375, 0.3146514892578125, 0.33819580078125, 0.3617401123046875, 0.385284423828125, 0.4088287353515625, 0.432373046875, 0.4559173583984375, 0.479461669921875, 0.5030059814453125, 0.52655029296875, 0.5500946044921875, 0.573638916015625, 0.5971832275390625, 0.6207275390625, 0.6442718505859375, 0.667816162109375, 0.6913604736328125, 0.71490478515625, 0.7384490966796875, 0.761993408203125, 0.7855377197265625, 0.80908203125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 9.0, 11.0, 23.0, 40.0, 63.0, 147.0, 505.0, 4221.0, 1027217.0, 15149.0, 801.0, 222.0, 65.0, 32.0, 15.0, 15.0, 7.0, 5.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.25, -2.1972503662109375, -2.144500732421875, -2.0917510986328125, -2.03900146484375, -1.9862518310546875, -1.933502197265625, -1.8807525634765625, -1.8280029296875, -1.7752532958984375, -1.722503662109375, -1.6697540283203125, -1.61700439453125, -1.5642547607421875, -1.511505126953125, -1.4587554931640625, -1.406005859375, -1.3532562255859375, -1.300506591796875, -1.2477569580078125, -1.19500732421875, -1.1422576904296875, -1.089508056640625, -1.0367584228515625, -0.9840087890625, -0.9312591552734375, -0.878509521484375, -0.8257598876953125, -0.77301025390625, -0.7202606201171875, -0.667510986328125, -0.6147613525390625, -0.56201171875, -0.5092620849609375, -0.456512451171875, -0.4037628173828125, -0.35101318359375, -0.2982635498046875, -0.245513916015625, -0.1927642822265625, -0.1400146484375, -0.0872650146484375, -0.034515380859375, 0.0182342529296875, 0.07098388671875, 0.1237335205078125, 0.176483154296875, 0.2292327880859375, 0.281982421875, 0.3347320556640625, 0.387481689453125, 0.4402313232421875, 0.49298095703125, 0.5457305908203125, 0.598480224609375, 0.6512298583984375, 0.7039794921875, 0.7567291259765625, 0.809478759765625, 0.8622283935546875, 0.91497802734375, 0.9677276611328125, 1.020477294921875, 1.0732269287109375, 1.1259765625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 7.0, 5.0, 6.0, 14.0, 28.0, 43.0, 73.0, 83.0, 103.0, 112.0, 103.0, 113.0, 93.0, 50.0, 49.0, 32.0, 23.0, 13.0, 11.0, 13.0, 7.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.568960189819336e-05, -2.5013461709022522e-05, -2.4337321519851685e-05, -2.3661181330680847e-05, -2.298504114151001e-05, -2.2308900952339172e-05, -2.1632760763168335e-05, -2.0956620573997498e-05, -2.028048038482666e-05, -1.9604340195655823e-05, -1.8928200006484985e-05, -1.8252059817314148e-05, -1.757591962814331e-05, -1.6899779438972473e-05, -1.6223639249801636e-05, -1.55474990606308e-05, -1.4871358871459961e-05, -1.4195218682289124e-05, -1.3519078493118286e-05, -1.2842938303947449e-05, -1.2166798114776611e-05, -1.1490657925605774e-05, -1.0814517736434937e-05, -1.0138377547264099e-05, -9.462237358093262e-06, -8.786097168922424e-06, -8.109956979751587e-06, -7.4338167905807495e-06, -6.757676601409912e-06, -6.081536412239075e-06, -5.405396223068237e-06, -4.7292560338974e-06, -4.0531158447265625e-06, -3.376975655555725e-06, -2.7008354663848877e-06, -2.0246952772140503e-06, -1.3485550880432129e-06, -6.724148988723755e-07, 3.725290298461914e-09, 6.798654794692993e-07, 1.3560056686401367e-06, 2.032145857810974e-06, 2.7082860469818115e-06, 3.384426236152649e-06, 4.060566425323486e-06, 4.736706614494324e-06, 5.412846803665161e-06, 6.0889869928359985e-06, 6.765127182006836e-06, 7.441267371177673e-06, 8.11740756034851e-06, 8.793547749519348e-06, 9.469687938690186e-06, 1.0145828127861023e-05, 1.082196831703186e-05, 1.1498108506202698e-05, 1.2174248695373535e-05, 1.2850388884544373e-05, 1.352652907371521e-05, 1.4202669262886047e-05, 1.4878809452056885e-05, 1.5554949641227722e-05, 1.623108983039856e-05, 1.6907230019569397e-05, 1.7583370208740234e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 9.0, 14.0, 24.0, 23.0, 54.0, 78.0, 160.0, 534.0, 2064.0, 28692.0, 997232.0, 17349.0, 1604.0, 393.0, 151.0, 70.0, 43.0, 29.0, 13.0, 11.0, 6.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1904296875, -1.1609878540039062, -1.1315460205078125, -1.1021041870117188, -1.072662353515625, -1.0432205200195312, -1.0137786865234375, -0.9843368530273438, -0.95489501953125, -0.9254531860351562, -0.8960113525390625, -0.8665695190429688, -0.837127685546875, -0.8076858520507812, -0.7782440185546875, -0.7488021850585938, -0.7193603515625, -0.6899185180664062, -0.6604766845703125, -0.6310348510742188, -0.601593017578125, -0.5721511840820312, -0.5427093505859375, -0.5132675170898438, -0.48382568359375, -0.45438385009765625, -0.4249420166015625, -0.39550018310546875, -0.366058349609375, -0.33661651611328125, -0.3071746826171875, -0.27773284912109375, -0.248291015625, -0.21884918212890625, -0.1894073486328125, -0.15996551513671875, -0.130523681640625, -0.10108184814453125, -0.0716400146484375, -0.04219818115234375, -0.01275634765625, 0.01668548583984375, 0.0461273193359375, 0.07556915283203125, 0.105010986328125, 0.13445281982421875, 0.1638946533203125, 0.19333648681640625, 0.2227783203125, 0.25222015380859375, 0.2816619873046875, 0.31110382080078125, 0.340545654296875, 0.36998748779296875, 0.3994293212890625, 0.42887115478515625, 0.45831298828125, 0.48775482177734375, 0.5171966552734375, 0.5466384887695312, 0.576080322265625, 0.6055221557617188, 0.6349639892578125, 0.6644058227539062, 0.69384765625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 6.0, 5.0, 16.0, 33.0, 42.0, 92.0, 182.0, 268.0, 170.0, 83.0, 55.0, 21.0, 15.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.060546875, -1.0336685180664062, -1.0067901611328125, -0.9799118041992188, -0.953033447265625, -0.9261550903320312, -0.8992767333984375, -0.8723983764648438, -0.84552001953125, -0.8186416625976562, -0.7917633056640625, -0.7648849487304688, -0.738006591796875, -0.7111282348632812, -0.6842498779296875, -0.6573715209960938, -0.6304931640625, -0.6036148071289062, -0.5767364501953125, -0.5498580932617188, -0.522979736328125, -0.49610137939453125, -0.4692230224609375, -0.44234466552734375, -0.41546630859375, -0.38858795166015625, -0.3617095947265625, -0.33483123779296875, -0.307952880859375, -0.28107452392578125, -0.2541961669921875, -0.22731781005859375, -0.200439453125, -0.17356109619140625, -0.1466827392578125, -0.11980438232421875, -0.092926025390625, -0.06604766845703125, -0.0391693115234375, -0.01229095458984375, 0.01458740234375, 0.04146575927734375, 0.0683441162109375, 0.09522247314453125, 0.122100830078125, 0.14897918701171875, 0.1758575439453125, 0.20273590087890625, 0.2296142578125, 0.25649261474609375, 0.2833709716796875, 0.31024932861328125, 0.337127685546875, 0.36400604248046875, 0.3908843994140625, 0.41776275634765625, 0.44464111328125, 0.47151947021484375, 0.4983978271484375, 0.5252761840820312, 0.552154541015625, 0.5790328979492188, 0.6059112548828125, 0.6327896118164062, 0.65966796875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 9.0, 46.0, 366.0, 501.0, 55.0, 17.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.407510757446289, -13.690621376037598, -12.973732948303223, -12.256843566894531, -11.539955139160156, -10.823065757751465, -10.106176376342773, -9.389287948608398, -8.672398567199707, -7.955509662628174, -7.238620758056641, -6.521731376647949, -5.804842472076416, -5.087953567504883, -4.371064186096191, -3.654175281524658, -2.937286376953125, -2.220397472381592, -1.5035083293914795, -0.7866191864013672, -0.06973028182983398, 0.6471586227416992, 1.3640480041503906, 2.080936908721924, 2.797825813293457, 3.5147147178649902, 4.231603622436523, 4.948493003845215, 5.665381908416748, 6.382270812988281, 7.099160194396973, 7.816049098968506, 8.532936096191406, 9.249825477600098, 9.966713905334473, 10.683603286743164, 11.400491714477539, 12.11738109588623, 12.834270477294922, 13.551158905029297, 14.268048286437988, 14.98493766784668, 15.701826095581055, 16.418716430664062, 17.135604858398438, 17.852493286132812, 18.569381713867188, 19.286272048950195, 20.00316047668457, 20.720048904418945, 21.436939239501953, 22.153827667236328, 22.870716094970703, 23.587604522705078, 24.304494857788086, 25.02138328552246, 25.73827362060547, 26.455162048339844, 27.17205238342285, 27.888940811157227, 28.6058292388916, 29.32271957397461, 30.039608001708984, 30.75649642944336, 31.473384857177734]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 8.0, 7.0, 8.0, 7.0, 19.0, 14.0, 36.0, 42.0, 73.0, 133.0, 137.0, 164.0, 124.0, 82.0, 51.0, 25.0, 15.0, 11.0, 10.0, 6.0, 6.0, 7.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.19681739807129, -16.58119773864746, -15.96557903289795, -15.349960327148438, -14.73434066772461, -14.118721961975098, -13.503103256225586, -12.887483596801758, -12.27186393737793, -11.656245231628418, -11.04062557220459, -10.425006866455078, -9.80938720703125, -9.193768501281738, -8.578149795532227, -7.962530136108398, -7.346911430358887, -6.731292247772217, -6.115673065185547, -5.500054359436035, -4.884434700012207, -4.268815994262695, -3.6531968116760254, -3.0375776290893555, -2.4219584465026855, -1.8063392639160156, -1.1907202005386353, -0.5751011371612549, 0.04051804542541504, 0.656137228012085, 1.2717561721801758, 1.8873753547668457, 2.5029945373535156, 3.1186137199401855, 3.7342329025268555, 4.349851608276367, 4.965471267700195, 5.581089973449707, 6.196709156036377, 6.812328338623047, 7.427947521209717, 8.043566703796387, 8.659185409545898, 9.274805068969727, 9.890423774719238, 10.506043434143066, 11.121662139892578, 11.737281799316406, 12.352900505065918, 12.96851921081543, 13.584138870239258, 14.19975757598877, 14.815377235412598, 15.43099594116211, 16.046615600585938, 16.662235260009766, 17.27785301208496, 17.89347267150879, 18.509090423583984, 19.124710083007812, 19.74032974243164, 20.35594940185547, 20.971567153930664, 21.587186813354492, 22.20280647277832]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 7.0, 3.0, 7.0, 12.0, 9.0, 14.0, 26.0, 20.0, 16.0, 39.0, 42.0, 56.0, 77.0, 105.0, 170.0, 248.0, 330.0, 523.0, 871.0, 1481.0, 2614.0, 5366.0, 12591.0, 42075.0, 3847089.0, 239244.0, 24718.0, 8500.0, 3727.0, 1874.0, 1039.0, 542.0, 325.0, 209.0, 132.0, 62.0, 46.0, 19.0, 22.0, 14.0, 11.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6796875, -1.635284423828125, -1.59088134765625, -1.546478271484375, -1.5020751953125, -1.457672119140625, -1.41326904296875, -1.368865966796875, -1.324462890625, -1.280059814453125, -1.23565673828125, -1.191253662109375, -1.1468505859375, -1.102447509765625, -1.05804443359375, -1.013641357421875, -0.96923828125, -0.924835205078125, -0.88043212890625, -0.836029052734375, -0.7916259765625, -0.747222900390625, -0.70281982421875, -0.658416748046875, -0.614013671875, -0.569610595703125, -0.52520751953125, -0.480804443359375, -0.4364013671875, -0.391998291015625, -0.34759521484375, -0.303192138671875, -0.2587890625, -0.214385986328125, -0.16998291015625, -0.125579833984375, -0.0811767578125, -0.036773681640625, 0.00762939453125, 0.052032470703125, 0.096435546875, 0.140838623046875, 0.18524169921875, 0.229644775390625, 0.2740478515625, 0.318450927734375, 0.36285400390625, 0.407257080078125, 0.45166015625, 0.496063232421875, 0.54046630859375, 0.584869384765625, 0.6292724609375, 0.673675537109375, 0.71807861328125, 0.762481689453125, 0.806884765625, 0.851287841796875, 0.89569091796875, 0.940093994140625, 0.9844970703125, 1.028900146484375, 1.07330322265625, 1.117706298828125, 1.162109375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 11.0, 5.0, 5.0, 14.0, 11.0, 9.0, 12.0, 47.0, 312.0, 400.0, 57.0, 23.0, 14.0, 7.0, 10.0, 7.0, 12.0, 4.0, 5.0, 2.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.2511253356933594, -0.24468231201171875, -0.23823928833007812, -0.2317962646484375, -0.22535324096679688, -0.21891021728515625, -0.21246719360351562, -0.206024169921875, -0.19958114624023438, -0.19313812255859375, -0.18669509887695312, -0.1802520751953125, -0.17380905151367188, -0.16736602783203125, -0.16092300415039062, -0.15447998046875, -0.14803695678710938, -0.14159393310546875, -0.13515090942382812, -0.1287078857421875, -0.12226486206054688, -0.11582183837890625, -0.10937881469726562, -0.102935791015625, -0.09649276733398438, -0.09004974365234375, -0.08360671997070312, -0.0771636962890625, -0.07072067260742188, -0.06427764892578125, -0.057834625244140625, -0.0513916015625, -0.044948577880859375, -0.03850555419921875, -0.032062530517578125, -0.0256195068359375, -0.019176483154296875, -0.01273345947265625, -0.006290435791015625, 0.000152587890625, 0.006595611572265625, 0.01303863525390625, 0.019481658935546875, 0.0259246826171875, 0.032367706298828125, 0.03881072998046875, 0.045253753662109375, 0.05169677734375, 0.058139801025390625, 0.06458282470703125, 0.07102584838867188, 0.0774688720703125, 0.08391189575195312, 0.09035491943359375, 0.09679794311523438, 0.103240966796875, 0.10968399047851562, 0.11612701416015625, 0.12257003784179688, 0.1290130615234375, 0.13545608520507812, 0.14189910888671875, 0.14834213256835938, 0.15478515625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 10.0, 4.0, 5.0, 16.0, 19.0, 29.0, 37.0, 50.0, 84.0, 134.0, 268.0, 519.0, 1272.0, 3357.0, 12609.0, 68390.0, 3533231.0, 523532.0, 38475.0, 7904.0, 2421.0, 922.0, 385.0, 195.0, 108.0, 87.0, 58.0, 41.0, 31.0, 18.0, 8.0, 17.0, 8.0, 6.0, 10.0, 5.0, 7.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.90673828125, -0.8753128051757812, -0.8438873291015625, -0.8124618530273438, -0.781036376953125, -0.7496109008789062, -0.7181854248046875, -0.6867599487304688, -0.65533447265625, -0.6239089965820312, -0.5924835205078125, -0.5610580444335938, -0.529632568359375, -0.49820709228515625, -0.4667816162109375, -0.43535614013671875, -0.4039306640625, -0.37250518798828125, -0.3410797119140625, -0.30965423583984375, -0.278228759765625, -0.24680328369140625, -0.2153778076171875, -0.18395233154296875, -0.15252685546875, -0.12110137939453125, -0.0896759033203125, -0.05825042724609375, -0.026824951171875, 0.00460052490234375, 0.0360260009765625, 0.06745147705078125, 0.098876953125, 0.13030242919921875, 0.1617279052734375, 0.19315338134765625, 0.224578857421875, 0.25600433349609375, 0.2874298095703125, 0.31885528564453125, 0.35028076171875, 0.38170623779296875, 0.4131317138671875, 0.44455718994140625, 0.475982666015625, 0.5074081420898438, 0.5388336181640625, 0.5702590942382812, 0.6016845703125, 0.6331100463867188, 0.6645355224609375, 0.6959609985351562, 0.727386474609375, 0.7588119506835938, 0.7902374267578125, 0.8216629028320312, 0.85308837890625, 0.8845138549804688, 0.9159393310546875, 0.9473648071289062, 0.978790283203125, 1.0102157592773438, 1.0416412353515625, 1.0730667114257812, 1.1044921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 5.0, 18.0, 17.0, 20.0, 25.0, 24.0, 29.0, 41.0, 55.0, 84.0, 147.0, 283.0, 744.0, 1638.0, 386.0, 136.0, 101.0, 68.0, 48.0, 50.0, 29.0, 21.0, 20.0, 19.0, 9.0, 7.0, 4.0, 4.0, 4.0, 10.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1690673828125, -0.16382598876953125, -0.1585845947265625, -0.15334320068359375, -0.148101806640625, -0.14286041259765625, -0.1376190185546875, -0.13237762451171875, -0.12713623046875, -0.12189483642578125, -0.1166534423828125, -0.11141204833984375, -0.106170654296875, -0.10092926025390625, -0.0956878662109375, -0.09044647216796875, -0.085205078125, -0.07996368408203125, -0.0747222900390625, -0.06948089599609375, -0.064239501953125, -0.05899810791015625, -0.0537567138671875, -0.04851531982421875, -0.04327392578125, -0.03803253173828125, -0.0327911376953125, -0.02754974365234375, -0.022308349609375, -0.01706695556640625, -0.0118255615234375, -0.00658416748046875, -0.0013427734375, 0.00389862060546875, 0.0091400146484375, 0.01438140869140625, 0.019622802734375, 0.02486419677734375, 0.0301055908203125, 0.03534698486328125, 0.04058837890625, 0.04582977294921875, 0.0510711669921875, 0.05631256103515625, 0.061553955078125, 0.06679534912109375, 0.0720367431640625, 0.07727813720703125, 0.08251953125, 0.08776092529296875, 0.0930023193359375, 0.09824371337890625, 0.103485107421875, 0.10872650146484375, 0.1139678955078125, 0.11920928955078125, 0.12445068359375, 0.12969207763671875, 0.1349334716796875, 0.14017486572265625, 0.145416259765625, 0.15065765380859375, 0.1558990478515625, 0.16114044189453125, 0.1663818359375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 31.0, 449.0, 494.0, 9.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.35866928100586, -11.14477825164795, -10.930887222290039, -10.716995239257812, -10.503104209899902, -10.289213180541992, -10.075322151184082, -9.861431121826172, -9.647539138793945, -9.433648109436035, -9.219757080078125, -9.005865097045898, -8.791974067687988, -8.578083038330078, -8.364192008972168, -8.150300979614258, -7.936409950256348, -7.7225189208984375, -7.508627414703369, -7.294736385345459, -7.080844879150391, -6.8669538497924805, -6.65306282043457, -6.43917179107666, -6.225280284881592, -6.011389255523682, -5.797497749328613, -5.583606719970703, -5.369715690612793, -5.155824184417725, -4.9419331550598145, -4.728041648864746, -4.514151096343994, -4.300260066986084, -4.086368560791016, -3.8724775314331055, -3.658586263656616, -3.444694995880127, -3.230803966522217, -3.0169126987457275, -2.8030214309692383, -2.589130163192749, -2.3752388954162598, -2.1613478660583496, -1.9474565982818604, -1.733565330505371, -1.5196741819381714, -1.3057830333709717, -1.0918917655944824, -0.8780005574226379, -0.6641093492507935, -0.450218141078949, -0.2363269329071045, -0.022435665130615234, 0.19145548343658447, 0.4053466320037842, 0.6192378997802734, 0.8331291079521179, 1.0470203161239624, 1.260911464691162, 1.4748027324676514, 1.6886940002441406, 1.9025851488113403, 2.11647629737854, 2.3303675651550293]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 2.0, 8.0, 3.0, 10.0, 15.0, 14.0, 21.0, 35.0, 38.0, 52.0, 42.0, 57.0, 73.0, 68.0, 79.0, 78.0, 71.0, 66.0, 65.0, 52.0, 37.0, 29.0, 17.0, 15.0, 13.0, 9.0, 16.0, 4.0, 3.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0885677337646484, -1.0422866344451904, -0.9960055947303772, -0.949724555015564, -0.9034435153007507, -0.8571624755859375, -0.8108813762664795, -0.7646003365516663, -0.718319296836853, -0.6720382571220398, -0.6257571578025818, -0.5794761180877686, -0.5331950783729553, -0.4869140088558197, -0.4406329393386841, -0.39435189962387085, -0.34807080030441284, -0.3017897307872772, -0.255508691072464, -0.20922762155532837, -0.16294656693935394, -0.11666551232337952, -0.0703844428062439, -0.024103403091430664, 0.022177666425704956, 0.06845872104167938, 0.1147397831082344, 0.16102084517478943, 0.20730189979076385, 0.2535829544067383, 0.2998640239238739, 0.34614506363868713, 0.39242613315582275, 0.4387072026729584, 0.4849882423877716, 0.5312693119049072, 0.5775503516197205, 0.6238313913345337, 0.6701124906539917, 0.7163935303688049, 0.7626745700836182, 0.8089556097984314, 0.8552367091178894, 0.9015177488327026, 0.9477987885475159, 0.9940798282623291, 1.040360927581787, 1.0866420269012451, 1.1329231262207031, 1.1792042255401611, 1.2254852056503296, 1.2717663049697876, 1.3180474042892456, 1.364328384399414, 1.410609483718872, 1.45689058303833, 1.5031715631484985, 1.5494526624679565, 1.595733642578125, 1.642014741897583, 1.688295841217041, 1.7345768213272095, 1.7808579206466675, 1.827138900756836, 1.873420000076294]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 2.0, 10.0, 19.0, 25.0, 35.0, 39.0, 61.0, 117.0, 155.0, 283.0, 523.0, 998.0, 2081.0, 4807.0, 12302.0, 46058.0, 883319.0, 71708.0, 15169.0, 5678.0, 2556.0, 1137.0, 570.0, 306.0, 198.0, 128.0, 76.0, 76.0, 28.0, 30.0, 15.0, 14.0, 4.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7265625, -1.6735992431640625, -1.620635986328125, -1.5676727294921875, -1.51470947265625, -1.4617462158203125, -1.408782958984375, -1.3558197021484375, -1.3028564453125, -1.2498931884765625, -1.196929931640625, -1.1439666748046875, -1.09100341796875, -1.0380401611328125, -0.985076904296875, -0.9321136474609375, -0.879150390625, -0.8261871337890625, -0.773223876953125, -0.7202606201171875, -0.66729736328125, -0.6143341064453125, -0.561370849609375, -0.5084075927734375, -0.4554443359375, -0.4024810791015625, -0.349517822265625, -0.2965545654296875, -0.24359130859375, -0.1906280517578125, -0.137664794921875, -0.0847015380859375, -0.03173828125, 0.0212249755859375, 0.074188232421875, 0.1271514892578125, 0.18011474609375, 0.2330780029296875, 0.286041259765625, 0.3390045166015625, 0.3919677734375, 0.4449310302734375, 0.497894287109375, 0.5508575439453125, 0.60382080078125, 0.6567840576171875, 0.709747314453125, 0.7627105712890625, 0.815673828125, 0.8686370849609375, 0.921600341796875, 0.9745635986328125, 1.02752685546875, 1.0804901123046875, 1.133453369140625, 1.1864166259765625, 1.2393798828125, 1.2923431396484375, 1.345306396484375, 1.3982696533203125, 1.45123291015625, 1.5041961669921875, 1.557159423828125, 1.6101226806640625, 1.6630859375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 5.0, 5.0, 4.0, 7.0, 7.0, 12.0, 14.0, 7.0, 24.0, 52.0, 176.0, 321.0, 198.0, 72.0, 17.0, 19.0, 13.0, 7.0, 5.0, 8.0, 6.0, 6.0, 3.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263671875, -0.2573070526123047, -0.2509422302246094, -0.24457740783691406, -0.23821258544921875, -0.23184776306152344, -0.22548294067382812, -0.2191181182861328, -0.2127532958984375, -0.2063884735107422, -0.20002365112304688, -0.19365882873535156, -0.18729400634765625, -0.18092918395996094, -0.17456436157226562, -0.1681995391845703, -0.161834716796875, -0.1554698944091797, -0.14910507202148438, -0.14274024963378906, -0.13637542724609375, -0.13001060485839844, -0.12364578247070312, -0.11728096008300781, -0.1109161376953125, -0.10455131530761719, -0.09818649291992188, -0.09182167053222656, -0.08545684814453125, -0.07909202575683594, -0.07272720336914062, -0.06636238098144531, -0.05999755859375, -0.05363273620605469, -0.047267913818359375, -0.04090309143066406, -0.03453826904296875, -0.028173446655273438, -0.021808624267578125, -0.015443801879882812, -0.0090789794921875, -0.0027141571044921875, 0.003650665283203125, 0.010015487670898438, 0.01638031005859375, 0.022745132446289062, 0.029109954833984375, 0.03547477722167969, 0.041839599609375, 0.04820442199707031, 0.054569244384765625, 0.06093406677246094, 0.06729888916015625, 0.07366371154785156, 0.08002853393554688, 0.08639335632324219, 0.0927581787109375, 0.09912300109863281, 0.10548782348632812, 0.11185264587402344, 0.11821746826171875, 0.12458229064941406, 0.13094711303710938, 0.1373119354248047, 0.1436767578125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 5.0, 6.0, 8.0, 6.0, 11.0, 16.0, 18.0, 14.0, 20.0, 23.0, 25.0, 45.0, 45.0, 68.0, 108.0, 155.0, 249.0, 503.0, 946.0, 2466.0, 8383.0, 35829.0, 233846.0, 632126.0, 106437.0, 19132.0, 4765.0, 1573.0, 701.0, 370.0, 177.0, 143.0, 76.0, 56.0, 37.0, 43.0, 24.0, 22.0, 13.0, 14.0, 13.0, 6.0, 7.0, 3.0, 5.0, 4.0, 4.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.783203125, -0.7581939697265625, -0.733184814453125, -0.7081756591796875, -0.68316650390625, -0.6581573486328125, -0.633148193359375, -0.6081390380859375, -0.5831298828125, -0.5581207275390625, -0.533111572265625, -0.5081024169921875, -0.48309326171875, -0.4580841064453125, -0.433074951171875, -0.4080657958984375, -0.383056640625, -0.3580474853515625, -0.333038330078125, -0.3080291748046875, -0.28302001953125, -0.2580108642578125, -0.233001708984375, -0.2079925537109375, -0.1829833984375, -0.1579742431640625, -0.132965087890625, -0.1079559326171875, -0.08294677734375, -0.0579376220703125, -0.032928466796875, -0.0079193115234375, 0.01708984375, 0.0420989990234375, 0.067108154296875, 0.0921173095703125, 0.11712646484375, 0.1421356201171875, 0.167144775390625, 0.1921539306640625, 0.2171630859375, 0.2421722412109375, 0.267181396484375, 0.2921905517578125, 0.31719970703125, 0.3422088623046875, 0.367218017578125, 0.3922271728515625, 0.417236328125, 0.4422454833984375, 0.467254638671875, 0.4922637939453125, 0.51727294921875, 0.5422821044921875, 0.567291259765625, 0.5923004150390625, 0.6173095703125, 0.6423187255859375, 0.667327880859375, 0.6923370361328125, 0.71734619140625, 0.7423553466796875, 0.767364501953125, 0.7923736572265625, 0.8173828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 4.0, 4.0, 7.0, 6.0, 10.0, 15.0, 11.0, 8.0, 18.0, 11.0, 23.0, 20.0, 20.0, 20.0, 32.0, 25.0, 33.0, 44.0, 32.0, 44.0, 55.0, 32.0, 29.0, 32.0, 43.0, 45.0, 37.0, 31.0, 29.0, 45.0, 28.0, 21.0, 22.0, 19.0, 24.0, 19.0, 19.0, 18.0, 15.0, 11.0, 9.0, 6.0, 4.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.420654296875, -0.4067726135253906, -0.39289093017578125, -0.3790092468261719, -0.3651275634765625, -0.3512458801269531, -0.33736419677734375, -0.3234825134277344, -0.309600830078125, -0.2957191467285156, -0.28183746337890625, -0.2679557800292969, -0.2540740966796875, -0.24019241333007812, -0.22631072998046875, -0.21242904663085938, -0.19854736328125, -0.18466567993164062, -0.17078399658203125, -0.15690231323242188, -0.1430206298828125, -0.12913894653320312, -0.11525726318359375, -0.10137557983398438, -0.087493896484375, -0.07361221313476562, -0.05973052978515625, -0.045848846435546875, -0.0319671630859375, -0.018085479736328125, -0.00420379638671875, 0.009677886962890625, 0.0235595703125, 0.037441253662109375, 0.05132293701171875, 0.06520462036132812, 0.0790863037109375, 0.09296798706054688, 0.10684967041015625, 0.12073135375976562, 0.134613037109375, 0.14849472045898438, 0.16237640380859375, 0.17625808715820312, 0.1901397705078125, 0.20402145385742188, 0.21790313720703125, 0.23178482055664062, 0.24566650390625, 0.2595481872558594, 0.27342987060546875, 0.2873115539550781, 0.3011932373046875, 0.3150749206542969, 0.32895660400390625, 0.3428382873535156, 0.356719970703125, 0.3706016540527344, 0.38448333740234375, 0.3983650207519531, 0.4122467041015625, 0.4261283874511719, 0.44001007080078125, 0.4538917541503906, 0.4677734375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 11.0, 21.0, 40.0, 78.0, 191.0, 484.0, 2750.0, 876621.0, 165636.0, 2021.0, 377.0, 143.0, 69.0, 43.0, 18.0, 9.0, 13.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.921875, -2.8553619384765625, -2.788848876953125, -2.7223358154296875, -2.65582275390625, -2.5893096923828125, -2.522796630859375, -2.4562835693359375, -2.3897705078125, -2.3232574462890625, -2.256744384765625, -2.1902313232421875, -2.12371826171875, -2.0572052001953125, -1.990692138671875, -1.9241790771484375, -1.857666015625, -1.7911529541015625, -1.724639892578125, -1.6581268310546875, -1.59161376953125, -1.5251007080078125, -1.458587646484375, -1.3920745849609375, -1.3255615234375, -1.2590484619140625, -1.192535400390625, -1.1260223388671875, -1.05950927734375, -0.9929962158203125, -0.926483154296875, -0.8599700927734375, -0.79345703125, -0.7269439697265625, -0.660430908203125, -0.5939178466796875, -0.52740478515625, -0.4608917236328125, -0.394378662109375, -0.3278656005859375, -0.2613525390625, -0.1948394775390625, -0.128326416015625, -0.0618133544921875, 0.00469970703125, 0.0712127685546875, 0.137725830078125, 0.2042388916015625, 0.270751953125, 0.3372650146484375, 0.403778076171875, 0.4702911376953125, 0.53680419921875, 0.6033172607421875, 0.669830322265625, 0.7363433837890625, 0.8028564453125, 0.8693695068359375, 0.935882568359375, 1.0023956298828125, 1.06890869140625, 1.1354217529296875, 1.201934814453125, 1.2684478759765625, 1.3349609375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 3.0, 11.0, 8.0, 19.0, 44.0, 179.0, 347.0, 241.0, 70.0, 21.0, 14.0, 8.0, 8.0, 1.0, 3.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00010085105895996094, -9.755697101354599e-05, -9.426288306713104e-05, -9.09687951207161e-05, -8.767470717430115e-05, -8.43806192278862e-05, -8.108653128147125e-05, -7.77924433350563e-05, -7.449835538864136e-05, -7.120426744222641e-05, -6.791017949581146e-05, -6.461609154939651e-05, -6.132200360298157e-05, -5.802791565656662e-05, -5.473382771015167e-05, -5.1439739763736725e-05, -4.814565181732178e-05, -4.485156387090683e-05, -4.155747592449188e-05, -3.8263387978076935e-05, -3.496930003166199e-05, -3.167521208524704e-05, -2.8381124138832092e-05, -2.5087036192417145e-05, -2.1792948246002197e-05, -1.849886029958725e-05, -1.5204772353172302e-05, -1.1910684406757355e-05, -8.616596460342407e-06, -5.32250851392746e-06, -2.028420567512512e-06, 1.2656673789024353e-06, 4.559755325317383e-06, 7.85384327173233e-06, 1.1147931218147278e-05, 1.4442019164562225e-05, 1.7736107110977173e-05, 2.103019505739212e-05, 2.4324283003807068e-05, 2.7618370950222015e-05, 3.091245889663696e-05, 3.420654684305191e-05, 3.750063478946686e-05, 4.0794722735881805e-05, 4.408881068229675e-05, 4.73828986287117e-05, 5.067698657512665e-05, 5.3971074521541595e-05, 5.726516246795654e-05, 6.055925041437149e-05, 6.385333836078644e-05, 6.714742630720139e-05, 7.044151425361633e-05, 7.373560220003128e-05, 7.702969014644623e-05, 8.032377809286118e-05, 8.361786603927612e-05, 8.691195398569107e-05, 9.020604193210602e-05, 9.350012987852097e-05, 9.679421782493591e-05, 0.00010008830577135086, 0.00010338239371776581, 0.00010667648166418076, 0.0001099705696105957]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 20.0, 38.0, 69.0, 156.0, 340.0, 1309.0, 36790.0, 1005385.0, 3802.0, 419.0, 122.0, 48.0, 16.0, 16.0, 10.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.0859375, -3.0206298828125, -2.955322265625, -2.8900146484375, -2.82470703125, -2.7593994140625, -2.694091796875, -2.6287841796875, -2.5634765625, -2.4981689453125, -2.432861328125, -2.3675537109375, -2.30224609375, -2.2369384765625, -2.171630859375, -2.1063232421875, -2.041015625, -1.9757080078125, -1.910400390625, -1.8450927734375, -1.77978515625, -1.7144775390625, -1.649169921875, -1.5838623046875, -1.5185546875, -1.4532470703125, -1.387939453125, -1.3226318359375, -1.25732421875, -1.1920166015625, -1.126708984375, -1.0614013671875, -0.99609375, -0.9307861328125, -0.865478515625, -0.8001708984375, -0.73486328125, -0.6695556640625, -0.604248046875, -0.5389404296875, -0.4736328125, -0.4083251953125, -0.343017578125, -0.2777099609375, -0.21240234375, -0.1470947265625, -0.081787109375, -0.0164794921875, 0.048828125, 0.1141357421875, 0.179443359375, 0.2447509765625, 0.31005859375, 0.3753662109375, 0.440673828125, 0.5059814453125, 0.5712890625, 0.6365966796875, 0.701904296875, 0.7672119140625, 0.83251953125, 0.8978271484375, 0.963134765625, 1.0284423828125, 1.09375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 23.0, 44.0, 95.0, 204.0, 281.0, 190.0, 85.0, 35.0, 19.0, 10.0, 5.0, 1.0, 1.0, 3.0, 1.0], "bins": [-1.4345703125, -1.40777587890625, -1.3809814453125, -1.35418701171875, -1.327392578125, -1.30059814453125, -1.2738037109375, -1.24700927734375, -1.22021484375, -1.19342041015625, -1.1666259765625, -1.13983154296875, -1.113037109375, -1.08624267578125, -1.0594482421875, -1.03265380859375, -1.005859375, -0.97906494140625, -0.9522705078125, -0.92547607421875, -0.898681640625, -0.87188720703125, -0.8450927734375, -0.81829833984375, -0.79150390625, -0.76470947265625, -0.7379150390625, -0.71112060546875, -0.684326171875, -0.65753173828125, -0.6307373046875, -0.60394287109375, -0.5771484375, -0.55035400390625, -0.5235595703125, -0.49676513671875, -0.469970703125, -0.44317626953125, -0.4163818359375, -0.38958740234375, -0.36279296875, -0.33599853515625, -0.3092041015625, -0.28240966796875, -0.255615234375, -0.22882080078125, -0.2020263671875, -0.17523193359375, -0.1484375, -0.12164306640625, -0.0948486328125, -0.06805419921875, -0.041259765625, -0.01446533203125, 0.0123291015625, 0.03912353515625, 0.06591796875, 0.09271240234375, 0.1195068359375, 0.14630126953125, 0.173095703125, 0.19989013671875, 0.2266845703125, 0.25347900390625, 0.2802734375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 8.0, 25.0, 47.0, 150.0, 401.0, 259.0, 75.0, 18.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.841560363769531, -11.599265098571777, -11.356968879699707, -11.114673614501953, -10.872377395629883, -10.630082130432129, -10.387785911560059, -10.145490646362305, -9.903194427490234, -9.66089916229248, -9.41860294342041, -9.176307678222656, -8.934011459350586, -8.691716194152832, -8.449419975280762, -8.207124710083008, -7.964828968048096, -7.722533226013184, -7.4802374839782715, -7.237941741943359, -6.995645999908447, -6.753350257873535, -6.511054992675781, -6.268758773803711, -6.026463508605957, -5.784167766571045, -5.541872024536133, -5.299576282501221, -5.057280540466309, -4.8149847984313965, -4.572689056396484, -4.3303937911987305, -4.08809757232666, -3.845801830291748, -3.603506088256836, -3.361210346221924, -3.1189146041870117, -2.8766188621520996, -2.6343233585357666, -2.3920276165008545, -2.1497321128845215, -1.9074363708496094, -1.6651406288146973, -1.4228450059890747, -1.1805492639541626, -0.9382535219192505, -0.6959578990936279, -0.4536621570587158, -0.2113664150238037, 0.03092929720878601, 0.27322500944137573, 0.5155206918716431, 0.7578164339065552, 1.0001121759414673, 1.2424077987670898, 1.484703540802002, 1.726999282836914, 1.9692950248718262, 2.2115907669067383, 2.4538865089416504, 2.6961822509765625, 2.9384779930114746, 3.1807734966278076, 3.4230692386627197, 3.665364980697632]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 4.0, 7.0, 9.0, 9.0, 12.0, 5.0, 20.0, 21.0, 37.0, 62.0, 73.0, 77.0, 94.0, 95.0, 101.0, 87.0, 80.0, 61.0, 40.0, 32.0, 18.0, 14.0, 12.0, 10.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.269471168518066, -7.0550079345703125, -6.840544700622559, -6.626081466674805, -6.411618232727051, -6.197154998779297, -5.982691764831543, -5.768228530883789, -5.553765296936035, -5.339302062988281, -5.124838829040527, -4.910375595092773, -4.6959123611450195, -4.481449127197266, -4.266985893249512, -4.052522659301758, -3.838059902191162, -3.623596668243408, -3.4091334342956543, -3.1946702003479004, -2.9802069664001465, -2.7657437324523926, -2.5512807369232178, -2.336817502975464, -2.12235426902771, -1.907891035079956, -1.6934278011322021, -1.4789646863937378, -1.2645014524459839, -1.05003821849823, -0.8355751037597656, -0.6211118698120117, -0.4066486358642578, -0.1921854317188263, 0.022277772426605225, 0.23674094676971436, 0.45120418071746826, 0.6656674146652222, 0.8801305294036865, 1.0945937633514404, 1.3090569972991943, 1.5235202312469482, 1.7379834651947021, 1.9524465799331665, 2.166909694671631, 2.3813729286193848, 2.5958361625671387, 2.8102993965148926, 3.0247626304626465, 3.2392258644104004, 3.4536890983581543, 3.668152332305908, 3.882615566253662, 4.097078800201416, 4.311541557312012, 4.526004791259766, 4.7404680252075195, 4.954931259155273, 5.169394493103027, 5.383857727050781, 5.598320960998535, 5.812784194946289, 6.027247428894043, 6.241710662841797, 6.456173896789551]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 4.0, 9.0, 7.0, 6.0, 7.0, 13.0, 7.0, 24.0, 24.0, 34.0, 31.0, 43.0, 63.0, 70.0, 103.0, 178.0, 266.0, 499.0, 985.0, 1788.0, 3919.0, 16587.0, 4064396.0, 93586.0, 7207.0, 2207.0, 1035.0, 526.0, 291.0, 156.0, 90.0, 52.0, 31.0, 13.0, 10.0, 6.0, 8.0, 3.0, 1.0, 5.0], "bins": [-5.359375, -5.2447662353515625, -5.130157470703125, -5.0155487060546875, -4.90093994140625, -4.7863311767578125, -4.671722412109375, -4.5571136474609375, -4.4425048828125, -4.3278961181640625, -4.213287353515625, -4.0986785888671875, -3.98406982421875, -3.8694610595703125, -3.754852294921875, -3.6402435302734375, -3.525634765625, -3.4110260009765625, -3.296417236328125, -3.1818084716796875, -3.06719970703125, -2.9525909423828125, -2.837982177734375, -2.7233734130859375, -2.6087646484375, -2.4941558837890625, -2.379547119140625, -2.2649383544921875, -2.15032958984375, -2.0357208251953125, -1.921112060546875, -1.8065032958984375, -1.69189453125, -1.5772857666015625, -1.462677001953125, -1.3480682373046875, -1.23345947265625, -1.1188507080078125, -1.004241943359375, -0.8896331787109375, -0.7750244140625, -0.6604156494140625, -0.545806884765625, -0.4311981201171875, -0.31658935546875, -0.2019805908203125, -0.087371826171875, 0.0272369384765625, 0.141845703125, 0.2564544677734375, 0.371063232421875, 0.4856719970703125, 0.60028076171875, 0.7148895263671875, 0.829498291015625, 0.9441070556640625, 1.0587158203125, 1.1733245849609375, 1.287933349609375, 1.4025421142578125, 1.51715087890625, 1.6317596435546875, 1.746368408203125, 1.8609771728515625, 1.9755859375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 5.0, 8.0, 4.0, 11.0, 5.0, 15.0, 9.0, 15.0, 30.0, 84.0, 209.0, 298.0, 158.0, 55.0, 24.0, 20.0, 9.0, 9.0, 9.0, 4.0, 7.0, 5.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0], "bins": [-0.260986328125, -0.25533199310302734, -0.2496776580810547, -0.24402332305908203, -0.23836898803710938, -0.23271465301513672, -0.22706031799316406, -0.2214059829711914, -0.21575164794921875, -0.2100973129272461, -0.20444297790527344, -0.19878864288330078, -0.19313430786132812, -0.18747997283935547, -0.1818256378173828, -0.17617130279541016, -0.1705169677734375, -0.16486263275146484, -0.1592082977294922, -0.15355396270751953, -0.14789962768554688, -0.14224529266357422, -0.13659095764160156, -0.1309366226196289, -0.12528228759765625, -0.1196279525756836, -0.11397361755371094, -0.10831928253173828, -0.10266494750976562, -0.09701061248779297, -0.09135627746582031, -0.08570194244384766, -0.080047607421875, -0.07439327239990234, -0.06873893737792969, -0.06308460235595703, -0.057430267333984375, -0.05177593231201172, -0.04612159729003906, -0.040467262268066406, -0.03481292724609375, -0.029158592224121094, -0.023504257202148438, -0.01784992218017578, -0.012195587158203125, -0.006541252136230469, -0.0008869171142578125, 0.004767417907714844, 0.0104217529296875, 0.016076087951660156, 0.021730422973632812, 0.02738475799560547, 0.033039093017578125, 0.03869342803955078, 0.04434776306152344, 0.050002098083496094, 0.05565643310546875, 0.061310768127441406, 0.06696510314941406, 0.07261943817138672, 0.07827377319335938, 0.08392810821533203, 0.08958244323730469, 0.09523677825927734, 0.10089111328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 12.0, 14.0, 20.0, 33.0, 59.0, 135.0, 283.0, 1371.0, 20289.0, 4139710.0, 30159.0, 1530.0, 330.0, 154.0, 81.0, 23.0, 18.0, 19.0, 10.0, 3.0, 10.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.587890625, -3.466461181640625, -3.34503173828125, -3.223602294921875, -3.1021728515625, -2.980743408203125, -2.85931396484375, -2.737884521484375, -2.616455078125, -2.495025634765625, -2.37359619140625, -2.252166748046875, -2.1307373046875, -2.009307861328125, -1.88787841796875, -1.766448974609375, -1.64501953125, -1.523590087890625, -1.40216064453125, -1.280731201171875, -1.1593017578125, -1.037872314453125, -0.91644287109375, -0.795013427734375, -0.673583984375, -0.552154541015625, -0.43072509765625, -0.309295654296875, -0.1878662109375, -0.066436767578125, 0.05499267578125, 0.176422119140625, 0.2978515625, 0.419281005859375, 0.54071044921875, 0.662139892578125, 0.7835693359375, 0.904998779296875, 1.02642822265625, 1.147857666015625, 1.269287109375, 1.390716552734375, 1.51214599609375, 1.633575439453125, 1.7550048828125, 1.876434326171875, 1.99786376953125, 2.119293212890625, 2.24072265625, 2.362152099609375, 2.48358154296875, 2.605010986328125, 2.7264404296875, 2.847869873046875, 2.96929931640625, 3.090728759765625, 3.212158203125, 3.333587646484375, 3.45501708984375, 3.576446533203125, 3.6978759765625, 3.819305419921875, 3.94073486328125, 4.062164306640625, 4.18359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 6.0, 2.0, 7.0, 15.0, 17.0, 34.0, 37.0, 66.0, 164.0, 725.0, 2407.0, 352.0, 99.0, 58.0, 29.0, 18.0, 12.0, 8.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3876953125, -0.3760414123535156, -0.36438751220703125, -0.3527336120605469, -0.3410797119140625, -0.3294258117675781, -0.31777191162109375, -0.3061180114746094, -0.294464111328125, -0.2828102111816406, -0.27115631103515625, -0.2595024108886719, -0.2478485107421875, -0.23619461059570312, -0.22454071044921875, -0.21288681030273438, -0.20123291015625, -0.18957901000976562, -0.17792510986328125, -0.16627120971679688, -0.1546173095703125, -0.14296340942382812, -0.13130950927734375, -0.11965560913085938, -0.108001708984375, -0.09634780883789062, -0.08469390869140625, -0.07304000854492188, -0.0613861083984375, -0.049732208251953125, -0.03807830810546875, -0.026424407958984375, -0.0147705078125, -0.003116607666015625, 0.00853729248046875, 0.020191192626953125, 0.0318450927734375, 0.043498992919921875, 0.05515289306640625, 0.06680679321289062, 0.078460693359375, 0.09011459350585938, 0.10176849365234375, 0.11342239379882812, 0.1250762939453125, 0.13673019409179688, 0.14838409423828125, 0.16003799438476562, 0.17169189453125, 0.18334579467773438, 0.19499969482421875, 0.20665359497070312, 0.2183074951171875, 0.22996139526367188, 0.24161529541015625, 0.2532691955566406, 0.264923095703125, 0.2765769958496094, 0.28823089599609375, 0.2998847961425781, 0.3115386962890625, 0.3231925964355469, 0.33484649658203125, 0.3465003967285156, 0.358154296875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 5.0, 13.0, 30.0, 209.0, 553.0, 160.0, 18.0, 8.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3447232246398926, -2.2490410804748535, -2.1533589363098145, -2.0576767921447754, -1.9619946479797363, -1.8663125038146973, -1.7706303596496582, -1.6749482154846191, -1.57926607131958, -1.483583927154541, -1.387901782989502, -1.292219638824463, -1.1965374946594238, -1.1008553504943848, -1.0051732063293457, -0.9094910025596619, -0.813808798789978, -0.718126654624939, -0.6224445104598999, -0.5267623662948608, -0.4310801923274994, -0.3353980481624603, -0.23971587419509888, -0.14403373003005981, -0.04835158586502075, 0.04733056575059891, 0.14301271736621857, 0.23869487643241882, 0.3343770205974579, 0.43005916476249695, 0.5257413387298584, 0.6214234828948975, 0.7171056270599365, 0.8127877712249756, 0.9084699153900146, 1.0041520595550537, 1.0998342037200928, 1.1955163478851318, 1.291198492050171, 1.38688063621521, 1.482562780380249, 1.578244924545288, 1.6739270687103271, 1.7696092128753662, 1.8652913570404053, 1.9609735012054443, 2.0566556453704834, 2.1523377895355225, 2.2480201721191406, 2.3437023162841797, 2.4393844604492188, 2.535066604614258, 2.630748748779297, 2.726430892944336, 2.822113037109375, 2.917795181274414, 3.013477325439453, 3.109159469604492, 3.2048416137695312, 3.3005237579345703, 3.3962059020996094, 3.4918880462646484, 3.5875701904296875, 3.6832523345947266, 3.7789344787597656]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 7.0, 6.0, 11.0, 14.0, 10.0, 20.0, 20.0, 39.0, 40.0, 46.0, 58.0, 66.0, 72.0, 80.0, 71.0, 76.0, 72.0, 51.0, 51.0, 34.0, 45.0, 21.0, 24.0, 14.0, 9.0, 7.0, 5.0, 4.0, 6.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1454839706420898, -1.1123164892196655, -1.0791491270065308, -1.0459816455841064, -1.0128141641616821, -0.9796468019485474, -0.946479320526123, -0.9133118987083435, -0.880144476890564, -0.8469770550727844, -0.8138095736503601, -0.7806421518325806, -0.747474730014801, -0.7143073081970215, -0.6811398267745972, -0.6479724049568176, -0.6148049235343933, -0.5816375017166138, -0.5484700202941895, -0.5153025984764099, -0.48213517665863037, -0.44896772503852844, -0.4158002734184265, -0.382632851600647, -0.34946539998054504, -0.3162979483604431, -0.2831305265426636, -0.24996307492256165, -0.2167956382036209, -0.18362820148468018, -0.15046074986457825, -0.11729331314563751, -0.08412587642669678, -0.050958435982465744, -0.01779099553823471, 0.015376448631286621, 0.048543885350227356, 0.08171132206916809, 0.11487877368927002, 0.14804621040821075, 0.1812136471271515, 0.21438108384609222, 0.24754852056503296, 0.2807159721851349, 0.3138834238052368, 0.34705084562301636, 0.3802182972431183, 0.4133857488632202, 0.44655317068099976, 0.4797206223011017, 0.5128880739212036, 0.5460554957389832, 0.5792229175567627, 0.612390398979187, 0.6455578207969666, 0.6787252426147461, 0.7118927240371704, 0.74506014585495, 0.7782276272773743, 0.8113950490951538, 0.8445624709129333, 0.8777298927307129, 0.9108973741531372, 0.9440647959709167, 0.9772322177886963]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 4.0, 10.0, 15.0, 22.0, 20.0, 17.0, 54.0, 69.0, 104.0, 135.0, 238.0, 410.0, 753.0, 1637.0, 4226.0, 16044.0, 256202.0, 733373.0, 25397.0, 5566.0, 1949.0, 960.0, 484.0, 292.0, 159.0, 118.0, 79.0, 55.0, 39.0, 36.0, 24.0, 17.0, 11.0, 11.0, 6.0, 4.0, 5.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5966796875, -1.545379638671875, -1.49407958984375, -1.442779541015625, -1.3914794921875, -1.340179443359375, -1.28887939453125, -1.237579345703125, -1.186279296875, -1.134979248046875, -1.08367919921875, -1.032379150390625, -0.9810791015625, -0.929779052734375, -0.87847900390625, -0.827178955078125, -0.77587890625, -0.724578857421875, -0.67327880859375, -0.621978759765625, -0.5706787109375, -0.519378662109375, -0.46807861328125, -0.416778564453125, -0.365478515625, -0.314178466796875, -0.26287841796875, -0.211578369140625, -0.1602783203125, -0.108978271484375, -0.05767822265625, -0.006378173828125, 0.044921875, 0.096221923828125, 0.14752197265625, 0.198822021484375, 0.2501220703125, 0.301422119140625, 0.35272216796875, 0.404022216796875, 0.455322265625, 0.506622314453125, 0.55792236328125, 0.609222412109375, 0.6605224609375, 0.711822509765625, 0.76312255859375, 0.814422607421875, 0.86572265625, 0.917022705078125, 0.96832275390625, 1.019622802734375, 1.0709228515625, 1.122222900390625, 1.17352294921875, 1.224822998046875, 1.276123046875, 1.327423095703125, 1.37872314453125, 1.430023193359375, 1.4813232421875, 1.532623291015625, 1.58392333984375, 1.635223388671875, 1.6865234375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 6.0, 7.0, 6.0, 14.0, 25.0, 49.0, 92.0, 184.0, 266.0, 163.0, 88.0, 39.0, 17.0, 12.0, 8.0, 10.0, 2.0, 4.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.263427734375, -0.25785160064697266, -0.2522754669189453, -0.24669933319091797, -0.24112319946289062, -0.23554706573486328, -0.22997093200683594, -0.2243947982788086, -0.21881866455078125, -0.2132425308227539, -0.20766639709472656, -0.20209026336669922, -0.19651412963867188, -0.19093799591064453, -0.1853618621826172, -0.17978572845458984, -0.1742095947265625, -0.16863346099853516, -0.1630573272705078, -0.15748119354248047, -0.15190505981445312, -0.14632892608642578, -0.14075279235839844, -0.1351766586303711, -0.12960052490234375, -0.1240243911743164, -0.11844825744628906, -0.11287212371826172, -0.10729598999023438, -0.10171985626220703, -0.09614372253417969, -0.09056758880615234, -0.084991455078125, -0.07941532135009766, -0.07383918762207031, -0.06826305389404297, -0.06268692016601562, -0.05711078643798828, -0.05153465270996094, -0.045958518981933594, -0.04038238525390625, -0.034806251525878906, -0.029230117797851562, -0.02365398406982422, -0.018077850341796875, -0.012501716613769531, -0.0069255828857421875, -0.0013494491577148438, 0.0042266845703125, 0.009802818298339844, 0.015378952026367188, 0.02095508575439453, 0.026531219482421875, 0.03210735321044922, 0.03768348693847656, 0.043259620666503906, 0.04883575439453125, 0.054411888122558594, 0.05998802185058594, 0.06556415557861328, 0.07114028930664062, 0.07671642303466797, 0.08229255676269531, 0.08786869049072266, 0.09344482421875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 6.0, 8.0, 12.0, 12.0, 26.0, 21.0, 40.0, 46.0, 78.0, 98.0, 153.0, 242.0, 395.0, 574.0, 1038.0, 1985.0, 5309.0, 20313.0, 125023.0, 651073.0, 201035.0, 28849.0, 6872.0, 2407.0, 1109.0, 629.0, 421.0, 255.0, 162.0, 101.0, 84.0, 48.0, 28.0, 22.0, 17.0, 14.0, 11.0, 9.0, 11.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8525390625, -0.8255767822265625, -0.798614501953125, -0.7716522216796875, -0.74468994140625, -0.7177276611328125, -0.690765380859375, -0.6638031005859375, -0.6368408203125, -0.6098785400390625, -0.582916259765625, -0.5559539794921875, -0.52899169921875, -0.5020294189453125, -0.475067138671875, -0.4481048583984375, -0.421142578125, -0.3941802978515625, -0.367218017578125, -0.3402557373046875, -0.31329345703125, -0.2863311767578125, -0.259368896484375, -0.2324066162109375, -0.2054443359375, -0.1784820556640625, -0.151519775390625, -0.1245574951171875, -0.09759521484375, -0.0706329345703125, -0.043670654296875, -0.0167083740234375, 0.01025390625, 0.0372161865234375, 0.064178466796875, 0.0911407470703125, 0.11810302734375, 0.1450653076171875, 0.172027587890625, 0.1989898681640625, 0.2259521484375, 0.2529144287109375, 0.279876708984375, 0.3068389892578125, 0.33380126953125, 0.3607635498046875, 0.387725830078125, 0.4146881103515625, 0.441650390625, 0.4686126708984375, 0.495574951171875, 0.5225372314453125, 0.54949951171875, 0.5764617919921875, 0.603424072265625, 0.6303863525390625, 0.6573486328125, 0.6843109130859375, 0.711273193359375, 0.7382354736328125, 0.76519775390625, 0.7921600341796875, 0.819122314453125, 0.8460845947265625, 0.873046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 5.0, 3.0, 7.0, 5.0, 11.0, 13.0, 13.0, 13.0, 23.0, 16.0, 15.0, 28.0, 27.0, 23.0, 27.0, 29.0, 34.0, 49.0, 35.0, 39.0, 51.0, 38.0, 40.0, 35.0, 34.0, 23.0, 47.0, 45.0, 22.0, 34.0, 27.0, 34.0, 22.0, 19.0, 12.0, 20.0, 13.0, 13.0, 6.0, 6.0, 6.0, 7.0, 6.0, 7.0, 10.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.36572265625, -0.35418701171875, -0.3426513671875, -0.33111572265625, -0.319580078125, -0.30804443359375, -0.2965087890625, -0.28497314453125, -0.2734375, -0.26190185546875, -0.2503662109375, -0.23883056640625, -0.227294921875, -0.21575927734375, -0.2042236328125, -0.19268798828125, -0.18115234375, -0.16961669921875, -0.1580810546875, -0.14654541015625, -0.135009765625, -0.12347412109375, -0.1119384765625, -0.10040283203125, -0.0888671875, -0.07733154296875, -0.0657958984375, -0.05426025390625, -0.042724609375, -0.03118896484375, -0.0196533203125, -0.00811767578125, 0.00341796875, 0.01495361328125, 0.0264892578125, 0.03802490234375, 0.049560546875, 0.06109619140625, 0.0726318359375, 0.08416748046875, 0.095703125, 0.10723876953125, 0.1187744140625, 0.13031005859375, 0.141845703125, 0.15338134765625, 0.1649169921875, 0.17645263671875, 0.18798828125, 0.19952392578125, 0.2110595703125, 0.22259521484375, 0.234130859375, 0.24566650390625, 0.2572021484375, 0.26873779296875, 0.2802734375, 0.29180908203125, 0.3033447265625, 0.31488037109375, 0.326416015625, 0.33795166015625, 0.3494873046875, 0.36102294921875, 0.37255859375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 7.0, 4.0, 6.0, 11.0, 22.0, 25.0, 56.0, 106.0, 228.0, 479.0, 1470.0, 7478.0, 154738.0, 854315.0, 25183.0, 2989.0, 769.0, 320.0, 160.0, 75.0, 42.0, 18.0, 15.0, 4.0, 15.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75390625, -0.7289810180664062, -0.7040557861328125, -0.6791305541992188, -0.654205322265625, -0.6292800903320312, -0.6043548583984375, -0.5794296264648438, -0.55450439453125, -0.5295791625976562, -0.5046539306640625, -0.47972869873046875, -0.454803466796875, -0.42987823486328125, -0.4049530029296875, -0.38002777099609375, -0.3551025390625, -0.33017730712890625, -0.3052520751953125, -0.28032684326171875, -0.255401611328125, -0.23047637939453125, -0.2055511474609375, -0.18062591552734375, -0.15570068359375, -0.13077545166015625, -0.1058502197265625, -0.08092498779296875, -0.055999755859375, -0.03107452392578125, -0.0061492919921875, 0.01877593994140625, 0.043701171875, 0.06862640380859375, 0.0935516357421875, 0.11847686767578125, 0.143402099609375, 0.16832733154296875, 0.1932525634765625, 0.21817779541015625, 0.24310302734375, 0.26802825927734375, 0.2929534912109375, 0.31787872314453125, 0.342803955078125, 0.36772918701171875, 0.3926544189453125, 0.41757965087890625, 0.4425048828125, 0.46743011474609375, 0.4923553466796875, 0.5172805786132812, 0.542205810546875, 0.5671310424804688, 0.5920562744140625, 0.6169815063476562, 0.64190673828125, 0.6668319702148438, 0.6917572021484375, 0.7166824340820312, 0.741607666015625, 0.7665328979492188, 0.7914581298828125, 0.8163833618164062, 0.84130859375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 8.0, 7.0, 17.0, 23.0, 30.0, 44.0, 71.0, 72.0, 110.0, 161.0, 127.0, 100.0, 51.0, 47.0, 44.0, 30.0, 20.0, 16.0, 9.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018513202667236328, -0.00017572380602359772, -0.00016631558537483215, -0.0001569073647260666, -0.00014749914407730103, -0.00013809092342853546, -0.0001286827027797699, -0.00011927448213100433, -0.00010986626148223877, -0.0001004580408334732, -9.104982018470764e-05, -8.164159953594208e-05, -7.223337888717651e-05, -6.282515823841095e-05, -5.3416937589645386e-05, -4.400871694087982e-05, -3.460049629211426e-05, -2.5192275643348694e-05, -1.578405499458313e-05, -6.375834345817566e-06, 3.032386302947998e-06, 1.2440606951713562e-05, 2.1848827600479126e-05, 3.125704824924469e-05, 4.0665268898010254e-05, 5.007348954677582e-05, 5.948171019554138e-05, 6.888993084430695e-05, 7.829815149307251e-05, 8.770637214183807e-05, 9.711459279060364e-05, 0.0001065228134393692, 0.00011593103408813477, 0.00012533925473690033, 0.0001347474753856659, 0.00014415569603443146, 0.00015356391668319702, 0.00016297213733196259, 0.00017238035798072815, 0.0001817885786294937, 0.00019119679927825928, 0.00020060501992702484, 0.0002100132405757904, 0.00021942146122455597, 0.00022882968187332153, 0.0002382379025220871, 0.00024764612317085266, 0.0002570543438196182, 0.0002664625644683838, 0.00027587078511714935, 0.0002852790057659149, 0.0002946872264146805, 0.00030409544706344604, 0.0003135036677122116, 0.00032291188836097717, 0.00033232010900974274, 0.0003417283296585083, 0.00035113655030727386, 0.00036054477095603943, 0.000369952991604805, 0.00037936121225357056, 0.0003887694329023361, 0.0003981776535511017, 0.00040758587419986725, 0.0004169940948486328]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 4.0, 6.0, 4.0, 12.0, 19.0, 37.0, 43.0, 83.0, 132.0, 257.0, 641.0, 1592.0, 6205.0, 67037.0, 888778.0, 74567.0, 6367.0, 1563.0, 591.0, 245.0, 143.0, 77.0, 56.0, 16.0, 15.0, 22.0, 11.0, 7.0, 6.0, 4.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97509765625, -0.948394775390625, -0.92169189453125, -0.894989013671875, -0.8682861328125, -0.841583251953125, -0.81488037109375, -0.788177490234375, -0.761474609375, -0.734771728515625, -0.70806884765625, -0.681365966796875, -0.6546630859375, -0.627960205078125, -0.60125732421875, -0.574554443359375, -0.5478515625, -0.521148681640625, -0.49444580078125, -0.467742919921875, -0.4410400390625, -0.414337158203125, -0.38763427734375, -0.360931396484375, -0.334228515625, -0.307525634765625, -0.28082275390625, -0.254119873046875, -0.2274169921875, -0.200714111328125, -0.17401123046875, -0.147308349609375, -0.12060546875, -0.093902587890625, -0.06719970703125, -0.040496826171875, -0.0137939453125, 0.012908935546875, 0.03961181640625, 0.066314697265625, 0.093017578125, 0.119720458984375, 0.14642333984375, 0.173126220703125, 0.1998291015625, 0.226531982421875, 0.25323486328125, 0.279937744140625, 0.306640625, 0.333343505859375, 0.36004638671875, 0.386749267578125, 0.4134521484375, 0.440155029296875, 0.46685791015625, 0.493560791015625, 0.520263671875, 0.546966552734375, 0.57366943359375, 0.600372314453125, 0.6270751953125, 0.653778076171875, 0.68048095703125, 0.707183837890625, 0.73388671875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 7.0, 6.0, 17.0, 17.0, 34.0, 42.0, 52.0, 65.0, 118.0, 148.0, 148.0, 104.0, 68.0, 59.0, 29.0, 29.0, 16.0, 9.0, 10.0, 13.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6728515625, -0.6575355529785156, -0.6422195434570312, -0.6269035339355469, -0.6115875244140625, -0.5962715148925781, -0.5809555053710938, -0.5656394958496094, -0.550323486328125, -0.5350074768066406, -0.5196914672851562, -0.5043754577636719, -0.4890594482421875, -0.4737434387207031, -0.45842742919921875, -0.4431114196777344, -0.42779541015625, -0.4124794006347656, -0.39716339111328125, -0.3818473815917969, -0.3665313720703125, -0.3512153625488281, -0.33589935302734375, -0.3205833435058594, -0.305267333984375, -0.2899513244628906, -0.27463531494140625, -0.2593193054199219, -0.2440032958984375, -0.22868728637695312, -0.21337127685546875, -0.19805526733398438, -0.1827392578125, -0.16742324829101562, -0.15210723876953125, -0.13679122924804688, -0.1214752197265625, -0.10615921020507812, -0.09084320068359375, -0.07552719116210938, -0.060211181640625, -0.044895172119140625, -0.02957916259765625, -0.014263153076171875, 0.0010528564453125, 0.016368865966796875, 0.03168487548828125, 0.047000885009765625, 0.06231689453125, 0.07763290405273438, 0.09294891357421875, 0.10826492309570312, 0.1235809326171875, 0.13889694213867188, 0.15421295166015625, 0.16952896118164062, 0.184844970703125, 0.20016098022460938, 0.21547698974609375, 0.23079299926757812, 0.2461090087890625, 0.2614250183105469, 0.27674102783203125, 0.2920570373535156, 0.307373046875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 6.0, 31.0, 328.0, 581.0, 51.0, 4.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.163188934326172, -25.557373046875, -24.95155906677246, -24.345745086669922, -23.73992919921875, -23.134113311767578, -22.52829933166504, -21.9224853515625, -21.316669464111328, -20.710853576660156, -20.105039596557617, -19.499225616455078, -18.893409729003906, -18.287593841552734, -17.681779861450195, -17.075965881347656, -16.470149993896484, -15.864335060119629, -15.258520126342773, -14.652705192565918, -14.046890258789062, -13.441075325012207, -12.835260391235352, -12.229445457458496, -11.62363052368164, -11.017815589904785, -10.41200065612793, -9.806185722351074, -9.200370788574219, -8.594555854797363, -7.988740921020508, -7.382925987243652, -6.777109146118164, -6.171294212341309, -5.565479278564453, -4.959664344787598, -4.353849411010742, -3.7480344772338867, -3.1422195434570312, -2.536404609680176, -1.9305896759033203, -1.3247747421264648, -0.7189598083496094, -0.1131448745727539, 0.49267005920410156, 1.098484992980957, 1.7042999267578125, 2.310114860534668, 2.9159297943115234, 3.521744728088379, 4.127559661865234, 4.73337459564209, 5.339189529418945, 5.945004463195801, 6.550819396972656, 7.156634330749512, 7.762449264526367, 8.368264198303223, 8.974079132080078, 9.579894065856934, 10.185708999633789, 10.791523933410645, 11.3973388671875, 12.003153800964355, 12.608968734741211]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 7.0, 6.0, 6.0, 8.0, 11.0, 8.0, 15.0, 24.0, 31.0, 25.0, 37.0, 32.0, 46.0, 51.0, 50.0, 53.0, 59.0, 63.0, 61.0, 59.0, 47.0, 49.0, 47.0, 28.0, 43.0, 30.0, 27.0, 18.0, 15.0, 10.0, 12.0, 0.0, 3.0, 6.0, 8.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.1264801025390625, -4.003203392028809, -3.8799262046813965, -3.7566492557525635, -3.6333723068237305, -3.5100955963134766, -3.3868186473846436, -3.2635416984558105, -3.1402647495269775, -3.0169878005981445, -2.8937108516693115, -2.7704339027404785, -2.6471571922302246, -2.5238800048828125, -2.4006032943725586, -2.2773263454437256, -2.1540493965148926, -2.0307724475860596, -1.9074954986572266, -1.784218668937683, -1.66094172000885, -1.537664771080017, -1.4143879413604736, -1.2911109924316406, -1.1678340435028076, -1.0445570945739746, -0.9212802052497864, -0.7980033159255981, -0.6747263669967651, -0.5514494180679321, -0.4281725287437439, -0.30489563941955566, -0.18161869049072266, -0.058341771364212036, 0.06493514776229858, 0.1882120668888092, 0.3114889860153198, 0.43476593494415283, 0.5580428242683411, 0.6813197135925293, 0.8045966625213623, 0.9278736114501953, 1.0511505603790283, 1.1744273900985718, 1.2977043390274048, 1.4209812879562378, 1.5442581176757812, 1.6675350666046143, 1.7908120155334473, 1.9140889644622803, 2.0373659133911133, 2.1606428623199463, 2.2839198112487793, 2.407196521759033, 2.530473470687866, 2.653750419616699, 2.7770273685455322, 2.9003043174743652, 3.0235812664031982, 3.1468582153320312, 3.270134925842285, 3.3934121131896973, 3.516688823699951, 3.639965772628784, 3.763242721557617]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 7.0, 11.0, 16.0, 23.0, 48.0, 72.0, 153.0, 447.0, 1835.0, 232926.0, 3956656.0, 1652.0, 292.0, 78.0, 25.0, 12.0, 9.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.96875, -10.73052978515625, -10.4923095703125, -10.25408935546875, -10.015869140625, -9.77764892578125, -9.5394287109375, -9.30120849609375, -9.06298828125, -8.82476806640625, -8.5865478515625, -8.34832763671875, -8.110107421875, -7.87188720703125, -7.6336669921875, -7.39544677734375, -7.1572265625, -6.91900634765625, -6.6807861328125, -6.44256591796875, -6.204345703125, -5.96612548828125, -5.7279052734375, -5.48968505859375, -5.25146484375, -5.01324462890625, -4.7750244140625, -4.53680419921875, -4.298583984375, -4.06036376953125, -3.8221435546875, -3.58392333984375, -3.345703125, -3.10748291015625, -2.8692626953125, -2.63104248046875, -2.392822265625, -2.15460205078125, -1.9163818359375, -1.67816162109375, -1.43994140625, -1.20172119140625, -0.9635009765625, -0.72528076171875, -0.487060546875, -0.24884033203125, -0.0106201171875, 0.22760009765625, 0.4658203125, 0.70404052734375, 0.9422607421875, 1.18048095703125, 1.418701171875, 1.65692138671875, 1.8951416015625, 2.13336181640625, 2.37158203125, 2.60980224609375, 2.8480224609375, 3.08624267578125, 3.324462890625, 3.56268310546875, 3.8009033203125, 4.03912353515625, 4.27734375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 4.0, 10.0, 23.0, 32.0, 66.0, 127.0, 225.0, 217.0, 135.0, 79.0, 27.0, 13.0, 10.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.3017578125, -0.2953205108642578, -0.2888832092285156, -0.28244590759277344, -0.27600860595703125, -0.26957130432128906, -0.2631340026855469, -0.2566967010498047, -0.2502593994140625, -0.2438220977783203, -0.23738479614257812, -0.23094749450683594, -0.22451019287109375, -0.21807289123535156, -0.21163558959960938, -0.2051982879638672, -0.198760986328125, -0.1923236846923828, -0.18588638305664062, -0.17944908142089844, -0.17301177978515625, -0.16657447814941406, -0.16013717651367188, -0.1536998748779297, -0.1472625732421875, -0.1408252716064453, -0.13438796997070312, -0.12795066833496094, -0.12151336669921875, -0.11507606506347656, -0.10863876342773438, -0.10220146179199219, -0.09576416015625, -0.08932685852050781, -0.08288955688476562, -0.07645225524902344, -0.07001495361328125, -0.06357765197753906, -0.057140350341796875, -0.05070304870605469, -0.0442657470703125, -0.03782844543457031, -0.031391143798828125, -0.024953842163085938, -0.01851654052734375, -0.012079238891601562, -0.005641937255859375, 0.0007953643798828125, 0.007232666015625, 0.013669967651367188, 0.020107269287109375, 0.026544570922851562, 0.03298187255859375, 0.03941917419433594, 0.045856475830078125, 0.05229377746582031, 0.0587310791015625, 0.06516838073730469, 0.07160568237304688, 0.07804298400878906, 0.08448028564453125, 0.09091758728027344, 0.09735488891601562, 0.10379219055175781, 0.1102294921875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 15.0, 22.0, 26.0, 60.0, 95.0, 237.0, 593.0, 2056.0, 12048.0, 258150.0, 3882584.0, 32841.0, 3999.0, 928.0, 300.0, 142.0, 74.0, 42.0, 24.0, 17.0, 11.0, 7.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.244140625, -2.1909637451171875, -2.137786865234375, -2.0846099853515625, -2.03143310546875, -1.9782562255859375, -1.925079345703125, -1.8719024658203125, -1.8187255859375, -1.7655487060546875, -1.712371826171875, -1.6591949462890625, -1.60601806640625, -1.5528411865234375, -1.499664306640625, -1.4464874267578125, -1.393310546875, -1.3401336669921875, -1.286956787109375, -1.2337799072265625, -1.18060302734375, -1.1274261474609375, -1.074249267578125, -1.0210723876953125, -0.9678955078125, -0.9147186279296875, -0.861541748046875, -0.8083648681640625, -0.75518798828125, -0.7020111083984375, -0.648834228515625, -0.5956573486328125, -0.54248046875, -0.4893035888671875, -0.436126708984375, -0.3829498291015625, -0.32977294921875, -0.2765960693359375, -0.223419189453125, -0.1702423095703125, -0.1170654296875, -0.0638885498046875, -0.010711669921875, 0.0424652099609375, 0.09564208984375, 0.1488189697265625, 0.201995849609375, 0.2551727294921875, 0.308349609375, 0.3615264892578125, 0.414703369140625, 0.4678802490234375, 0.52105712890625, 0.5742340087890625, 0.627410888671875, 0.6805877685546875, 0.7337646484375, 0.7869415283203125, 0.840118408203125, 0.8932952880859375, 0.94647216796875, 0.9996490478515625, 1.052825927734375, 1.1060028076171875, 1.1591796875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 9.0, 6.0, 9.0, 9.0, 11.0, 29.0, 37.0, 48.0, 110.0, 311.0, 1529.0, 1346.0, 281.0, 127.0, 71.0, 44.0, 33.0, 15.0, 17.0, 8.0, 3.0, 5.0, 4.0, 3.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2381591796875, -0.2304668426513672, -0.22277450561523438, -0.21508216857910156, -0.20738983154296875, -0.19969749450683594, -0.19200515747070312, -0.1843128204345703, -0.1766204833984375, -0.1689281463623047, -0.16123580932617188, -0.15354347229003906, -0.14585113525390625, -0.13815879821777344, -0.13046646118164062, -0.12277412414550781, -0.115081787109375, -0.10738945007324219, -0.09969711303710938, -0.09200477600097656, -0.08431243896484375, -0.07662010192871094, -0.06892776489257812, -0.06123542785644531, -0.0535430908203125, -0.04585075378417969, -0.038158416748046875, -0.030466079711914062, -0.02277374267578125, -0.015081405639648438, -0.007389068603515625, 0.0003032684326171875, 0.00799560546875, 0.015687942504882812, 0.023380279541015625, 0.031072616577148438, 0.03876495361328125, 0.04645729064941406, 0.054149627685546875, 0.06184196472167969, 0.0695343017578125, 0.07722663879394531, 0.08491897583007812, 0.09261131286621094, 0.10030364990234375, 0.10799598693847656, 0.11568832397460938, 0.12338066101074219, 0.131072998046875, 0.1387653350830078, 0.14645767211914062, 0.15415000915527344, 0.16184234619140625, 0.16953468322753906, 0.17722702026367188, 0.1849193572998047, 0.1926116943359375, 0.2003040313720703, 0.20799636840820312, 0.21568870544433594, 0.22338104248046875, 0.23107337951660156, 0.23876571655273438, 0.2464580535888672, 0.254150390625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 11.0, 87.0, 648.0, 242.0, 16.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.866507053375244, -4.717939853668213, -4.569372177124023, -4.420804977416992, -4.272237777709961, -4.1236701011657715, -3.9751029014587402, -3.82653546333313, -3.6779680252075195, -3.529400587081909, -3.380833148956299, -3.2322659492492676, -3.0836985111236572, -2.935131072998047, -2.7865638732910156, -2.6379964351654053, -2.489428997039795, -2.3408615589141846, -2.192294120788574, -2.043726921081543, -1.8951594829559326, -1.7465920448303223, -1.5980247259140015, -1.4494574069976807, -1.3008899688720703, -1.15232253074646, -1.0037552118301392, -0.8551878333091736, -0.706620454788208, -0.5580530762672424, -0.40948569774627686, -0.26091837882995605, -0.1123514175415039, 0.03621596097946167, 0.18478333950042725, 0.3333507180213928, 0.4819180965423584, 0.630485475063324, 0.7790528535842896, 0.9276201725006104, 1.0761876106262207, 1.224755048751831, 1.3733223676681519, 1.5218896865844727, 1.670457124710083, 1.8190245628356934, 1.9675918817520142, 2.116159200668335, 2.2647266387939453, 2.4132940769195557, 2.561861515045166, 2.7104287147521973, 2.8589961528778076, 3.007563591003418, 3.156130790710449, 3.3046982288360596, 3.45326566696167, 3.6018331050872803, 3.7504005432128906, 3.898967742919922, 4.047534942626953, 4.196102619171143, 4.344669818878174, 4.493237495422363, 4.6418046951293945]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 4.0, 9.0, 11.0, 13.0, 16.0, 11.0, 24.0, 24.0, 30.0, 33.0, 41.0, 33.0, 43.0, 49.0, 46.0, 67.0, 49.0, 57.0, 53.0, 50.0, 53.0, 50.0, 39.0, 40.0, 31.0, 22.0, 24.0, 11.0, 13.0, 8.0, 9.0, 8.0, 7.0, 3.0, 2.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8123870491981506, -0.7890617251396179, -0.7657364010810852, -0.7424110770225525, -0.7190857529640198, -0.6957604289054871, -0.6724351048469543, -0.6491097807884216, -0.6257844567298889, -0.6024591326713562, -0.5791338086128235, -0.5558084845542908, -0.5324831604957581, -0.5091578364372253, -0.4858325123786926, -0.4625071883201599, -0.4391818642616272, -0.4158565402030945, -0.39253121614456177, -0.36920589208602905, -0.34588056802749634, -0.3225552439689636, -0.2992299199104309, -0.2759045958518982, -0.2525792717933655, -0.22925394773483276, -0.20592862367630005, -0.18260329961776733, -0.15927797555923462, -0.1359526515007019, -0.11262732744216919, -0.08930200338363647, -0.06597673892974854, -0.04265141487121582, -0.019326090812683105, 0.003999233245849609, 0.027324557304382324, 0.05064988136291504, 0.07397520542144775, 0.09730052947998047, 0.12062585353851318, 0.1439511775970459, 0.1672765016555786, 0.19060182571411133, 0.21392714977264404, 0.23725247383117676, 0.2605777978897095, 0.2839031219482422, 0.3072284460067749, 0.3305537700653076, 0.35387909412384033, 0.37720441818237305, 0.40052974224090576, 0.4238550662994385, 0.4471803903579712, 0.4705057144165039, 0.4938310384750366, 0.5171563625335693, 0.540481686592102, 0.5638070106506348, 0.5871323347091675, 0.6104576587677002, 0.6337829828262329, 0.6571083068847656, 0.6804336309432983]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 9.0, 8.0, 3.0, 9.0, 13.0, 18.0, 30.0, 51.0, 54.0, 73.0, 118.0, 166.0, 259.0, 494.0, 894.0, 1826.0, 5834.0, 32452.0, 661137.0, 318344.0, 19203.0, 4135.0, 1558.0, 691.0, 396.0, 239.0, 172.0, 97.0, 70.0, 63.0, 59.0, 21.0, 17.0, 17.0, 15.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3037109375, -1.266326904296875, -1.22894287109375, -1.191558837890625, -1.1541748046875, -1.116790771484375, -1.07940673828125, -1.042022705078125, -1.004638671875, -0.967254638671875, -0.92987060546875, -0.892486572265625, -0.8551025390625, -0.817718505859375, -0.78033447265625, -0.742950439453125, -0.70556640625, -0.668182373046875, -0.63079833984375, -0.593414306640625, -0.5560302734375, -0.518646240234375, -0.48126220703125, -0.443878173828125, -0.406494140625, -0.369110107421875, -0.33172607421875, -0.294342041015625, -0.2569580078125, -0.219573974609375, -0.18218994140625, -0.144805908203125, -0.107421875, -0.070037841796875, -0.03265380859375, 0.004730224609375, 0.0421142578125, 0.079498291015625, 0.11688232421875, 0.154266357421875, 0.191650390625, 0.229034423828125, 0.26641845703125, 0.303802490234375, 0.3411865234375, 0.378570556640625, 0.41595458984375, 0.453338623046875, 0.49072265625, 0.528106689453125, 0.56549072265625, 0.602874755859375, 0.6402587890625, 0.677642822265625, 0.71502685546875, 0.752410888671875, 0.789794921875, 0.827178955078125, 0.86456298828125, 0.901947021484375, 0.9393310546875, 0.976715087890625, 1.01409912109375, 1.051483154296875, 1.0888671875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 16.0, 14.0, 42.0, 70.0, 134.0, 202.0, 203.0, 147.0, 84.0, 33.0, 18.0, 10.0, 4.0, 2.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.292724609375, -0.28661632537841797, -0.28050804138183594, -0.2743997573852539, -0.2682914733886719, -0.26218318939208984, -0.2560749053955078, -0.24996662139892578, -0.24385833740234375, -0.23775005340576172, -0.2316417694091797, -0.22553348541259766, -0.21942520141601562, -0.2133169174194336, -0.20720863342285156, -0.20110034942626953, -0.1949920654296875, -0.18888378143310547, -0.18277549743652344, -0.1766672134399414, -0.17055892944335938, -0.16445064544677734, -0.1583423614501953, -0.15223407745361328, -0.14612579345703125, -0.14001750946044922, -0.1339092254638672, -0.12780094146728516, -0.12169265747070312, -0.1155843734741211, -0.10947608947753906, -0.10336780548095703, -0.097259521484375, -0.09115123748779297, -0.08504295349121094, -0.0789346694946289, -0.07282638549804688, -0.06671810150146484, -0.06060981750488281, -0.05450153350830078, -0.04839324951171875, -0.04228496551513672, -0.03617668151855469, -0.030068397521972656, -0.023960113525390625, -0.017851829528808594, -0.011743545532226562, -0.005635261535644531, 0.0004730224609375, 0.006581306457519531, 0.012689590454101562, 0.018797874450683594, 0.024906158447265625, 0.031014442443847656, 0.03712272644042969, 0.04323101043701172, 0.04933929443359375, 0.05544757843017578, 0.06155586242675781, 0.06766414642333984, 0.07377243041992188, 0.0798807144165039, 0.08598899841308594, 0.09209728240966797, 0.09820556640625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 5.0, 3.0, 10.0, 17.0, 20.0, 27.0, 30.0, 52.0, 83.0, 119.0, 214.0, 349.0, 645.0, 1287.0, 2910.0, 7844.0, 29371.0, 163698.0, 588359.0, 202672.0, 35210.0, 9248.0, 3309.0, 1365.0, 718.0, 360.0, 204.0, 144.0, 74.0, 56.0, 38.0, 38.0, 22.0, 17.0, 9.0, 11.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5849609375, -0.5629348754882812, -0.5409088134765625, -0.5188827514648438, -0.496856689453125, -0.47483062744140625, -0.4528045654296875, -0.43077850341796875, -0.40875244140625, -0.38672637939453125, -0.3647003173828125, -0.34267425537109375, -0.320648193359375, -0.29862213134765625, -0.2765960693359375, -0.25457000732421875, -0.2325439453125, -0.21051788330078125, -0.1884918212890625, -0.16646575927734375, -0.144439697265625, -0.12241363525390625, -0.1003875732421875, -0.07836151123046875, -0.05633544921875, -0.03430938720703125, -0.0122833251953125, 0.00974273681640625, 0.031768798828125, 0.05379486083984375, 0.0758209228515625, 0.09784698486328125, 0.119873046875, 0.14189910888671875, 0.1639251708984375, 0.18595123291015625, 0.207977294921875, 0.23000335693359375, 0.2520294189453125, 0.27405548095703125, 0.29608154296875, 0.31810760498046875, 0.3401336669921875, 0.36215972900390625, 0.384185791015625, 0.40621185302734375, 0.4282379150390625, 0.45026397705078125, 0.4722900390625, 0.49431610107421875, 0.5163421630859375, 0.5383682250976562, 0.560394287109375, 0.5824203491210938, 0.6044464111328125, 0.6264724731445312, 0.64849853515625, 0.6705245971679688, 0.6925506591796875, 0.7145767211914062, 0.736602783203125, 0.7586288452148438, 0.7806549072265625, 0.8026809692382812, 0.82470703125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 4.0, 7.0, 10.0, 10.0, 16.0, 13.0, 17.0, 17.0, 22.0, 32.0, 39.0, 30.0, 36.0, 41.0, 49.0, 44.0, 34.0, 36.0, 45.0, 36.0, 36.0, 44.0, 47.0, 35.0, 28.0, 35.0, 33.0, 28.0, 18.0, 14.0, 26.0, 15.0, 19.0, 21.0, 12.0, 11.0, 11.0, 7.0, 2.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38427734375, -0.37104034423828125, -0.3578033447265625, -0.34456634521484375, -0.331329345703125, -0.31809234619140625, -0.3048553466796875, -0.29161834716796875, -0.27838134765625, -0.26514434814453125, -0.2519073486328125, -0.23867034912109375, -0.225433349609375, -0.21219635009765625, -0.1989593505859375, -0.18572235107421875, -0.1724853515625, -0.15924835205078125, -0.1460113525390625, -0.13277435302734375, -0.119537353515625, -0.10630035400390625, -0.0930633544921875, -0.07982635498046875, -0.06658935546875, -0.05335235595703125, -0.0401153564453125, -0.02687835693359375, -0.013641357421875, -0.00040435791015625, 0.0128326416015625, 0.02606964111328125, 0.039306640625, 0.05254364013671875, 0.0657806396484375, 0.07901763916015625, 0.092254638671875, 0.10549163818359375, 0.1187286376953125, 0.13196563720703125, 0.14520263671875, 0.15843963623046875, 0.1716766357421875, 0.18491363525390625, 0.198150634765625, 0.21138763427734375, 0.2246246337890625, 0.23786163330078125, 0.2510986328125, 0.26433563232421875, 0.2775726318359375, 0.29080963134765625, 0.304046630859375, 0.31728363037109375, 0.3305206298828125, 0.34375762939453125, 0.35699462890625, 0.37023162841796875, 0.3834686279296875, 0.39670562744140625, 0.409942626953125, 0.42317962646484375, 0.4364166259765625, 0.44965362548828125, 0.462890625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 10.0, 11.0, 18.0, 29.0, 40.0, 78.0, 118.0, 171.0, 412.0, 1033.0, 3190.0, 14557.0, 158774.0, 813243.0, 46541.0, 7047.0, 1902.0, 707.0, 315.0, 137.0, 81.0, 45.0, 18.0, 14.0, 18.0, 11.0, 9.0, 2.0, 7.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8359375, -0.810821533203125, -0.78570556640625, -0.760589599609375, -0.7354736328125, -0.710357666015625, -0.68524169921875, -0.660125732421875, -0.635009765625, -0.609893798828125, -0.58477783203125, -0.559661865234375, -0.5345458984375, -0.509429931640625, -0.48431396484375, -0.459197998046875, -0.43408203125, -0.408966064453125, -0.38385009765625, -0.358734130859375, -0.3336181640625, -0.308502197265625, -0.28338623046875, -0.258270263671875, -0.233154296875, -0.208038330078125, -0.18292236328125, -0.157806396484375, -0.1326904296875, -0.107574462890625, -0.08245849609375, -0.057342529296875, -0.0322265625, -0.007110595703125, 0.01800537109375, 0.043121337890625, 0.0682373046875, 0.093353271484375, 0.11846923828125, 0.143585205078125, 0.168701171875, 0.193817138671875, 0.21893310546875, 0.244049072265625, 0.2691650390625, 0.294281005859375, 0.31939697265625, 0.344512939453125, 0.36962890625, 0.394744873046875, 0.41986083984375, 0.444976806640625, 0.4700927734375, 0.495208740234375, 0.52032470703125, 0.545440673828125, 0.570556640625, 0.595672607421875, 0.62078857421875, 0.645904541015625, 0.6710205078125, 0.696136474609375, 0.72125244140625, 0.746368408203125, 0.771484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 6.0, 6.0, 15.0, 18.0, 24.0, 30.0, 38.0, 49.0, 56.0, 73.0, 105.0, 164.0, 106.0, 73.0, 61.0, 48.0, 32.0, 26.0, 17.0, 15.0, 5.0, 9.0, 6.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001996755599975586, -0.00019390136003494263, -0.00018812716007232666, -0.0001823529601097107, -0.00017657876014709473, -0.00017080456018447876, -0.0001650303602218628, -0.00015925616025924683, -0.00015348196029663086, -0.0001477077603340149, -0.00014193356037139893, -0.00013615936040878296, -0.000130385160446167, -0.00012461096048355103, -0.00011883676052093506, -0.00011306256055831909, -0.00010728836059570312, -0.00010151416063308716, -9.573996067047119e-05, -8.996576070785522e-05, -8.419156074523926e-05, -7.841736078262329e-05, -7.264316082000732e-05, -6.686896085739136e-05, -6.109476089477539e-05, -5.5320560932159424e-05, -4.954636096954346e-05, -4.377216100692749e-05, -3.7997961044311523e-05, -3.222376108169556e-05, -2.644956111907959e-05, -2.0675361156463623e-05, -1.4901161193847656e-05, -9.12696123123169e-06, -3.3527612686157227e-06, 2.421438694000244e-06, 8.195638656616211e-06, 1.3969838619232178e-05, 1.9744038581848145e-05, 2.551823854446411e-05, 3.129243850708008e-05, 3.7066638469696045e-05, 4.284083843231201e-05, 4.861503839492798e-05, 5.4389238357543945e-05, 6.016343832015991e-05, 6.593763828277588e-05, 7.171183824539185e-05, 7.748603820800781e-05, 8.326023817062378e-05, 8.903443813323975e-05, 9.480863809585571e-05, 0.00010058283805847168, 0.00010635703802108765, 0.00011213123798370361, 0.00011790543794631958, 0.00012367963790893555, 0.00012945383787155151, 0.00013522803783416748, 0.00014100223779678345, 0.00014677643775939941, 0.00015255063772201538, 0.00015832483768463135, 0.00016409903764724731, 0.00016987323760986328]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 6.0, 8.0, 13.0, 24.0, 33.0, 55.0, 91.0, 173.0, 342.0, 843.0, 2669.0, 11886.0, 125395.0, 844874.0, 52248.0, 6870.0, 1746.0, 622.0, 283.0, 128.0, 90.0, 47.0, 29.0, 18.0, 21.0, 7.0, 7.0, 1.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95361328125, -0.9199752807617188, -0.8863372802734375, -0.8526992797851562, -0.819061279296875, -0.7854232788085938, -0.7517852783203125, -0.7181472778320312, -0.68450927734375, -0.6508712768554688, -0.6172332763671875, -0.5835952758789062, -0.549957275390625, -0.5163192749023438, -0.4826812744140625, -0.44904327392578125, -0.4154052734375, -0.38176727294921875, -0.3481292724609375, -0.31449127197265625, -0.280853271484375, -0.24721527099609375, -0.2135772705078125, -0.17993927001953125, -0.14630126953125, -0.11266326904296875, -0.0790252685546875, -0.04538726806640625, -0.011749267578125, 0.02188873291015625, 0.0555267333984375, 0.08916473388671875, 0.122802734375, 0.15644073486328125, 0.1900787353515625, 0.22371673583984375, 0.257354736328125, 0.29099273681640625, 0.3246307373046875, 0.35826873779296875, 0.39190673828125, 0.42554473876953125, 0.4591827392578125, 0.49282073974609375, 0.526458740234375, 0.5600967407226562, 0.5937347412109375, 0.6273727416992188, 0.6610107421875, 0.6946487426757812, 0.7282867431640625, 0.7619247436523438, 0.795562744140625, 0.8292007446289062, 0.8628387451171875, 0.8964767456054688, 0.93011474609375, 0.9637527465820312, 0.9973907470703125, 1.0310287475585938, 1.064666748046875, 1.0983047485351562, 1.1319427490234375, 1.1655807495117188, 1.19921875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 6.0, 5.0, 8.0, 14.0, 14.0, 20.0, 24.0, 25.0, 44.0, 50.0, 82.0, 120.0, 134.0, 127.0, 92.0, 60.0, 47.0, 37.0, 23.0, 22.0, 12.0, 11.0, 9.0, 7.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6318359375, -0.6089630126953125, -0.586090087890625, -0.5632171630859375, -0.54034423828125, -0.5174713134765625, -0.494598388671875, -0.4717254638671875, -0.4488525390625, -0.4259796142578125, -0.403106689453125, -0.3802337646484375, -0.35736083984375, -0.3344879150390625, -0.311614990234375, -0.2887420654296875, -0.265869140625, -0.2429962158203125, -0.220123291015625, -0.1972503662109375, -0.17437744140625, -0.1515045166015625, -0.128631591796875, -0.1057586669921875, -0.0828857421875, -0.0600128173828125, -0.037139892578125, -0.0142669677734375, 0.00860595703125, 0.0314788818359375, 0.054351806640625, 0.0772247314453125, 0.10009765625, 0.1229705810546875, 0.145843505859375, 0.1687164306640625, 0.19158935546875, 0.2144622802734375, 0.237335205078125, 0.2602081298828125, 0.2830810546875, 0.3059539794921875, 0.328826904296875, 0.3516998291015625, 0.37457275390625, 0.3974456787109375, 0.420318603515625, 0.4431915283203125, 0.466064453125, 0.4889373779296875, 0.511810302734375, 0.5346832275390625, 0.55755615234375, 0.5804290771484375, 0.603302001953125, 0.6261749267578125, 0.6490478515625, 0.6719207763671875, 0.694793701171875, 0.7176666259765625, 0.74053955078125, 0.7634124755859375, 0.786285400390625, 0.8091583251953125, 0.83203125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 25.0, 142.0, 632.0, 169.0, 14.0, 16.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.485965728759766, -27.90035057067871, -27.314735412597656, -26.729122161865234, -26.14350700378418, -25.557891845703125, -24.972278594970703, -24.38666343688965, -23.801048278808594, -23.21543312072754, -22.629817962646484, -22.044204711914062, -21.458589553833008, -20.872974395751953, -20.28736114501953, -19.701745986938477, -19.116130828857422, -18.530515670776367, -17.944900512695312, -17.35928726196289, -16.773672103881836, -16.18805694580078, -15.602442741394043, -15.016828536987305, -14.43121337890625, -13.845598220825195, -13.259984016418457, -12.674369812011719, -12.088754653930664, -11.50313949584961, -10.917525291442871, -10.331911087036133, -9.746297836303711, -9.160682678222656, -8.575068473815918, -7.9894537925720215, -7.403839111328125, -6.8182244300842285, -6.232609748840332, -5.6469950675964355, -5.061380386352539, -4.475765705108643, -3.890151023864746, -3.3045363426208496, -2.718921661376953, -2.1333069801330566, -1.5476922988891602, -0.9620776176452637, -0.3764629364013672, 0.2091517448425293, 0.7947664260864258, 1.3803811073303223, 1.9659957885742188, 2.5516104698181152, 3.1372251510620117, 3.722839832305908, 4.308454513549805, 4.894069194793701, 5.479683876037598, 6.065298557281494, 6.650913238525391, 7.236527919769287, 7.822142601013184, 8.407756805419922, 8.993371963500977]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 5.0, 5.0, 9.0, 20.0, 15.0, 20.0, 17.0, 47.0, 23.0, 35.0, 30.0, 38.0, 45.0, 43.0, 61.0, 55.0, 67.0, 52.0, 55.0, 47.0, 42.0, 38.0, 33.0, 35.0, 34.0, 28.0, 22.0, 17.0, 9.0, 10.0, 16.0, 6.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-4.420712947845459, -4.3009161949157715, -4.181119441986084, -4.0613226890563965, -3.941525936126709, -3.8217291831970215, -3.701932430267334, -3.5821356773376465, -3.462338924407959, -3.3425421714782715, -3.222745418548584, -3.1029486656188965, -2.983151912689209, -2.8633551597595215, -2.743558406829834, -2.6237616539001465, -2.503964900970459, -2.3841681480407715, -2.264371395111084, -2.1445746421813965, -2.024777889251709, -1.9049811363220215, -1.785184383392334, -1.6653876304626465, -1.545590877532959, -1.4257941246032715, -1.305997371673584, -1.1862006187438965, -1.066403865814209, -0.9466071128845215, -0.826810359954834, -0.7070136070251465, -0.587216854095459, -0.4674201011657715, -0.347623348236084, -0.22782659530639648, -0.10802984237670898, 0.011766910552978516, 0.13156366348266602, 0.2513604164123535, 0.371157169342041, 0.4909539222717285, 0.610750675201416, 0.7305474281311035, 0.850344181060791, 0.9701409339904785, 1.089937686920166, 1.2097344398498535, 1.329531192779541, 1.4493279457092285, 1.569124698638916, 1.6889214515686035, 1.808718204498291, 1.9285149574279785, 2.048311710357666, 2.1681084632873535, 2.287905216217041, 2.4077019691467285, 2.527498722076416, 2.6472954750061035, 2.767092227935791, 2.8868889808654785, 3.006685733795166, 3.1264824867248535, 3.246279239654541]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 1.0, 3.0, 3.0, 6.0, 5.0, 5.0, 9.0, 7.0, 7.0, 25.0, 24.0, 25.0, 38.0, 43.0, 69.0, 83.0, 95.0, 205.0, 371.0, 649.0, 1354.0, 3273.0, 12811.0, 255788.0, 3888839.0, 23337.0, 4415.0, 1503.0, 616.0, 295.0, 157.0, 83.0, 52.0, 27.0, 20.0, 9.0, 13.0, 9.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.8974609375, -1.8544921875, -1.8115234375, -1.7685546875, -1.7255859375, -1.6826171875, -1.6396484375, -1.5966796875, -1.5537109375, -1.5107421875, -1.4677734375, -1.4248046875, -1.3818359375, -1.3388671875, -1.2958984375, -1.2529296875, -1.2099609375, -1.1669921875, -1.1240234375, -1.0810546875, -1.0380859375, -0.9951171875, -0.9521484375, -0.9091796875, -0.8662109375, -0.8232421875, -0.7802734375, -0.7373046875, -0.6943359375, -0.6513671875, -0.6083984375, -0.5654296875, -0.5224609375, -0.4794921875, -0.4365234375, -0.3935546875, -0.3505859375, -0.3076171875, -0.2646484375, -0.2216796875, -0.1787109375, -0.1357421875, -0.0927734375, -0.0498046875, -0.0068359375, 0.0361328125, 0.0791015625, 0.1220703125, 0.1650390625, 0.2080078125, 0.2509765625, 0.2939453125, 0.3369140625, 0.3798828125, 0.4228515625, 0.4658203125, 0.5087890625, 0.5517578125, 0.5947265625, 0.6376953125, 0.6806640625, 0.7236328125, 0.7666015625, 0.8095703125, 0.8525390625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 7.0, 15.0, 25.0, 38.0, 72.0, 98.0, 138.0, 143.0, 142.0, 125.0, 72.0, 50.0, 29.0, 13.0, 7.0, 10.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0], "bins": [-0.27978515625, -0.2738943099975586, -0.2680034637451172, -0.2621126174926758, -0.2562217712402344, -0.25033092498779297, -0.24444007873535156, -0.23854923248291016, -0.23265838623046875, -0.22676753997802734, -0.22087669372558594, -0.21498584747314453, -0.20909500122070312, -0.20320415496826172, -0.1973133087158203, -0.1914224624633789, -0.1855316162109375, -0.1796407699584961, -0.1737499237060547, -0.16785907745361328, -0.16196823120117188, -0.15607738494873047, -0.15018653869628906, -0.14429569244384766, -0.13840484619140625, -0.13251399993896484, -0.12662315368652344, -0.12073230743408203, -0.11484146118164062, -0.10895061492919922, -0.10305976867675781, -0.0971689224243164, -0.091278076171875, -0.0853872299194336, -0.07949638366699219, -0.07360553741455078, -0.06771469116210938, -0.06182384490966797, -0.05593299865722656, -0.050042152404785156, -0.04415130615234375, -0.038260459899902344, -0.03236961364746094, -0.02647876739501953, -0.020587921142578125, -0.014697074890136719, -0.008806228637695312, -0.0029153823852539062, 0.0029754638671875, 0.008866310119628906, 0.014757156372070312, 0.02064800262451172, 0.026538848876953125, 0.03242969512939453, 0.03832054138183594, 0.044211387634277344, 0.05010223388671875, 0.055993080139160156, 0.06188392639160156, 0.06777477264404297, 0.07366561889648438, 0.07955646514892578, 0.08544731140136719, 0.0913381576538086, 0.09722900390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 1.0, 5.0, 3.0, 10.0, 12.0, 16.0, 33.0, 47.0, 89.0, 168.0, 363.0, 806.0, 2119.0, 7246.0, 41005.0, 3817428.0, 302189.0, 16878.0, 3689.0, 1257.0, 453.0, 216.0, 108.0, 52.0, 26.0, 14.0, 17.0, 6.0, 5.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2236328125, -1.1903762817382812, -1.1571197509765625, -1.1238632202148438, -1.090606689453125, -1.0573501586914062, -1.0240936279296875, -0.9908370971679688, -0.95758056640625, -0.9243240356445312, -0.8910675048828125, -0.8578109741210938, -0.824554443359375, -0.7912979125976562, -0.7580413818359375, -0.7247848510742188, -0.6915283203125, -0.6582717895507812, -0.6250152587890625, -0.5917587280273438, -0.558502197265625, -0.5252456665039062, -0.4919891357421875, -0.45873260498046875, -0.42547607421875, -0.39221954345703125, -0.3589630126953125, -0.32570648193359375, -0.292449951171875, -0.25919342041015625, -0.2259368896484375, -0.19268035888671875, -0.159423828125, -0.12616729736328125, -0.0929107666015625, -0.05965423583984375, -0.026397705078125, 0.00685882568359375, 0.0401153564453125, 0.07337188720703125, 0.10662841796875, 0.13988494873046875, 0.1731414794921875, 0.20639801025390625, 0.239654541015625, 0.27291107177734375, 0.3061676025390625, 0.33942413330078125, 0.3726806640625, 0.40593719482421875, 0.4391937255859375, 0.47245025634765625, 0.505706787109375, 0.5389633178710938, 0.5722198486328125, 0.6054763793945312, 0.63873291015625, 0.6719894409179688, 0.7052459716796875, 0.7385025024414062, 0.771759033203125, 0.8050155639648438, 0.8382720947265625, 0.8715286254882812, 0.90478515625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 10.0, 10.0, 7.0, 18.0, 20.0, 42.0, 53.0, 130.0, 264.0, 1091.0, 1706.0, 388.0, 156.0, 58.0, 47.0, 23.0, 7.0, 12.0, 4.0, 4.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.22412109375, -0.21713638305664062, -0.21015167236328125, -0.20316696166992188, -0.1961822509765625, -0.18919754028320312, -0.18221282958984375, -0.17522811889648438, -0.168243408203125, -0.16125869750976562, -0.15427398681640625, -0.14728927612304688, -0.1403045654296875, -0.13331985473632812, -0.12633514404296875, -0.11935043334960938, -0.11236572265625, -0.10538101196289062, -0.09839630126953125, -0.09141159057617188, -0.0844268798828125, -0.07744216918945312, -0.07045745849609375, -0.06347274780273438, -0.056488037109375, -0.049503326416015625, -0.04251861572265625, -0.035533905029296875, -0.0285491943359375, -0.021564483642578125, -0.01457977294921875, -0.007595062255859375, -0.0006103515625, 0.006374359130859375, 0.01335906982421875, 0.020343780517578125, 0.0273284912109375, 0.034313201904296875, 0.04129791259765625, 0.048282623291015625, 0.055267333984375, 0.062252044677734375, 0.06923675537109375, 0.07622146606445312, 0.0832061767578125, 0.09019088745117188, 0.09717559814453125, 0.10416030883789062, 0.11114501953125, 0.11812973022460938, 0.12511444091796875, 0.13209915161132812, 0.1390838623046875, 0.14606857299804688, 0.15305328369140625, 0.16003799438476562, 0.167022705078125, 0.17400741577148438, 0.18099212646484375, 0.18797683715820312, 0.1949615478515625, 0.20194625854492188, 0.20893096923828125, 0.21591567993164062, 0.222900390625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 11.0, 17.0, 33.0, 131.0, 292.0, 364.0, 118.0, 32.0, 4.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6790753602981567, -1.6150943040847778, -1.551113247871399, -1.4871323108673096, -1.4231512546539307, -1.3591701984405518, -1.2951891422271729, -1.231208086013794, -1.167227029800415, -1.1032459735870361, -1.0392649173736572, -0.9752839207649231, -0.911302924156189, -0.8473218679428101, -0.7833408117294312, -0.7193597555160522, -0.6553788185119629, -0.591397762298584, -0.5274167656898499, -0.46343570947647095, -0.39945468306541443, -0.3354736566543579, -0.271492600440979, -0.20751157402992249, -0.14353054761886597, -0.07954951375722885, -0.015568479895591736, 0.04841256141662598, 0.1123935878276825, 0.176374614238739, 0.24035567045211792, 0.30433669686317444, 0.3683178424835205, 0.432298868894577, 0.49627989530563354, 0.5602609515190125, 0.6242419481277466, 0.6882230043411255, 0.7522040605545044, 0.8161851167678833, 0.8801661133766174, 0.9441471695899963, 1.0081281661987305, 1.0721092224121094, 1.1360902786254883, 1.2000713348388672, 1.264052391052246, 1.3280333280563354, 1.3920143842697144, 1.4559954404830933, 1.5199764966964722, 1.5839574337005615, 1.6479384899139404, 1.7119195461273193, 1.7759006023406982, 1.8398816585540771, 1.903862714767456, 1.967843770980835, 2.031824827194214, 2.0958058834075928, 2.1597869396209717, 2.2237677574157715, 2.2877488136291504, 2.3517298698425293, 2.415710926055908]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 16.0, 7.0, 9.0, 19.0, 23.0, 28.0, 19.0, 36.0, 35.0, 55.0, 47.0, 60.0, 53.0, 63.0, 61.0, 75.0, 61.0, 59.0, 63.0, 38.0, 34.0, 21.0, 22.0, 22.0, 23.0, 12.0, 8.0, 9.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6316056847572327, -0.6094751358032227, -0.5873446464538574, -0.5652140974998474, -0.5430835485458374, -0.5209530591964722, -0.49882251024246216, -0.47669199109077454, -0.4545614719390869, -0.4324309527873993, -0.41030043363571167, -0.38816988468170166, -0.36603936553001404, -0.3439088463783264, -0.3217782974243164, -0.2996477782726288, -0.27751725912094116, -0.25538673996925354, -0.23325620591640472, -0.2111256718635559, -0.1889951527118683, -0.16686463356018066, -0.14473409950733185, -0.12260356545448303, -0.10047304630279541, -0.07834251970052719, -0.05621199309825897, -0.03408146649599075, -0.011950939893722534, 0.010179586708545685, 0.032310113310813904, 0.05444064736366272, 0.07657116651535034, 0.09870169311761856, 0.12083221971988678, 0.1429627537727356, 0.16509327292442322, 0.18722379207611084, 0.20935432612895966, 0.23148486018180847, 0.2536153793334961, 0.2757458984851837, 0.29787641763687134, 0.32000696659088135, 0.34213748574256897, 0.3642680048942566, 0.3863985538482666, 0.4085290729999542, 0.43065959215164185, 0.45279011130332947, 0.4749206304550171, 0.4970511794090271, 0.5191817283630371, 0.5413122177124023, 0.5634427666664124, 0.5855733156204224, 0.6077038049697876, 0.6298343539237976, 0.6519648432731628, 0.6740953922271729, 0.6962258815765381, 0.7183564305305481, 0.7404869794845581, 0.7626174688339233, 0.7847480177879333]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 9.0, 3.0, 12.0, 15.0, 13.0, 25.0, 34.0, 43.0, 44.0, 73.0, 79.0, 136.0, 170.0, 269.0, 472.0, 818.0, 1583.0, 3998.0, 15649.0, 165296.0, 743042.0, 98501.0, 11422.0, 3321.0, 1386.0, 780.0, 434.0, 288.0, 194.0, 135.0, 83.0, 68.0, 35.0, 35.0, 15.0, 16.0, 23.0, 10.0, 6.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.703125, -0.6792144775390625, -0.655303955078125, -0.6313934326171875, -0.60748291015625, -0.5835723876953125, -0.559661865234375, -0.5357513427734375, -0.5118408203125, -0.4879302978515625, -0.464019775390625, -0.4401092529296875, -0.41619873046875, -0.3922882080078125, -0.368377685546875, -0.3444671630859375, -0.320556640625, -0.2966461181640625, -0.272735595703125, -0.2488250732421875, -0.22491455078125, -0.2010040283203125, -0.177093505859375, -0.1531829833984375, -0.1292724609375, -0.1053619384765625, -0.081451416015625, -0.0575408935546875, -0.03363037109375, -0.0097198486328125, 0.014190673828125, 0.0381011962890625, 0.06201171875, 0.0859222412109375, 0.109832763671875, 0.1337432861328125, 0.15765380859375, 0.1815643310546875, 0.205474853515625, 0.2293853759765625, 0.2532958984375, 0.2772064208984375, 0.301116943359375, 0.3250274658203125, 0.34893798828125, 0.3728485107421875, 0.396759033203125, 0.4206695556640625, 0.444580078125, 0.4684906005859375, 0.492401123046875, 0.5163116455078125, 0.54022216796875, 0.5641326904296875, 0.588043212890625, 0.6119537353515625, 0.6358642578125, 0.6597747802734375, 0.683685302734375, 0.7075958251953125, 0.73150634765625, 0.7554168701171875, 0.779327392578125, 0.8032379150390625, 0.8271484375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 1.0, 2.0, 5.0, 12.0, 13.0, 25.0, 59.0, 79.0, 123.0, 131.0, 144.0, 146.0, 93.0, 68.0, 39.0, 24.0, 9.0, 8.0, 8.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.25830078125, -0.2527008056640625, -0.247100830078125, -0.2415008544921875, -0.23590087890625, -0.2303009033203125, -0.224700927734375, -0.2191009521484375, -0.2135009765625, -0.2079010009765625, -0.202301025390625, -0.1967010498046875, -0.19110107421875, -0.1855010986328125, -0.179901123046875, -0.1743011474609375, -0.168701171875, -0.1631011962890625, -0.157501220703125, -0.1519012451171875, -0.14630126953125, -0.1407012939453125, -0.135101318359375, -0.1295013427734375, -0.1239013671875, -0.1183013916015625, -0.112701416015625, -0.1071014404296875, -0.10150146484375, -0.0959014892578125, -0.090301513671875, -0.0847015380859375, -0.0791015625, -0.0735015869140625, -0.067901611328125, -0.0623016357421875, -0.05670166015625, -0.0511016845703125, -0.045501708984375, -0.0399017333984375, -0.0343017578125, -0.0287017822265625, -0.023101806640625, -0.0175018310546875, -0.01190185546875, -0.0063018798828125, -0.000701904296875, 0.0048980712890625, 0.010498046875, 0.0160980224609375, 0.021697998046875, 0.0272979736328125, 0.03289794921875, 0.0384979248046875, 0.044097900390625, 0.0496978759765625, 0.0552978515625, 0.0608978271484375, 0.066497802734375, 0.0720977783203125, 0.07769775390625, 0.0832977294921875, 0.088897705078125, 0.0944976806640625, 0.10009765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 14.0, 11.0, 16.0, 23.0, 29.0, 51.0, 68.0, 127.0, 178.0, 276.0, 460.0, 815.0, 1759.0, 3831.0, 10175.0, 31803.0, 121149.0, 420985.0, 334006.0, 85202.0, 23198.0, 7898.0, 3143.0, 1474.0, 720.0, 382.0, 256.0, 145.0, 101.0, 70.0, 67.0, 34.0, 23.0, 16.0, 12.0, 5.0, 12.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.486328125, -0.47153472900390625, -0.4567413330078125, -0.44194793701171875, -0.427154541015625, -0.41236114501953125, -0.3975677490234375, -0.38277435302734375, -0.36798095703125, -0.35318756103515625, -0.3383941650390625, -0.32360076904296875, -0.308807373046875, -0.29401397705078125, -0.2792205810546875, -0.26442718505859375, -0.2496337890625, -0.23484039306640625, -0.2200469970703125, -0.20525360107421875, -0.190460205078125, -0.17566680908203125, -0.1608734130859375, -0.14608001708984375, -0.13128662109375, -0.11649322509765625, -0.1016998291015625, -0.08690643310546875, -0.072113037109375, -0.05731964111328125, -0.0425262451171875, -0.02773284912109375, -0.012939453125, 0.00185394287109375, 0.0166473388671875, 0.03144073486328125, 0.046234130859375, 0.06102752685546875, 0.0758209228515625, 0.09061431884765625, 0.10540771484375, 0.12020111083984375, 0.1349945068359375, 0.14978790283203125, 0.164581298828125, 0.17937469482421875, 0.1941680908203125, 0.20896148681640625, 0.2237548828125, 0.23854827880859375, 0.2533416748046875, 0.26813507080078125, 0.282928466796875, 0.29772186279296875, 0.3125152587890625, 0.32730865478515625, 0.34210205078125, 0.35689544677734375, 0.3716888427734375, 0.38648223876953125, 0.401275634765625, 0.41606903076171875, 0.4308624267578125, 0.44565582275390625, 0.46044921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 3.0, 4.0, 5.0, 6.0, 4.0, 12.0, 18.0, 15.0, 24.0, 24.0, 14.0, 33.0, 26.0, 29.0, 45.0, 32.0, 36.0, 31.0, 58.0, 39.0, 47.0, 43.0, 35.0, 35.0, 52.0, 42.0, 45.0, 24.0, 32.0, 27.0, 26.0, 22.0, 19.0, 18.0, 14.0, 13.0, 8.0, 9.0, 5.0, 11.0, 3.0, 6.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.381591796875, -0.3689002990722656, -0.35620880126953125, -0.3435173034667969, -0.3308258056640625, -0.3181343078613281, -0.30544281005859375, -0.2927513122558594, -0.280059814453125, -0.2673683166503906, -0.25467681884765625, -0.24198532104492188, -0.2292938232421875, -0.21660232543945312, -0.20391082763671875, -0.19121932983398438, -0.17852783203125, -0.16583633422851562, -0.15314483642578125, -0.14045333862304688, -0.1277618408203125, -0.11507034301757812, -0.10237884521484375, -0.08968734741210938, -0.076995849609375, -0.06430435180664062, -0.05161285400390625, -0.038921356201171875, -0.0262298583984375, -0.013538360595703125, -0.00084686279296875, 0.011844635009765625, 0.0245361328125, 0.037227630615234375, 0.04991912841796875, 0.06261062622070312, 0.0753021240234375, 0.08799362182617188, 0.10068511962890625, 0.11337661743164062, 0.126068115234375, 0.13875961303710938, 0.15145111083984375, 0.16414260864257812, 0.1768341064453125, 0.18952560424804688, 0.20221710205078125, 0.21490859985351562, 0.22760009765625, 0.24029159545898438, 0.25298309326171875, 0.2656745910644531, 0.2783660888671875, 0.2910575866699219, 0.30374908447265625, 0.3164405822753906, 0.329132080078125, 0.3418235778808594, 0.35451507568359375, 0.3672065734863281, 0.3798980712890625, 0.3925895690917969, 0.40528106689453125, 0.4179725646972656, 0.4306640625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 6.0, 8.0, 13.0, 21.0, 23.0, 31.0, 54.0, 94.0, 142.0, 207.0, 332.0, 573.0, 1080.0, 2271.0, 5845.0, 20521.0, 136193.0, 719391.0, 130907.0, 20248.0, 5769.0, 2302.0, 1068.0, 548.0, 300.0, 187.0, 116.0, 80.0, 74.0, 32.0, 38.0, 21.0, 10.0, 8.0, 7.0, 6.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.271484375, -0.26258087158203125, -0.2536773681640625, -0.24477386474609375, -0.235870361328125, -0.22696685791015625, -0.2180633544921875, -0.20915985107421875, -0.20025634765625, -0.19135284423828125, -0.1824493408203125, -0.17354583740234375, -0.164642333984375, -0.15573883056640625, -0.1468353271484375, -0.13793182373046875, -0.1290283203125, -0.12012481689453125, -0.1112213134765625, -0.10231781005859375, -0.093414306640625, -0.08451080322265625, -0.0756072998046875, -0.06670379638671875, -0.05780029296875, -0.04889678955078125, -0.0399932861328125, -0.03108978271484375, -0.022186279296875, -0.01328277587890625, -0.0043792724609375, 0.00452423095703125, 0.013427734375, 0.02233123779296875, 0.0312347412109375, 0.04013824462890625, 0.049041748046875, 0.05794525146484375, 0.0668487548828125, 0.07575225830078125, 0.08465576171875, 0.09355926513671875, 0.1024627685546875, 0.11136627197265625, 0.120269775390625, 0.12917327880859375, 0.1380767822265625, 0.14698028564453125, 0.1558837890625, 0.16478729248046875, 0.1736907958984375, 0.18259429931640625, 0.191497802734375, 0.20040130615234375, 0.2093048095703125, 0.21820831298828125, 0.22711181640625, 0.23601531982421875, 0.2449188232421875, 0.25382232666015625, 0.262725830078125, 0.27162933349609375, 0.2805328369140625, 0.28943634033203125, 0.29833984375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 7.0, 4.0, 8.0, 7.0, 11.0, 15.0, 12.0, 15.0, 23.0, 26.0, 21.0, 28.0, 29.0, 43.0, 54.0, 57.0, 92.0, 106.0, 84.0, 66.0, 51.0, 46.0, 27.0, 31.0, 28.0, 14.0, 17.0, 11.0, 18.0, 6.0, 12.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.565187454223633e-05, -8.27442854642868e-05, -7.983669638633728e-05, -7.692910730838776e-05, -7.402151823043823e-05, -7.111392915248871e-05, -6.820634007453918e-05, -6.529875099658966e-05, -6.239116191864014e-05, -5.948357284069061e-05, -5.657598376274109e-05, -5.3668394684791565e-05, -5.076080560684204e-05, -4.785321652889252e-05, -4.494562745094299e-05, -4.203803837299347e-05, -3.9130449295043945e-05, -3.622286021709442e-05, -3.33152711391449e-05, -3.0407682061195374e-05, -2.750009298324585e-05, -2.4592503905296326e-05, -2.1684914827346802e-05, -1.8777325749397278e-05, -1.5869736671447754e-05, -1.296214759349823e-05, -1.0054558515548706e-05, -7.146969437599182e-06, -4.239380359649658e-06, -1.3317912817001343e-06, 1.5757977962493896e-06, 4.4833868741989136e-06, 7.3909759521484375e-06, 1.0298565030097961e-05, 1.3206154108047485e-05, 1.611374318599701e-05, 1.9021332263946533e-05, 2.1928921341896057e-05, 2.483651041984558e-05, 2.7744099497795105e-05, 3.065168857574463e-05, 3.355927765369415e-05, 3.646686673164368e-05, 3.93744558095932e-05, 4.2282044887542725e-05, 4.518963396549225e-05, 4.809722304344177e-05, 5.1004812121391296e-05, 5.391240119934082e-05, 5.6819990277290344e-05, 5.972757935523987e-05, 6.263516843318939e-05, 6.554275751113892e-05, 6.845034658908844e-05, 7.135793566703796e-05, 7.426552474498749e-05, 7.717311382293701e-05, 8.008070290088654e-05, 8.298829197883606e-05, 8.589588105678558e-05, 8.880347013473511e-05, 9.171105921268463e-05, 9.461864829063416e-05, 9.752623736858368e-05, 0.0001004338264465332]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 20.0, 17.0, 30.0, 34.0, 100.0, 160.0, 330.0, 785.0, 2352.0, 9346.0, 69983.0, 787353.0, 157216.0, 15555.0, 3328.0, 1096.0, 413.0, 179.0, 102.0, 52.0, 33.0, 19.0, 8.0, 8.0, 5.0, 4.0, 5.0, 2.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.422607421875, -0.4083518981933594, -0.39409637451171875, -0.3798408508300781, -0.3655853271484375, -0.3513298034667969, -0.33707427978515625, -0.3228187561035156, -0.308563232421875, -0.2943077087402344, -0.28005218505859375, -0.2657966613769531, -0.2515411376953125, -0.23728561401367188, -0.22303009033203125, -0.20877456665039062, -0.19451904296875, -0.18026351928710938, -0.16600799560546875, -0.15175247192382812, -0.1374969482421875, -0.12324142456054688, -0.10898590087890625, -0.09473037719726562, -0.080474853515625, -0.06621932983398438, -0.05196380615234375, -0.037708282470703125, -0.0234527587890625, -0.009197235107421875, 0.00505828857421875, 0.019313812255859375, 0.0335693359375, 0.047824859619140625, 0.06208038330078125, 0.07633590698242188, 0.0905914306640625, 0.10484695434570312, 0.11910247802734375, 0.13335800170898438, 0.147613525390625, 0.16186904907226562, 0.17612457275390625, 0.19038009643554688, 0.2046356201171875, 0.21889114379882812, 0.23314666748046875, 0.24740219116210938, 0.26165771484375, 0.2759132385253906, 0.29016876220703125, 0.3044242858886719, 0.3186798095703125, 0.3329353332519531, 0.34719085693359375, 0.3614463806152344, 0.375701904296875, 0.3899574279785156, 0.40421295166015625, 0.4184684753417969, 0.4327239990234375, 0.4469795227050781, 0.46123504638671875, 0.4754905700683594, 0.48974609375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 8.0, 12.0, 11.0, 8.0, 12.0, 28.0, 23.0, 33.0, 39.0, 52.0, 64.0, 86.0, 98.0, 96.0, 99.0, 81.0, 52.0, 50.0, 25.0, 22.0, 26.0, 19.0, 12.0, 8.0, 8.0, 4.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2491455078125, -0.2399768829345703, -0.23080825805664062, -0.22163963317871094, -0.21247100830078125, -0.20330238342285156, -0.19413375854492188, -0.1849651336669922, -0.1757965087890625, -0.1666278839111328, -0.15745925903320312, -0.14829063415527344, -0.13912200927734375, -0.12995338439941406, -0.12078475952148438, -0.11161613464355469, -0.102447509765625, -0.09327888488769531, -0.08411026000976562, -0.07494163513183594, -0.06577301025390625, -0.05660438537597656, -0.047435760498046875, -0.03826713562011719, -0.0290985107421875, -0.019929885864257812, -0.010761260986328125, -0.0015926361083984375, 0.00757598876953125, 0.016744613647460938, 0.025913238525390625, 0.03508186340332031, 0.04425048828125, 0.05341911315917969, 0.06258773803710938, 0.07175636291503906, 0.08092498779296875, 0.09009361267089844, 0.09926223754882812, 0.10843086242675781, 0.1175994873046875, 0.1267681121826172, 0.13593673706054688, 0.14510536193847656, 0.15427398681640625, 0.16344261169433594, 0.17261123657226562, 0.1817798614501953, 0.190948486328125, 0.2001171112060547, 0.20928573608398438, 0.21845436096191406, 0.22762298583984375, 0.23679161071777344, 0.24596023559570312, 0.2551288604736328, 0.2642974853515625, 0.2734661102294922, 0.2826347351074219, 0.29180335998535156, 0.30097198486328125, 0.31014060974121094, 0.3193092346191406, 0.3284778594970703, 0.337646484375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 24.0, 281.0, 579.0, 100.0, 18.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.96441650390625, -23.530237197875977, -23.09605598449707, -22.661876678466797, -22.227697372436523, -21.79351806640625, -21.359336853027344, -20.92515754699707, -20.490978240966797, -20.056798934936523, -19.622617721557617, -19.188438415527344, -18.75425910949707, -18.320079803466797, -17.88589859008789, -17.451719284057617, -17.017539978027344, -16.58336067199707, -16.149179458618164, -15.71500015258789, -15.280820846557617, -14.846640586853027, -14.412460327148438, -13.978281021118164, -13.544099807739258, -13.109919548034668, -12.675740242004395, -12.241559982299805, -11.807380676269531, -11.373200416564941, -10.939020156860352, -10.504840850830078, -10.070660591125488, -9.636480331420898, -9.202301025390625, -8.768120765686035, -8.333941459655762, -7.899761199951172, -7.46558141708374, -7.031401634216309, -6.597222328186035, -6.1630425453186035, -5.728862762451172, -5.294682502746582, -4.860503196716309, -4.426322937011719, -3.992143154144287, -3.5579633712768555, -3.1237833499908447, -2.689603567123413, -2.2554235458374023, -1.8212437629699707, -1.387063980102539, -0.9528841972351074, -0.5187041759490967, -0.08452439308166504, 0.3496553897857666, 0.783835232257843, 1.2180150747299194, 1.6521949768066406, 2.0863747596740723, 2.520554542541504, 2.9547345638275146, 3.3889143466949463, 3.823094129562378]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 4.0, 2.0, 11.0, 14.0, 11.0, 6.0, 10.0, 17.0, 19.0, 29.0, 39.0, 40.0, 42.0, 44.0, 44.0, 47.0, 49.0, 57.0, 55.0, 41.0, 48.0, 54.0, 42.0, 45.0, 42.0, 27.0, 24.0, 27.0, 18.0, 18.0, 11.0, 16.0, 13.0, 13.0, 6.0, 8.0, 1.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.730586051940918, -2.643235683441162, -2.5558853149414062, -2.4685347080230713, -2.3811843395233154, -2.2938339710235596, -2.2064836025238037, -2.1191329956054688, -2.031782627105713, -1.944432258605957, -1.8570817708969116, -1.7697314023971558, -1.6823809146881104, -1.5950305461883545, -1.5076801776885986, -1.4203296899795532, -1.3329793214797974, -1.2456289529800415, -1.158278465270996, -1.0709280967712402, -0.9835776090621948, -0.896227240562439, -0.8088768124580383, -0.7215263843536377, -0.6341759562492371, -0.5468255281448364, -0.4594751000404358, -0.37212470173835754, -0.2847742736339569, -0.19742384552955627, -0.11007344722747803, -0.022723019123077393, 0.06462740898132324, 0.15197783708572388, 0.23932825028896332, 0.32667866349220276, 0.4140290915966034, 0.5013794898986816, 0.5887299180030823, 0.6760803461074829, 0.7634307742118835, 0.8507812023162842, 0.9381316304206848, 1.0254820585250854, 1.1128324270248413, 1.2001829147338867, 1.2875332832336426, 1.3748836517333984, 1.4622341394424438, 1.5495845079421997, 1.6369349956512451, 1.724285364151001, 1.8116358518600464, 1.8989862203598022, 1.9863367080688477, 2.0736870765686035, 2.1610374450683594, 2.2483878135681152, 2.335738182067871, 2.423088788986206, 2.510439157485962, 2.5977895259857178, 2.6851398944854736, 2.7724905014038086, 2.8598408699035645]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 3.0, 6.0, 7.0, 4.0, 11.0, 14.0, 18.0, 24.0, 25.0, 40.0, 34.0, 80.0, 97.0, 184.0, 260.0, 464.0, 884.0, 1974.0, 4756.0, 16731.0, 205319.0, 3907735.0, 42825.0, 7859.0, 2621.0, 1090.0, 560.0, 256.0, 155.0, 89.0, 50.0, 38.0, 16.0, 16.0, 4.0, 8.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.96044921875, -0.937713623046875, -0.91497802734375, -0.892242431640625, -0.8695068359375, -0.846771240234375, -0.82403564453125, -0.801300048828125, -0.778564453125, -0.755828857421875, -0.73309326171875, -0.710357666015625, -0.6876220703125, -0.664886474609375, -0.64215087890625, -0.619415283203125, -0.5966796875, -0.573944091796875, -0.55120849609375, -0.528472900390625, -0.5057373046875, -0.483001708984375, -0.46026611328125, -0.437530517578125, -0.414794921875, -0.392059326171875, -0.36932373046875, -0.346588134765625, -0.3238525390625, -0.301116943359375, -0.27838134765625, -0.255645751953125, -0.23291015625, -0.210174560546875, -0.18743896484375, -0.164703369140625, -0.1419677734375, -0.119232177734375, -0.09649658203125, -0.073760986328125, -0.051025390625, -0.028289794921875, -0.00555419921875, 0.017181396484375, 0.0399169921875, 0.062652587890625, 0.08538818359375, 0.108123779296875, 0.130859375, 0.153594970703125, 0.17633056640625, 0.199066162109375, 0.2218017578125, 0.244537353515625, 0.26727294921875, 0.290008544921875, 0.312744140625, 0.335479736328125, 0.35821533203125, 0.380950927734375, 0.4036865234375, 0.426422119140625, 0.44915771484375, 0.471893310546875, 0.49462890625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 8.0, 11.0, 22.0, 28.0, 48.0, 100.0, 125.0, 108.0, 129.0, 124.0, 110.0, 74.0, 42.0, 20.0, 15.0, 8.0, 5.0, 5.0, 6.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2425537109375, -0.2369222640991211, -0.2312908172607422, -0.22565937042236328, -0.22002792358398438, -0.21439647674560547, -0.20876502990722656, -0.20313358306884766, -0.19750213623046875, -0.19187068939208984, -0.18623924255371094, -0.18060779571533203, -0.17497634887695312, -0.16934490203857422, -0.1637134552001953, -0.1580820083618164, -0.1524505615234375, -0.1468191146850586, -0.1411876678466797, -0.13555622100830078, -0.12992477416992188, -0.12429332733154297, -0.11866188049316406, -0.11303043365478516, -0.10739898681640625, -0.10176753997802734, -0.09613609313964844, -0.09050464630126953, -0.08487319946289062, -0.07924175262451172, -0.07361030578613281, -0.0679788589477539, -0.062347412109375, -0.056715965270996094, -0.05108451843261719, -0.04545307159423828, -0.039821624755859375, -0.03419017791748047, -0.028558731079101562, -0.022927284240722656, -0.01729583740234375, -0.011664390563964844, -0.0060329437255859375, -0.00040149688720703125, 0.005229949951171875, 0.010861396789550781, 0.016492843627929688, 0.022124290466308594, 0.0277557373046875, 0.033387184143066406, 0.03901863098144531, 0.04465007781982422, 0.050281524658203125, 0.05591297149658203, 0.06154441833496094, 0.06717586517333984, 0.07280731201171875, 0.07843875885009766, 0.08407020568847656, 0.08970165252685547, 0.09533309936523438, 0.10096454620361328, 0.10659599304199219, 0.1122274398803711, 0.11785888671875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 9.0, 6.0, 22.0, 24.0, 40.0, 71.0, 137.0, 390.0, 1757.0, 13020.0, 751975.0, 3406454.0, 17304.0, 2164.0, 473.0, 185.0, 98.0, 47.0, 38.0, 25.0, 20.0, 7.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91552734375, -0.8850784301757812, -0.8546295166015625, -0.8241806030273438, -0.793731689453125, -0.7632827758789062, -0.7328338623046875, -0.7023849487304688, -0.67193603515625, -0.6414871215820312, -0.6110382080078125, -0.5805892944335938, -0.550140380859375, -0.5196914672851562, -0.4892425537109375, -0.45879364013671875, -0.4283447265625, -0.39789581298828125, -0.3674468994140625, -0.33699798583984375, -0.306549072265625, -0.27610015869140625, -0.2456512451171875, -0.21520233154296875, -0.18475341796875, -0.15430450439453125, -0.1238555908203125, -0.09340667724609375, -0.062957763671875, -0.03250885009765625, -0.0020599365234375, 0.02838897705078125, 0.058837890625, 0.08928680419921875, 0.1197357177734375, 0.15018463134765625, 0.180633544921875, 0.21108245849609375, 0.2415313720703125, 0.27198028564453125, 0.30242919921875, 0.33287811279296875, 0.3633270263671875, 0.39377593994140625, 0.424224853515625, 0.45467376708984375, 0.4851226806640625, 0.5155715942382812, 0.5460205078125, 0.5764694213867188, 0.6069183349609375, 0.6373672485351562, 0.667816162109375, 0.6982650756835938, 0.7287139892578125, 0.7591629028320312, 0.78961181640625, 0.8200607299804688, 0.8505096435546875, 0.8809585571289062, 0.911407470703125, 0.9418563842773438, 0.9723052978515625, 1.0027542114257812, 1.033203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 4.0, 16.0, 20.0, 38.0, 51.0, 154.0, 469.0, 2445.0, 576.0, 158.0, 72.0, 31.0, 15.0, 11.0, 10.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.128173828125, -0.1208648681640625, -0.113555908203125, -0.1062469482421875, -0.09893798828125, -0.0916290283203125, -0.084320068359375, -0.0770111083984375, -0.0697021484375, -0.0623931884765625, -0.055084228515625, -0.0477752685546875, -0.04046630859375, -0.0331573486328125, -0.025848388671875, -0.0185394287109375, -0.01123046875, -0.0039215087890625, 0.003387451171875, 0.0106964111328125, 0.01800537109375, 0.0253143310546875, 0.032623291015625, 0.0399322509765625, 0.0472412109375, 0.0545501708984375, 0.061859130859375, 0.0691680908203125, 0.07647705078125, 0.0837860107421875, 0.091094970703125, 0.0984039306640625, 0.105712890625, 0.1130218505859375, 0.120330810546875, 0.1276397705078125, 0.13494873046875, 0.1422576904296875, 0.149566650390625, 0.1568756103515625, 0.1641845703125, 0.1714935302734375, 0.178802490234375, 0.1861114501953125, 0.19342041015625, 0.2007293701171875, 0.208038330078125, 0.2153472900390625, 0.22265625, 0.2299652099609375, 0.237274169921875, 0.2445831298828125, 0.25189208984375, 0.2592010498046875, 0.266510009765625, 0.2738189697265625, 0.2811279296875, 0.2884368896484375, 0.295745849609375, 0.3030548095703125, 0.31036376953125, 0.3176727294921875, 0.324981689453125, 0.3322906494140625, 0.339599609375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 24.0, 89.0, 263.0, 348.0, 200.0, 60.0, 12.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.3293261528015137, -2.2799885272979736, -2.2306509017944336, -2.1813132762908936, -2.1319756507873535, -2.0826382637023926, -2.0333006381988525, -1.9839630126953125, -1.9346253871917725, -1.8852877616882324, -1.8359501361846924, -1.786612629890442, -1.7372750043869019, -1.6879373788833618, -1.6385997533798218, -1.5892622470855713, -1.5399246215820312, -1.4905869960784912, -1.4412493705749512, -1.3919118642807007, -1.3425742387771606, -1.2932366132736206, -1.2438989877700806, -1.19456148147583, -1.1452237367630005, -1.0958861112594604, -1.0465484857559204, -0.9972109198570251, -0.9478733539581299, -0.8985357284545898, -0.8491981029510498, -0.7998605370521545, -0.7505229711532593, -0.7011853456497192, -0.651847779750824, -0.6025101542472839, -0.5531725883483887, -0.5038349628448486, -0.454497367143631, -0.40515977144241333, -0.3558221757411957, -0.306484580039978, -0.2571469843387604, -0.20780937373638153, -0.15847177803516388, -0.10913418233394623, -0.05979657173156738, -0.010458976030349731, 0.03887861967086792, 0.08821621537208557, 0.13755381107330322, 0.18689142167568207, 0.23622901737689972, 0.28556662797927856, 0.3349042236804962, 0.38424181938171387, 0.4335794150829315, 0.48291701078414917, 0.5322546362876892, 0.5815922021865845, 0.6309298276901245, 0.6802673935890198, 0.7296050190925598, 0.7789425849914551, 0.8282802104949951]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 4.0, 11.0, 11.0, 10.0, 24.0, 22.0, 39.0, 29.0, 31.0, 38.0, 45.0, 56.0, 62.0, 63.0, 69.0, 56.0, 57.0, 63.0, 52.0, 50.0, 32.0, 31.0, 40.0, 28.0, 20.0, 16.0, 11.0, 7.0, 9.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44090574979782104, -0.42397254705429077, -0.4070393443107605, -0.3901061415672302, -0.37317293882369995, -0.3562397360801697, -0.3393065333366394, -0.32237333059310913, -0.30544012784957886, -0.2885069251060486, -0.2715737223625183, -0.25464051961898804, -0.23770731687545776, -0.2207741141319275, -0.20384089648723602, -0.18690769374370575, -0.16997447609901428, -0.153041273355484, -0.13610807061195374, -0.11917486041784286, -0.10224165767431259, -0.08530845493078232, -0.06837524473667145, -0.051442041993141174, -0.0345088392496109, -0.017575634643435478, -0.0006424300372600555, 0.016290776431560516, 0.03322397917509079, 0.05015718191862106, 0.06709039211273193, 0.08402359485626221, 0.10095679759979248, 0.11789000034332275, 0.13482320308685303, 0.1517564058303833, 0.16868960857391357, 0.18562281131744385, 0.20255602896213531, 0.2194892317056656, 0.23642243444919586, 0.25335565209388733, 0.2702888548374176, 0.2872220575809479, 0.30415526032447815, 0.3210884630680084, 0.3380216658115387, 0.35495486855506897, 0.37188807129859924, 0.3888212740421295, 0.4057544767856598, 0.42268767952919006, 0.43962088227272034, 0.4565540850162506, 0.47348731756210327, 0.49042052030563354, 0.5073537230491638, 0.5242869257926941, 0.5412201285362244, 0.5581533312797546, 0.5750865340232849, 0.5920197367668152, 0.6089529395103455, 0.6258861422538757, 0.642819344997406]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 9.0, 5.0, 7.0, 11.0, 19.0, 25.0, 23.0, 43.0, 72.0, 102.0, 151.0, 227.0, 377.0, 670.0, 1513.0, 3905.0, 17382.0, 219267.0, 729979.0, 61697.0, 8224.0, 2400.0, 1037.0, 533.0, 300.0, 181.0, 113.0, 71.0, 55.0, 40.0, 26.0, 28.0, 19.0, 10.0, 12.0, 8.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87451171875, -0.8497238159179688, -0.8249359130859375, -0.8001480102539062, -0.775360107421875, -0.7505722045898438, -0.7257843017578125, -0.7009963989257812, -0.67620849609375, -0.6514205932617188, -0.6266326904296875, -0.6018447875976562, -0.577056884765625, -0.5522689819335938, -0.5274810791015625, -0.5026931762695312, -0.4779052734375, -0.45311737060546875, -0.4283294677734375, -0.40354156494140625, -0.378753662109375, -0.35396575927734375, -0.3291778564453125, -0.30438995361328125, -0.27960205078125, -0.25481414794921875, -0.2300262451171875, -0.20523834228515625, -0.180450439453125, -0.15566253662109375, -0.1308746337890625, -0.10608673095703125, -0.081298828125, -0.05651092529296875, -0.0317230224609375, -0.00693511962890625, 0.017852783203125, 0.04264068603515625, 0.0674285888671875, 0.09221649169921875, 0.11700439453125, 0.14179229736328125, 0.1665802001953125, 0.19136810302734375, 0.216156005859375, 0.24094390869140625, 0.2657318115234375, 0.29051971435546875, 0.3153076171875, 0.34009552001953125, 0.3648834228515625, 0.38967132568359375, 0.414459228515625, 0.43924713134765625, 0.4640350341796875, 0.48882293701171875, 0.51361083984375, 0.5383987426757812, 0.5631866455078125, 0.5879745483398438, 0.612762451171875, 0.6375503540039062, 0.6623382568359375, 0.6871261596679688, 0.7119140625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 6.0, 8.0, 18.0, 26.0, 46.0, 68.0, 114.0, 127.0, 124.0, 123.0, 120.0, 88.0, 58.0, 18.0, 17.0, 14.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2413330078125, -0.23565196990966797, -0.22997093200683594, -0.2242898941040039, -0.21860885620117188, -0.21292781829833984, -0.2072467803955078, -0.20156574249267578, -0.19588470458984375, -0.19020366668701172, -0.1845226287841797, -0.17884159088134766, -0.17316055297851562, -0.1674795150756836, -0.16179847717285156, -0.15611743927001953, -0.1504364013671875, -0.14475536346435547, -0.13907432556152344, -0.1333932876586914, -0.12771224975585938, -0.12203121185302734, -0.11635017395019531, -0.11066913604736328, -0.10498809814453125, -0.09930706024169922, -0.09362602233886719, -0.08794498443603516, -0.08226394653320312, -0.0765829086303711, -0.07090187072753906, -0.06522083282470703, -0.059539794921875, -0.05385875701904297, -0.04817771911621094, -0.042496681213378906, -0.036815643310546875, -0.031134605407714844, -0.025453567504882812, -0.01977252960205078, -0.01409149169921875, -0.008410453796386719, -0.0027294158935546875, 0.0029516220092773438, 0.008632659912109375, 0.014313697814941406, 0.019994735717773438, 0.02567577362060547, 0.0313568115234375, 0.03703784942626953, 0.04271888732910156, 0.048399925231933594, 0.054080963134765625, 0.059762001037597656, 0.06544303894042969, 0.07112407684326172, 0.07680511474609375, 0.08248615264892578, 0.08816719055175781, 0.09384822845458984, 0.09952926635742188, 0.1052103042602539, 0.11089134216308594, 0.11657238006591797, 0.12225341796875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 6.0, 6.0, 9.0, 11.0, 22.0, 18.0, 19.0, 35.0, 61.0, 77.0, 132.0, 169.0, 263.0, 408.0, 596.0, 1118.0, 2002.0, 3953.0, 8618.0, 22254.0, 64646.0, 199504.0, 397657.0, 227784.0, 74585.0, 25128.0, 9924.0, 4286.0, 2150.0, 1107.0, 678.0, 459.0, 283.0, 184.0, 132.0, 96.0, 42.0, 38.0, 28.0, 13.0, 10.0, 16.0, 8.0, 6.0, 1.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.317138671875, -0.30709075927734375, -0.2970428466796875, -0.28699493408203125, -0.276947021484375, -0.26689910888671875, -0.2568511962890625, -0.24680328369140625, -0.23675537109375, -0.22670745849609375, -0.2166595458984375, -0.20661163330078125, -0.196563720703125, -0.18651580810546875, -0.1764678955078125, -0.16641998291015625, -0.1563720703125, -0.14632415771484375, -0.1362762451171875, -0.12622833251953125, -0.116180419921875, -0.10613250732421875, -0.0960845947265625, -0.08603668212890625, -0.07598876953125, -0.06594085693359375, -0.0558929443359375, -0.04584503173828125, -0.035797119140625, -0.02574920654296875, -0.0157012939453125, -0.00565338134765625, 0.00439453125, 0.01444244384765625, 0.0244903564453125, 0.03453826904296875, 0.044586181640625, 0.05463409423828125, 0.0646820068359375, 0.07472991943359375, 0.08477783203125, 0.09482574462890625, 0.1048736572265625, 0.11492156982421875, 0.124969482421875, 0.13501739501953125, 0.1450653076171875, 0.15511322021484375, 0.1651611328125, 0.17520904541015625, 0.1852569580078125, 0.19530487060546875, 0.205352783203125, 0.21540069580078125, 0.2254486083984375, 0.23549652099609375, 0.24554443359375, 0.25559234619140625, 0.2656402587890625, 0.27568817138671875, 0.285736083984375, 0.29578399658203125, 0.3058319091796875, 0.31587982177734375, 0.325927734375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 8.0, 8.0, 13.0, 16.0, 25.0, 12.0, 16.0, 31.0, 35.0, 42.0, 39.0, 33.0, 50.0, 41.0, 44.0, 40.0, 53.0, 50.0, 49.0, 45.0, 36.0, 36.0, 31.0, 35.0, 28.0, 26.0, 25.0, 28.0, 15.0, 14.0, 10.0, 15.0, 7.0, 9.0, 5.0, 6.0, 5.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.421142578125, -0.40863037109375, -0.3961181640625, -0.38360595703125, -0.37109375, -0.35858154296875, -0.3460693359375, -0.33355712890625, -0.321044921875, -0.30853271484375, -0.2960205078125, -0.28350830078125, -0.27099609375, -0.25848388671875, -0.2459716796875, -0.23345947265625, -0.220947265625, -0.20843505859375, -0.1959228515625, -0.18341064453125, -0.1708984375, -0.15838623046875, -0.1458740234375, -0.13336181640625, -0.120849609375, -0.10833740234375, -0.0958251953125, -0.08331298828125, -0.07080078125, -0.05828857421875, -0.0457763671875, -0.03326416015625, -0.020751953125, -0.00823974609375, 0.0042724609375, 0.01678466796875, 0.029296875, 0.04180908203125, 0.0543212890625, 0.06683349609375, 0.079345703125, 0.09185791015625, 0.1043701171875, 0.11688232421875, 0.12939453125, 0.14190673828125, 0.1544189453125, 0.16693115234375, 0.179443359375, 0.19195556640625, 0.2044677734375, 0.21697998046875, 0.2294921875, 0.24200439453125, 0.2545166015625, 0.26702880859375, 0.279541015625, 0.29205322265625, 0.3045654296875, 0.31707763671875, 0.32958984375, 0.34210205078125, 0.3546142578125, 0.36712646484375, 0.379638671875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 0.0, 3.0, 10.0, 11.0, 12.0, 20.0, 36.0, 61.0, 100.0, 244.0, 532.0, 1320.0, 4833.0, 31489.0, 579885.0, 400982.0, 23018.0, 3939.0, 1132.0, 436.0, 237.0, 106.0, 56.0, 32.0, 19.0, 12.0, 8.0, 8.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.334716796875, -0.32513427734375, -0.3155517578125, -0.30596923828125, -0.29638671875, -0.28680419921875, -0.2772216796875, -0.26763916015625, -0.258056640625, -0.24847412109375, -0.2388916015625, -0.22930908203125, -0.2197265625, -0.21014404296875, -0.2005615234375, -0.19097900390625, -0.181396484375, -0.17181396484375, -0.1622314453125, -0.15264892578125, -0.14306640625, -0.13348388671875, -0.1239013671875, -0.11431884765625, -0.104736328125, -0.09515380859375, -0.0855712890625, -0.07598876953125, -0.06640625, -0.05682373046875, -0.0472412109375, -0.03765869140625, -0.028076171875, -0.01849365234375, -0.0089111328125, 0.00067138671875, 0.01025390625, 0.01983642578125, 0.0294189453125, 0.03900146484375, 0.048583984375, 0.05816650390625, 0.0677490234375, 0.07733154296875, 0.0869140625, 0.09649658203125, 0.1060791015625, 0.11566162109375, 0.125244140625, 0.13482666015625, 0.1444091796875, 0.15399169921875, 0.16357421875, 0.17315673828125, 0.1827392578125, 0.19232177734375, 0.201904296875, 0.21148681640625, 0.2210693359375, 0.23065185546875, 0.240234375, 0.24981689453125, 0.2593994140625, 0.26898193359375, 0.278564453125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 2.0, 7.0, 3.0, 8.0, 10.0, 15.0, 16.0, 14.0, 24.0, 19.0, 30.0, 45.0, 47.0, 62.0, 97.0, 120.0, 118.0, 73.0, 42.0, 40.0, 43.0, 21.0, 24.0, 20.0, 17.0, 15.0, 15.0, 8.0, 7.0, 10.0, 5.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012409687042236328, -0.000120529904961586, -0.00011696293950080872, -0.00011339597404003143, -0.00010982900857925415, -0.00010626204311847687, -0.00010269507765769958, -9.91281121969223e-05, -9.556114673614502e-05, -9.199418127536774e-05, -8.842721581459045e-05, -8.486025035381317e-05, -8.129328489303589e-05, -7.77263194322586e-05, -7.415935397148132e-05, -7.059238851070404e-05, -6.702542304992676e-05, -6.345845758914948e-05, -5.989149212837219e-05, -5.632452666759491e-05, -5.275756120681763e-05, -4.9190595746040344e-05, -4.562363028526306e-05, -4.205666482448578e-05, -3.8489699363708496e-05, -3.492273390293121e-05, -3.135576844215393e-05, -2.7788802981376648e-05, -2.4221837520599365e-05, -2.0654872059822083e-05, -1.70879065990448e-05, -1.3520941138267517e-05, -9.953975677490234e-06, -6.387010216712952e-06, -2.820044755935669e-06, 7.469207048416138e-07, 4.3138861656188965e-06, 7.88085162639618e-06, 1.1447817087173462e-05, 1.5014782547950745e-05, 1.8581748008728027e-05, 2.214871346950531e-05, 2.5715678930282593e-05, 2.9282644391059875e-05, 3.284960985183716e-05, 3.641657531261444e-05, 3.9983540773391724e-05, 4.3550506234169006e-05, 4.711747169494629e-05, 5.068443715572357e-05, 5.4251402616500854e-05, 5.781836807727814e-05, 6.138533353805542e-05, 6.49522989988327e-05, 6.851926445960999e-05, 7.208622992038727e-05, 7.565319538116455e-05, 7.922016084194183e-05, 8.278712630271912e-05, 8.63540917634964e-05, 8.992105722427368e-05, 9.348802268505096e-05, 9.705498814582825e-05, 0.00010062195360660553, 0.00010418891906738281]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 9.0, 19.0, 25.0, 36.0, 69.0, 106.0, 165.0, 278.0, 574.0, 1283.0, 4078.0, 20505.0, 217597.0, 715182.0, 74385.0, 9840.0, 2435.0, 963.0, 425.0, 254.0, 139.0, 65.0, 40.0, 24.0, 19.0, 7.0, 7.0, 8.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.32666015625, -0.3168487548828125, -0.307037353515625, -0.2972259521484375, -0.28741455078125, -0.2776031494140625, -0.267791748046875, -0.2579803466796875, -0.2481689453125, -0.2383575439453125, -0.228546142578125, -0.2187347412109375, -0.20892333984375, -0.1991119384765625, -0.189300537109375, -0.1794891357421875, -0.169677734375, -0.1598663330078125, -0.150054931640625, -0.1402435302734375, -0.13043212890625, -0.1206207275390625, -0.110809326171875, -0.1009979248046875, -0.0911865234375, -0.0813751220703125, -0.071563720703125, -0.0617523193359375, -0.05194091796875, -0.0421295166015625, -0.032318115234375, -0.0225067138671875, -0.0126953125, -0.0028839111328125, 0.006927490234375, 0.0167388916015625, 0.02655029296875, 0.0363616943359375, 0.046173095703125, 0.0559844970703125, 0.0657958984375, 0.0756072998046875, 0.085418701171875, 0.0952301025390625, 0.10504150390625, 0.1148529052734375, 0.124664306640625, 0.1344757080078125, 0.144287109375, 0.1540985107421875, 0.163909912109375, 0.1737213134765625, 0.18353271484375, 0.1933441162109375, 0.203155517578125, 0.2129669189453125, 0.2227783203125, 0.2325897216796875, 0.242401123046875, 0.2522125244140625, 0.26202392578125, 0.2718353271484375, 0.281646728515625, 0.2914581298828125, 0.30126953125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 11.0, 8.0, 13.0, 15.0, 28.0, 51.0, 62.0, 80.0, 101.0, 120.0, 131.0, 85.0, 86.0, 57.0, 51.0, 29.0, 26.0, 10.0, 11.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27294921875, -0.2631950378417969, -0.25344085693359375, -0.24368667602539062, -0.2339324951171875, -0.22417831420898438, -0.21442413330078125, -0.20466995239257812, -0.194915771484375, -0.18516159057617188, -0.17540740966796875, -0.16565322875976562, -0.1558990478515625, -0.14614486694335938, -0.13639068603515625, -0.12663650512695312, -0.11688232421875, -0.10712814331054688, -0.09737396240234375, -0.08761978149414062, -0.0778656005859375, -0.06811141967773438, -0.05835723876953125, -0.048603057861328125, -0.038848876953125, -0.029094696044921875, -0.01934051513671875, -0.009586334228515625, 0.0001678466796875, 0.009922027587890625, 0.01967620849609375, 0.029430389404296875, 0.0391845703125, 0.048938751220703125, 0.05869293212890625, 0.06844711303710938, 0.0782012939453125, 0.08795547485351562, 0.09770965576171875, 0.10746383666992188, 0.117218017578125, 0.12697219848632812, 0.13672637939453125, 0.14648056030273438, 0.1562347412109375, 0.16598892211914062, 0.17574310302734375, 0.18549728393554688, 0.19525146484375, 0.20500564575195312, 0.21475982666015625, 0.22451400756835938, 0.2342681884765625, 0.24402236938476562, 0.25377655029296875, 0.2635307312011719, 0.273284912109375, 0.2830390930175781, 0.29279327392578125, 0.3025474548339844, 0.3123016357421875, 0.3220558166503906, 0.33180999755859375, 0.3415641784667969, 0.351318359375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 8.0, 13.0, 86.0, 264.0, 383.0, 162.0, 55.0, 22.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.584945678710938, -10.360420227050781, -10.135893821716309, -9.911368370056152, -9.68684196472168, -9.462316513061523, -9.23779010772705, -9.013264656066895, -8.788738250732422, -8.564212799072266, -8.339686393737793, -8.115160942077637, -7.890634536743164, -7.666109085083008, -7.441583156585693, -7.217057228088379, -6.992531776428223, -6.768005847930908, -6.543479919433594, -6.318953990936279, -6.094428062438965, -5.869902610778809, -5.645376682281494, -5.42085075378418, -5.196324825286865, -4.971798896789551, -4.747272968292236, -4.522747039794922, -4.298221588134766, -4.073695182800293, -3.8491697311401367, -3.6246438026428223, -3.400117874145508, -3.1755919456481934, -2.951066017150879, -2.7265403270721436, -2.502014398574829, -2.2774884700775146, -2.0529627799987793, -1.8284368515014648, -1.6039109230041504, -1.379384994506836, -1.154859185218811, -0.9303333163261414, -0.7058074474334717, -0.4812815189361572, -0.2567557096481323, -0.03222990036010742, 0.19229602813720703, 0.4168218970298767, 0.6413477659225464, 0.8658736348152161, 1.0903995037078857, 1.3149254322052002, 1.539451241493225, 1.76397705078125, 1.9885029792785645, 2.213028907775879, 2.4375548362731934, 2.6620805263519287, 2.886606454849243, 3.1111323833465576, 3.335658073425293, 3.5601840019226074, 3.784709930419922]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 12.0, 12.0, 17.0, 19.0, 31.0, 34.0, 27.0, 46.0, 42.0, 60.0, 58.0, 47.0, 61.0, 65.0, 56.0, 52.0, 65.0, 53.0, 58.0, 45.0, 35.0, 19.0, 18.0, 20.0, 15.0, 12.0, 6.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.5222702026367188, -3.4272208213806152, -3.3321714401245117, -3.237122058868408, -3.1420726776123047, -3.0470235347747803, -2.9519741535186768, -2.8569247722625732, -2.7618753910064697, -2.666826009750366, -2.5717766284942627, -2.476727247238159, -2.3816781044006348, -2.2866287231445312, -2.1915793418884277, -2.096529960632324, -2.0014805793762207, -1.9064311981201172, -1.8113818168640137, -1.7163325548171997, -1.6212831735610962, -1.5262337923049927, -1.4311845302581787, -1.3361351490020752, -1.2410857677459717, -1.1460363864898682, -1.0509870052337646, -0.9559377431869507, -0.8608883619308472, -0.7658389806747437, -0.6707896590232849, -0.5757403373718262, -0.48069095611572266, -0.38564160466194153, -0.2905922532081604, -0.19554290175437927, -0.10049355030059814, -0.005444198846817017, 0.08960515260696411, 0.18465447425842285, 0.27970385551452637, 0.3747532069683075, 0.4698025584220886, 0.5648518800735474, 0.6599012613296509, 0.7549506425857544, 0.8499999642372131, 0.9450492858886719, 1.0400986671447754, 1.135148048400879, 1.2301974296569824, 1.3252466917037964, 1.4202960729599, 1.5153454542160034, 1.6103947162628174, 1.705444097518921, 1.8004934787750244, 1.895542860031128, 1.9905922412872314, 2.085641622543335, 2.1806907653808594, 2.275740146636963, 2.3707895278930664, 2.46583890914917, 2.5608882904052734]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 8.0, 11.0, 6.0, 4.0, 11.0, 18.0, 24.0, 37.0, 47.0, 71.0, 122.0, 172.0, 326.0, 545.0, 1210.0, 3305.0, 11330.0, 142948.0, 3973086.0, 50599.0, 6845.0, 2049.0, 775.0, 350.0, 142.0, 79.0, 50.0, 31.0, 25.0, 15.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.939453125, -0.9155731201171875, -0.891693115234375, -0.8678131103515625, -0.84393310546875, -0.8200531005859375, -0.796173095703125, -0.7722930908203125, -0.7484130859375, -0.7245330810546875, -0.700653076171875, -0.6767730712890625, -0.65289306640625, -0.6290130615234375, -0.605133056640625, -0.5812530517578125, -0.557373046875, -0.5334930419921875, -0.509613037109375, -0.4857330322265625, -0.46185302734375, -0.4379730224609375, -0.414093017578125, -0.3902130126953125, -0.3663330078125, -0.3424530029296875, -0.318572998046875, -0.2946929931640625, -0.27081298828125, -0.2469329833984375, -0.223052978515625, -0.1991729736328125, -0.17529296875, -0.1514129638671875, -0.127532958984375, -0.1036529541015625, -0.07977294921875, -0.0558929443359375, -0.032012939453125, -0.0081329345703125, 0.0157470703125, 0.0396270751953125, 0.063507080078125, 0.0873870849609375, 0.11126708984375, 0.1351470947265625, 0.159027099609375, 0.1829071044921875, 0.206787109375, 0.2306671142578125, 0.254547119140625, 0.2784271240234375, 0.30230712890625, 0.3261871337890625, 0.350067138671875, 0.3739471435546875, 0.3978271484375, 0.4217071533203125, 0.445587158203125, 0.4694671630859375, 0.49334716796875, 0.5172271728515625, 0.541107177734375, 0.5649871826171875, 0.5888671875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 6.0, 22.0, 32.0, 43.0, 68.0, 118.0, 133.0, 126.0, 127.0, 116.0, 85.0, 45.0, 21.0, 23.0, 10.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2408447265625, -0.23472976684570312, -0.22861480712890625, -0.22249984741210938, -0.2163848876953125, -0.21026992797851562, -0.20415496826171875, -0.19804000854492188, -0.191925048828125, -0.18581008911132812, -0.17969512939453125, -0.17358016967773438, -0.1674652099609375, -0.16135025024414062, -0.15523529052734375, -0.14912033081054688, -0.14300537109375, -0.13689041137695312, -0.13077545166015625, -0.12466049194335938, -0.1185455322265625, -0.11243057250976562, -0.10631561279296875, -0.10020065307617188, -0.094085693359375, -0.08797073364257812, -0.08185577392578125, -0.07574081420898438, -0.0696258544921875, -0.06351089477539062, -0.05739593505859375, -0.051280975341796875, -0.045166015625, -0.039051055908203125, -0.03293609619140625, -0.026821136474609375, -0.0207061767578125, -0.014591217041015625, -0.00847625732421875, -0.002361297607421875, 0.003753662109375, 0.009868621826171875, 0.01598358154296875, 0.022098541259765625, 0.0282135009765625, 0.034328460693359375, 0.04044342041015625, 0.046558380126953125, 0.05267333984375, 0.058788299560546875, 0.06490325927734375, 0.07101821899414062, 0.0771331787109375, 0.08324813842773438, 0.08936309814453125, 0.09547805786132812, 0.101593017578125, 0.10770797729492188, 0.11382293701171875, 0.11993789672851562, 0.1260528564453125, 0.13216781616210938, 0.13828277587890625, 0.14439773559570312, 0.1505126953125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 6.0, 15.0, 13.0, 27.0, 71.0, 124.0, 287.0, 744.0, 2497.0, 12892.0, 226868.0, 3901271.0, 42611.0, 4935.0, 1187.0, 418.0, 161.0, 61.0, 45.0, 16.0, 12.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67138671875, -0.6467742919921875, -0.622161865234375, -0.5975494384765625, -0.57293701171875, -0.5483245849609375, -0.523712158203125, -0.4990997314453125, -0.4744873046875, -0.4498748779296875, -0.425262451171875, -0.4006500244140625, -0.37603759765625, -0.3514251708984375, -0.326812744140625, -0.3022003173828125, -0.277587890625, -0.2529754638671875, -0.228363037109375, -0.2037506103515625, -0.17913818359375, -0.1545257568359375, -0.129913330078125, -0.1053009033203125, -0.0806884765625, -0.0560760498046875, -0.031463623046875, -0.0068511962890625, 0.01776123046875, 0.0423736572265625, 0.066986083984375, 0.0915985107421875, 0.1162109375, 0.1408233642578125, 0.165435791015625, 0.1900482177734375, 0.21466064453125, 0.2392730712890625, 0.263885498046875, 0.2884979248046875, 0.3131103515625, 0.3377227783203125, 0.362335205078125, 0.3869476318359375, 0.41156005859375, 0.4361724853515625, 0.460784912109375, 0.4853973388671875, 0.510009765625, 0.5346221923828125, 0.559234619140625, 0.5838470458984375, 0.60845947265625, 0.6330718994140625, 0.657684326171875, 0.6822967529296875, 0.7069091796875, 0.7315216064453125, 0.756134033203125, 0.7807464599609375, 0.80535888671875, 0.8299713134765625, 0.854583740234375, 0.8791961669921875, 0.90380859375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 11.0, 10.0, 16.0, 19.0, 28.0, 39.0, 61.0, 127.0, 229.0, 693.0, 1766.0, 617.0, 224.0, 90.0, 49.0, 35.0, 18.0, 12.0, 8.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.265380859375, -0.2584800720214844, -0.25157928466796875, -0.24467849731445312, -0.2377777099609375, -0.23087692260742188, -0.22397613525390625, -0.21707534790039062, -0.210174560546875, -0.20327377319335938, -0.19637298583984375, -0.18947219848632812, -0.1825714111328125, -0.17567062377929688, -0.16876983642578125, -0.16186904907226562, -0.15496826171875, -0.14806747436523438, -0.14116668701171875, -0.13426589965820312, -0.1273651123046875, -0.12046432495117188, -0.11356353759765625, -0.10666275024414062, -0.099761962890625, -0.09286117553710938, -0.08596038818359375, -0.07905960083007812, -0.0721588134765625, -0.06525802612304688, -0.05835723876953125, -0.051456451416015625, -0.0445556640625, -0.037654876708984375, -0.03075408935546875, -0.023853302001953125, -0.0169525146484375, -0.010051727294921875, -0.00315093994140625, 0.003749847412109375, 0.010650634765625, 0.017551422119140625, 0.02445220947265625, 0.031352996826171875, 0.0382537841796875, 0.045154571533203125, 0.05205535888671875, 0.058956146240234375, 0.06585693359375, 0.07275772094726562, 0.07965850830078125, 0.08655929565429688, 0.0934600830078125, 0.10036087036132812, 0.10726165771484375, 0.11416244506835938, 0.121063232421875, 0.12796401977539062, 0.13486480712890625, 0.14176559448242188, 0.1486663818359375, 0.15556716918945312, 0.16246795654296875, 0.16936874389648438, 0.17626953125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 13.0, 44.0, 163.0, 405.0, 275.0, 75.0, 22.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.51230525970459, -2.433605909347534, -2.3549063205718994, -2.2762069702148438, -2.197507619857788, -2.1188080310821533, -2.0401086807250977, -1.9614092111587524, -1.8827097415924072, -1.804010272026062, -1.7253109216690063, -1.6466114521026611, -1.567911982536316, -1.4892125129699707, -1.410513162612915, -1.3318136930465698, -1.2531143426895142, -1.174414873123169, -1.0957155227661133, -1.017016053199768, -0.9383165836334229, -0.8596171736717224, -0.780917763710022, -0.7022182941436768, -0.6235188841819763, -0.5448194742202759, -0.46612000465393066, -0.3874205946922302, -0.3087211549282074, -0.23002171516418457, -0.15132230520248413, -0.07262283563613892, 0.0060765743255615234, 0.08477600663900375, 0.16347543895244598, 0.24217486381530762, 0.32087430357933044, 0.39957374334335327, 0.4782731533050537, 0.5569726228713989, 0.6356720328330994, 0.7143714427947998, 0.793070912361145, 0.8717703223228455, 0.9504697322845459, 1.0291692018508911, 1.1078686714172363, 1.186568021774292, 1.2652674913406372, 1.3439669609069824, 1.422666311264038, 1.5013657808303833, 1.5800652503967285, 1.6587646007537842, 1.7374640703201294, 1.8161635398864746, 1.8948628902435303, 1.9735623598098755, 2.0522618293762207, 2.1309611797332764, 2.209660530090332, 2.288360118865967, 2.3670594692230225, 2.445758819580078, 2.524458408355713]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 11.0, 9.0, 20.0, 20.0, 22.0, 29.0, 28.0, 42.0, 47.0, 56.0, 70.0, 62.0, 62.0, 63.0, 46.0, 54.0, 49.0, 51.0, 50.0, 35.0, 33.0, 31.0, 35.0, 18.0, 10.0, 12.0, 9.0, 8.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5914614200592041, -0.5689360499382019, -0.5464107394218445, -0.5238853693008423, -0.5013599991798401, -0.4788346588611603, -0.45630931854248047, -0.43378394842147827, -0.41125860810279846, -0.38873326778411865, -0.36620789766311646, -0.34368255734443665, -0.32115721702575684, -0.29863184690475464, -0.27610650658607483, -0.253581166267395, -0.23105579614639282, -0.20853044092655182, -0.18600508570671082, -0.163479745388031, -0.14095439016819, -0.118429034948349, -0.09590369462966919, -0.07337833940982819, -0.05085298418998718, -0.028327632695436478, -0.005802281200885773, 0.016723066568374634, 0.03924842178821564, 0.06177377700805664, 0.08429911732673645, 0.10682447254657745, 0.12934982776641846, 0.15187518298625946, 0.17440053820610046, 0.19692587852478027, 0.21945123374462128, 0.24197658896446228, 0.2645019292831421, 0.2870272994041443, 0.3095526397228241, 0.3320779800415039, 0.3546033501625061, 0.3771286904811859, 0.3996540307998657, 0.4221794009208679, 0.44470474123954773, 0.46723008155822754, 0.48975545167922974, 0.5122808218002319, 0.5348061323165894, 0.5573315024375916, 0.5798568725585938, 0.6023821830749512, 0.6249075531959534, 0.6474329233169556, 0.669958233833313, 0.6924836039543152, 0.7150089144706726, 0.7375342845916748, 0.760059654712677, 0.7825850248336792, 0.8051103353500366, 0.8276357054710388, 0.850161075592041]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 8.0, 12.0, 10.0, 15.0, 24.0, 38.0, 43.0, 40.0, 73.0, 106.0, 185.0, 302.0, 452.0, 839.0, 1713.0, 4104.0, 15073.0, 124643.0, 745718.0, 131474.0, 15563.0, 4175.0, 1656.0, 882.0, 518.0, 272.0, 180.0, 123.0, 80.0, 55.0, 46.0, 26.0, 31.0, 17.0, 15.0, 9.0, 11.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.79052734375, -0.766937255859375, -0.74334716796875, -0.719757080078125, -0.6961669921875, -0.672576904296875, -0.64898681640625, -0.625396728515625, -0.601806640625, -0.578216552734375, -0.55462646484375, -0.531036376953125, -0.5074462890625, -0.483856201171875, -0.46026611328125, -0.436676025390625, -0.4130859375, -0.389495849609375, -0.36590576171875, -0.342315673828125, -0.3187255859375, -0.295135498046875, -0.27154541015625, -0.247955322265625, -0.224365234375, -0.200775146484375, -0.17718505859375, -0.153594970703125, -0.1300048828125, -0.106414794921875, -0.08282470703125, -0.059234619140625, -0.03564453125, -0.012054443359375, 0.01153564453125, 0.035125732421875, 0.0587158203125, 0.082305908203125, 0.10589599609375, 0.129486083984375, 0.153076171875, 0.176666259765625, 0.20025634765625, 0.223846435546875, 0.2474365234375, 0.271026611328125, 0.29461669921875, 0.318206787109375, 0.341796875, 0.365386962890625, 0.38897705078125, 0.412567138671875, 0.4361572265625, 0.459747314453125, 0.48333740234375, 0.506927490234375, 0.530517578125, 0.554107666015625, 0.57769775390625, 0.601287841796875, 0.6248779296875, 0.648468017578125, 0.67205810546875, 0.695648193359375, 0.71923828125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 15.0, 26.0, 35.0, 67.0, 95.0, 125.0, 134.0, 113.0, 119.0, 94.0, 79.0, 29.0, 19.0, 14.0, 10.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2215576171875, -0.2157001495361328, -0.20984268188476562, -0.20398521423339844, -0.19812774658203125, -0.19227027893066406, -0.18641281127929688, -0.1805553436279297, -0.1746978759765625, -0.1688404083251953, -0.16298294067382812, -0.15712547302246094, -0.15126800537109375, -0.14541053771972656, -0.13955307006835938, -0.1336956024169922, -0.127838134765625, -0.12198066711425781, -0.11612319946289062, -0.11026573181152344, -0.10440826416015625, -0.09855079650878906, -0.09269332885742188, -0.08683586120605469, -0.0809783935546875, -0.07512092590332031, -0.06926345825195312, -0.06340599060058594, -0.05754852294921875, -0.05169105529785156, -0.045833587646484375, -0.03997611999511719, -0.03411865234375, -0.028261184692382812, -0.022403717041015625, -0.016546249389648438, -0.01068878173828125, -0.0048313140869140625, 0.001026153564453125, 0.0068836212158203125, 0.0127410888671875, 0.018598556518554688, 0.024456024169921875, 0.030313491821289062, 0.03617095947265625, 0.04202842712402344, 0.047885894775390625, 0.05374336242675781, 0.059600830078125, 0.06545829772949219, 0.07131576538085938, 0.07717323303222656, 0.08303070068359375, 0.08888816833496094, 0.09474563598632812, 0.10060310363769531, 0.1064605712890625, 0.11231803894042969, 0.11817550659179688, 0.12403297424316406, 0.12989044189453125, 0.13574790954589844, 0.14160537719726562, 0.1474628448486328, 0.1533203125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 6.0, 7.0, 14.0, 14.0, 22.0, 28.0, 34.0, 48.0, 67.0, 110.0, 219.0, 265.0, 507.0, 927.0, 1904.0, 4249.0, 11113.0, 34791.0, 127296.0, 450105.0, 302259.0, 77641.0, 22781.0, 7800.0, 3119.0, 1398.0, 745.0, 379.0, 241.0, 156.0, 92.0, 65.0, 37.0, 22.0, 25.0, 23.0, 12.0, 11.0, 6.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.442138671875, -0.4290618896484375, -0.415985107421875, -0.4029083251953125, -0.38983154296875, -0.3767547607421875, -0.363677978515625, -0.3506011962890625, -0.3375244140625, -0.3244476318359375, -0.311370849609375, -0.2982940673828125, -0.28521728515625, -0.2721405029296875, -0.259063720703125, -0.2459869384765625, -0.23291015625, -0.2198333740234375, -0.206756591796875, -0.1936798095703125, -0.18060302734375, -0.1675262451171875, -0.154449462890625, -0.1413726806640625, -0.1282958984375, -0.1152191162109375, -0.102142333984375, -0.0890655517578125, -0.07598876953125, -0.0629119873046875, -0.049835205078125, -0.0367584228515625, -0.023681640625, -0.0106048583984375, 0.002471923828125, 0.0155487060546875, 0.02862548828125, 0.0417022705078125, 0.054779052734375, 0.0678558349609375, 0.0809326171875, 0.0940093994140625, 0.107086181640625, 0.1201629638671875, 0.13323974609375, 0.1463165283203125, 0.159393310546875, 0.1724700927734375, 0.185546875, 0.1986236572265625, 0.211700439453125, 0.2247772216796875, 0.23785400390625, 0.2509307861328125, 0.264007568359375, 0.2770843505859375, 0.2901611328125, 0.3032379150390625, 0.316314697265625, 0.3293914794921875, 0.34246826171875, 0.3555450439453125, 0.368621826171875, 0.3816986083984375, 0.394775390625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 5.0, 4.0, 7.0, 7.0, 9.0, 15.0, 13.0, 17.0, 16.0, 17.0, 32.0, 27.0, 37.0, 33.0, 42.0, 50.0, 43.0, 45.0, 50.0, 36.0, 49.0, 48.0, 42.0, 38.0, 50.0, 34.0, 32.0, 33.0, 22.0, 24.0, 19.0, 23.0, 16.0, 22.0, 10.0, 8.0, 11.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.434814453125, -0.4220771789550781, -0.40933990478515625, -0.3966026306152344, -0.3838653564453125, -0.3711280822753906, -0.35839080810546875, -0.3456535339355469, -0.332916259765625, -0.3201789855957031, -0.30744171142578125, -0.2947044372558594, -0.2819671630859375, -0.2692298889160156, -0.25649261474609375, -0.24375534057617188, -0.23101806640625, -0.21828079223632812, -0.20554351806640625, -0.19280624389648438, -0.1800689697265625, -0.16733169555664062, -0.15459442138671875, -0.14185714721679688, -0.129119873046875, -0.11638259887695312, -0.10364532470703125, -0.09090805053710938, -0.0781707763671875, -0.06543350219726562, -0.05269622802734375, -0.039958953857421875, -0.0272216796875, -0.014484405517578125, -0.00174713134765625, 0.010990142822265625, 0.0237274169921875, 0.036464691162109375, 0.04920196533203125, 0.061939239501953125, 0.074676513671875, 0.08741378784179688, 0.10015106201171875, 0.11288833618164062, 0.1256256103515625, 0.13836288452148438, 0.15110015869140625, 0.16383743286132812, 0.17657470703125, 0.18931198120117188, 0.20204925537109375, 0.21478652954101562, 0.2275238037109375, 0.24026107788085938, 0.25299835205078125, 0.2657356262207031, 0.278472900390625, 0.2912101745605469, 0.30394744873046875, 0.3166847229003906, 0.3294219970703125, 0.3421592712402344, 0.35489654541015625, 0.3676338195800781, 0.38037109375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 4.0, 14.0, 15.0, 25.0, 47.0, 96.0, 194.0, 502.0, 1401.0, 4795.0, 26651.0, 859439.0, 141161.0, 10187.0, 2578.0, 824.0, 326.0, 137.0, 67.0, 25.0, 15.0, 11.0, 10.0, 5.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4990234375, -0.4822540283203125, -0.465484619140625, -0.4487152099609375, -0.43194580078125, -0.4151763916015625, -0.398406982421875, -0.3816375732421875, -0.3648681640625, -0.3480987548828125, -0.331329345703125, -0.3145599365234375, -0.29779052734375, -0.2810211181640625, -0.264251708984375, -0.2474822998046875, -0.230712890625, -0.2139434814453125, -0.197174072265625, -0.1804046630859375, -0.16363525390625, -0.1468658447265625, -0.130096435546875, -0.1133270263671875, -0.0965576171875, -0.0797882080078125, -0.063018798828125, -0.0462493896484375, -0.02947998046875, -0.0127105712890625, 0.004058837890625, 0.0208282470703125, 0.03759765625, 0.0543670654296875, 0.071136474609375, 0.0879058837890625, 0.10467529296875, 0.1214447021484375, 0.138214111328125, 0.1549835205078125, 0.1717529296875, 0.1885223388671875, 0.205291748046875, 0.2220611572265625, 0.23883056640625, 0.2555999755859375, 0.272369384765625, 0.2891387939453125, 0.305908203125, 0.3226776123046875, 0.339447021484375, 0.3562164306640625, 0.37298583984375, 0.3897552490234375, 0.406524658203125, 0.4232940673828125, 0.4400634765625, 0.4568328857421875, 0.473602294921875, 0.4903717041015625, 0.50714111328125, 0.5239105224609375, 0.540679931640625, 0.5574493408203125, 0.57421875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 7.0, 9.0, 9.0, 12.0, 13.0, 13.0, 19.0, 23.0, 31.0, 42.0, 58.0, 95.0, 113.0, 124.0, 100.0, 86.0, 52.0, 50.0, 26.0, 22.0, 19.0, 12.0, 11.0, 11.0, 10.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001061558723449707, -0.0001029549166560173, -9.97539609670639e-05, -9.65530052781105e-05, -9.33520495891571e-05, -9.01510939002037e-05, -8.69501382112503e-05, -8.37491825222969e-05, -8.05482268333435e-05, -7.73472711443901e-05, -7.41463154554367e-05, -7.094535976648331e-05, -6.774440407752991e-05, -6.454344838857651e-05, -6.134249269962311e-05, -5.814153701066971e-05, -5.494058132171631e-05, -5.173962563276291e-05, -4.853866994380951e-05, -4.533771425485611e-05, -4.213675856590271e-05, -3.893580287694931e-05, -3.573484718799591e-05, -3.253389149904251e-05, -2.933293581008911e-05, -2.613198012113571e-05, -2.2931024432182312e-05, -1.9730068743228912e-05, -1.6529113054275513e-05, -1.3328157365322113e-05, -1.0127201676368713e-05, -6.926245987415314e-06, -3.725290298461914e-06, -5.243346095085144e-07, 2.6766210794448853e-06, 5.877576768398285e-06, 9.078532457351685e-06, 1.2279488146305084e-05, 1.5480443835258484e-05, 1.8681399524211884e-05, 2.1882355213165283e-05, 2.5083310902118683e-05, 2.8284266591072083e-05, 3.148522228002548e-05, 3.468617796897888e-05, 3.788713365793228e-05, 4.108808934688568e-05, 4.428904503583908e-05, 4.749000072479248e-05, 5.069095641374588e-05, 5.389191210269928e-05, 5.709286779165268e-05, 6.029382348060608e-05, 6.349477916955948e-05, 6.669573485851288e-05, 6.989669054746628e-05, 7.309764623641968e-05, 7.629860192537308e-05, 7.949955761432648e-05, 8.270051330327988e-05, 8.590146899223328e-05, 8.910242468118668e-05, 9.230338037014008e-05, 9.550433605909348e-05, 9.870529174804688e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 6.0, 5.0, 2.0, 6.0, 9.0, 3.0, 10.0, 15.0, 28.0, 28.0, 50.0, 83.0, 148.0, 242.0, 478.0, 879.0, 1873.0, 4548.0, 15518.0, 108740.0, 794635.0, 98444.0, 14677.0, 4438.0, 1758.0, 903.0, 425.0, 245.0, 131.0, 71.0, 49.0, 36.0, 21.0, 14.0, 11.0, 7.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.34619140625, -0.3351936340332031, -0.32419586181640625, -0.3131980895996094, -0.3022003173828125, -0.2912025451660156, -0.28020477294921875, -0.2692070007324219, -0.258209228515625, -0.24721145629882812, -0.23621368408203125, -0.22521591186523438, -0.2142181396484375, -0.20322036743164062, -0.19222259521484375, -0.18122482299804688, -0.17022705078125, -0.15922927856445312, -0.14823150634765625, -0.13723373413085938, -0.1262359619140625, -0.11523818969726562, -0.10424041748046875, -0.09324264526367188, -0.082244873046875, -0.07124710083007812, -0.06024932861328125, -0.049251556396484375, -0.0382537841796875, -0.027256011962890625, -0.01625823974609375, -0.005260467529296875, 0.0057373046875, 0.016735076904296875, 0.02773284912109375, 0.038730621337890625, 0.0497283935546875, 0.060726165771484375, 0.07172393798828125, 0.08272171020507812, 0.093719482421875, 0.10471725463867188, 0.11571502685546875, 0.12671279907226562, 0.1377105712890625, 0.14870834350585938, 0.15970611572265625, 0.17070388793945312, 0.18170166015625, 0.19269943237304688, 0.20369720458984375, 0.21469497680664062, 0.2256927490234375, 0.23669052124023438, 0.24768829345703125, 0.2586860656738281, 0.269683837890625, 0.2806816101074219, 0.29167938232421875, 0.3026771545410156, 0.3136749267578125, 0.3246726989746094, 0.33567047119140625, 0.3466682434082031, 0.357666015625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 4.0, 9.0, 23.0, 41.0, 53.0, 82.0, 168.0, 208.0, 159.0, 89.0, 63.0, 33.0, 18.0, 10.0, 6.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.43798828125, -0.42317962646484375, -0.4083709716796875, -0.39356231689453125, -0.378753662109375, -0.36394500732421875, -0.3491363525390625, -0.33432769775390625, -0.31951904296875, -0.30471038818359375, -0.2899017333984375, -0.27509307861328125, -0.260284423828125, -0.24547576904296875, -0.2306671142578125, -0.21585845947265625, -0.2010498046875, -0.18624114990234375, -0.1714324951171875, -0.15662384033203125, -0.141815185546875, -0.12700653076171875, -0.1121978759765625, -0.09738922119140625, -0.08258056640625, -0.06777191162109375, -0.0529632568359375, -0.03815460205078125, -0.023345947265625, -0.00853729248046875, 0.0062713623046875, 0.02108001708984375, 0.035888671875, 0.05069732666015625, 0.0655059814453125, 0.08031463623046875, 0.095123291015625, 0.10993194580078125, 0.1247406005859375, 0.13954925537109375, 0.15435791015625, 0.16916656494140625, 0.1839752197265625, 0.19878387451171875, 0.213592529296875, 0.22840118408203125, 0.2432098388671875, 0.25801849365234375, 0.2728271484375, 0.28763580322265625, 0.3024444580078125, 0.31725311279296875, 0.332061767578125, 0.34687042236328125, 0.3616790771484375, 0.37648773193359375, 0.39129638671875, 0.40610504150390625, 0.4209136962890625, 0.43572235107421875, 0.450531005859375, 0.46533966064453125, 0.4801483154296875, 0.49495697021484375, 0.509765625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 14.0, 67.0, 273.0, 434.0, 147.0, 51.0, 15.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.775846481323242, -7.489560127258301, -7.203273773193359, -6.916987895965576, -6.630701541900635, -6.344415187835693, -6.05812931060791, -5.771842956542969, -5.485556602478027, -5.199270248413086, -4.9129838943481445, -4.626698017120361, -4.34041166305542, -4.0541253089904785, -3.767839193344116, -3.481553077697754, -3.1952667236328125, -2.908980369567871, -2.622694253921509, -2.3364081382751465, -2.050121784210205, -1.7638355493545532, -1.4775493144989014, -1.191263198852539, -0.9049768447875977, -0.6186906099319458, -0.33240437507629395, -0.04611814022064209, 0.24016809463500977, 0.5264543294906616, 0.8127405643463135, 1.0990266799926758, 1.3853130340576172, 1.671599268913269, 1.957885503768921, 2.244171619415283, 2.5304579734802246, 2.816744327545166, 3.1030304431915283, 3.3893165588378906, 3.675602912902832, 3.9618892669677734, 4.248175621032715, 4.534461498260498, 4.8207478523254395, 5.107034206390381, 5.393320083618164, 5.6796064376831055, 5.965892791748047, 6.252179145812988, 6.53846549987793, 6.824751377105713, 7.111037731170654, 7.397324085235596, 7.683609962463379, 7.96989631652832, 8.256182670593262, 8.542469024658203, 8.828755378723145, 9.115041732788086, 9.401327133178711, 9.687613487243652, 9.973899841308594, 10.260186195373535, 10.546472549438477]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 5.0, 7.0, 5.0, 4.0, 6.0, 8.0, 8.0, 11.0, 16.0, 14.0, 22.0, 19.0, 15.0, 28.0, 27.0, 25.0, 38.0, 24.0, 35.0, 27.0, 51.0, 40.0, 31.0, 43.0, 39.0, 46.0, 38.0, 35.0, 40.0, 38.0, 36.0, 34.0, 30.0, 24.0, 24.0, 18.0, 15.0, 10.0, 8.0, 14.0, 11.0, 9.0, 6.0, 4.0, 9.0, 4.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.003347873687744, -1.9367088079452515, -1.8700697422027588, -1.8034306764602661, -1.7367916107177734, -1.6701526641845703, -1.6035135984420776, -1.536874532699585, -1.4702354669570923, -1.4035964012145996, -1.336957335472107, -1.2703182697296143, -1.2036793231964111, -1.137040138244629, -1.0704011917114258, -1.003762125968933, -0.9371230602264404, -0.8704839944839478, -0.8038449287414551, -0.7372059226036072, -0.6705668568611145, -0.6039277911186218, -0.5372887849807739, -0.47064971923828125, -0.4040106534957886, -0.3373715877532959, -0.2707325518131256, -0.20409350097179413, -0.13745445013046265, -0.07081538438796997, -0.004176348447799683, 0.062462687492370605, 0.12910175323486328, 0.19574080407619476, 0.26237985491752625, 0.32901889085769653, 0.3956579566001892, 0.4622970223426819, 0.5289360284805298, 0.5955750942230225, 0.6622141599655151, 0.7288532257080078, 0.7954922914505005, 0.8621312975883484, 0.9287703633308411, 0.9954094290733337, 1.0620484352111816, 1.1286875009536743, 1.195326566696167, 1.2619656324386597, 1.3286046981811523, 1.395243763923645, 1.4618828296661377, 1.5285217761993408, 1.5951608419418335, 1.6617999076843262, 1.7284389734268188, 1.7950780391693115, 1.8617171049118042, 1.9283561706542969, 1.9949951171875, 2.0616343021392822, 2.1282732486724854, 2.1949124336242676, 2.2615513801574707]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 8.0, 11.0, 13.0, 14.0, 17.0, 30.0, 39.0, 65.0, 91.0, 134.0, 251.0, 418.0, 799.0, 1760.0, 5085.0, 23163.0, 2460466.0, 1671044.0, 23183.0, 4617.0, 1621.0, 684.0, 330.0, 173.0, 95.0, 66.0, 28.0, 28.0, 16.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.8408203125, -0.8207969665527344, -0.8007736206054688, -0.7807502746582031, -0.7607269287109375, -0.7407035827636719, -0.7206802368164062, -0.7006568908691406, -0.680633544921875, -0.6606101989746094, -0.6405868530273438, -0.6205635070800781, -0.6005401611328125, -0.5805168151855469, -0.5604934692382812, -0.5404701232910156, -0.52044677734375, -0.5004234313964844, -0.48040008544921875, -0.4603767395019531, -0.4403533935546875, -0.4203300476074219, -0.40030670166015625, -0.3802833557128906, -0.360260009765625, -0.3402366638183594, -0.32021331787109375, -0.3001899719238281, -0.2801666259765625, -0.2601432800292969, -0.24011993408203125, -0.22009658813476562, -0.2000732421875, -0.18004989624023438, -0.16002655029296875, -0.14000320434570312, -0.1199798583984375, -0.09995651245117188, -0.07993316650390625, -0.059909820556640625, -0.039886474609375, -0.019863128662109375, 0.00016021728515625, 0.020183563232421875, 0.0402069091796875, 0.060230255126953125, 0.08025360107421875, 0.10027694702148438, 0.12030029296875, 0.14032363891601562, 0.16034698486328125, 0.18037033081054688, 0.2003936767578125, 0.22041702270507812, 0.24044036865234375, 0.2604637145996094, 0.280487060546875, 0.3005104064941406, 0.32053375244140625, 0.3405570983886719, 0.3605804443359375, 0.3806037902832031, 0.40062713623046875, 0.4206504821777344, 0.440673828125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 7.0, 9.0, 8.0, 22.0, 31.0, 26.0, 74.0, 106.0, 113.0, 117.0, 119.0, 98.0, 98.0, 60.0, 56.0, 17.0, 17.0, 7.0, 4.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2047119140625, -0.19882583618164062, -0.19293975830078125, -0.18705368041992188, -0.1811676025390625, -0.17528152465820312, -0.16939544677734375, -0.16350936889648438, -0.157623291015625, -0.15173721313476562, -0.14585113525390625, -0.13996505737304688, -0.1340789794921875, -0.12819290161132812, -0.12230682373046875, -0.11642074584960938, -0.11053466796875, -0.10464859008789062, -0.09876251220703125, -0.09287643432617188, -0.0869903564453125, -0.08110427856445312, -0.07521820068359375, -0.06933212280273438, -0.063446044921875, -0.057559967041015625, -0.05167388916015625, -0.045787811279296875, -0.0399017333984375, -0.034015655517578125, -0.02812957763671875, -0.022243499755859375, -0.016357421875, -0.010471343994140625, -0.00458526611328125, 0.001300811767578125, 0.0071868896484375, 0.013072967529296875, 0.01895904541015625, 0.024845123291015625, 0.030731201171875, 0.036617279052734375, 0.04250335693359375, 0.048389434814453125, 0.0542755126953125, 0.060161590576171875, 0.06604766845703125, 0.07193374633789062, 0.07781982421875, 0.08370590209960938, 0.08959197998046875, 0.09547805786132812, 0.1013641357421875, 0.10725021362304688, 0.11313629150390625, 0.11902236938476562, 0.124908447265625, 0.13079452514648438, 0.13668060302734375, 0.14256668090820312, 0.1484527587890625, 0.15433883666992188, 0.16022491455078125, 0.16611099243164062, 0.1719970703125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 3.0, 8.0, 14.0, 15.0, 30.0, 49.0, 100.0, 256.0, 575.0, 1550.0, 5347.0, 32150.0, 2414678.0, 1702405.0, 29566.0, 5164.0, 1431.0, 523.0, 226.0, 92.0, 53.0, 16.0, 10.0, 7.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.703125, -0.685089111328125, -0.66705322265625, -0.649017333984375, -0.6309814453125, -0.612945556640625, -0.59490966796875, -0.576873779296875, -0.558837890625, -0.540802001953125, -0.52276611328125, -0.504730224609375, -0.4866943359375, -0.468658447265625, -0.45062255859375, -0.432586669921875, -0.41455078125, -0.396514892578125, -0.37847900390625, -0.360443115234375, -0.3424072265625, -0.324371337890625, -0.30633544921875, -0.288299560546875, -0.270263671875, -0.252227783203125, -0.23419189453125, -0.216156005859375, -0.1981201171875, -0.180084228515625, -0.16204833984375, -0.144012451171875, -0.1259765625, -0.107940673828125, -0.08990478515625, -0.071868896484375, -0.0538330078125, -0.035797119140625, -0.01776123046875, 0.000274658203125, 0.018310546875, 0.036346435546875, 0.05438232421875, 0.072418212890625, 0.0904541015625, 0.108489990234375, 0.12652587890625, 0.144561767578125, 0.16259765625, 0.180633544921875, 0.19866943359375, 0.216705322265625, 0.2347412109375, 0.252777099609375, 0.27081298828125, 0.288848876953125, 0.306884765625, 0.324920654296875, 0.34295654296875, 0.360992431640625, 0.3790283203125, 0.397064208984375, 0.41510009765625, 0.433135986328125, 0.451171875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 8.0, 10.0, 6.0, 14.0, 17.0, 32.0, 34.0, 44.0, 80.0, 185.0, 499.0, 1601.0, 951.0, 303.0, 124.0, 54.0, 26.0, 29.0, 12.0, 11.0, 12.0, 3.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1436767578125, -0.1390094757080078, -0.13434219360351562, -0.12967491149902344, -0.12500762939453125, -0.12034034729003906, -0.11567306518554688, -0.11100578308105469, -0.1063385009765625, -0.10167121887207031, -0.09700393676757812, -0.09233665466308594, -0.08766937255859375, -0.08300209045410156, -0.07833480834960938, -0.07366752624511719, -0.069000244140625, -0.06433296203613281, -0.059665679931640625, -0.05499839782714844, -0.05033111572265625, -0.04566383361816406, -0.040996551513671875, -0.03632926940917969, -0.0316619873046875, -0.026994705200195312, -0.022327423095703125, -0.017660140991210938, -0.01299285888671875, -0.008325576782226562, -0.003658294677734375, 0.0010089874267578125, 0.00567626953125, 0.010343551635742188, 0.015010833740234375, 0.019678115844726562, 0.02434539794921875, 0.029012680053710938, 0.033679962158203125, 0.03834724426269531, 0.0430145263671875, 0.04768180847167969, 0.052349090576171875, 0.05701637268066406, 0.06168365478515625, 0.06635093688964844, 0.07101821899414062, 0.07568550109863281, 0.080352783203125, 0.08502006530761719, 0.08968734741210938, 0.09435462951660156, 0.09902191162109375, 0.10368919372558594, 0.10835647583007812, 0.11302375793457031, 0.1176910400390625, 0.12235832214355469, 0.12702560424804688, 0.13169288635253906, 0.13636016845703125, 0.14102745056152344, 0.14569473266601562, 0.1503620147705078, 0.155029296875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 5.0, 16.0, 20.0, 53.0, 73.0, 119.0, 170.0, 184.0, 162.0, 81.0, 55.0, 26.0, 14.0, 6.0, 4.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.856290340423584, -0.8283697366714478, -0.8004491329193115, -0.7725285291671753, -0.7446079254150391, -0.7166873216629028, -0.6887667179107666, -0.6608460545539856, -0.6329254508018494, -0.6050048470497131, -0.5770842432975769, -0.5491636395454407, -0.5212430357933044, -0.4933224022388458, -0.4654017984867096, -0.437481164932251, -0.40956059098243713, -0.3816399872303009, -0.3537193834781647, -0.32579874992370605, -0.2978781461715698, -0.2699575424194336, -0.24203693866729736, -0.21411632001399994, -0.1861957162618637, -0.15827511250972748, -0.13035449385643005, -0.10243389010429382, -0.074513278901577, -0.04659266769886017, -0.018672063946723938, 0.009248554706573486, 0.03716915845870972, 0.06508976966142654, 0.09301038086414337, 0.1209309846162796, 0.14885160326957703, 0.17677220702171326, 0.2046928107738495, 0.2326134294271469, 0.26053404808044434, 0.28845465183258057, 0.3163752555847168, 0.344295859336853, 0.37221649289131165, 0.4001370966434479, 0.4280577003955841, 0.4559783339500427, 0.48389890789985657, 0.5118195414543152, 0.5397401452064514, 0.5676607489585876, 0.5955813527107239, 0.6235019564628601, 0.6514225602149963, 0.6793431639671326, 0.7072637677192688, 0.735184371471405, 0.7631049752235413, 0.7910255789756775, 0.8189461827278137, 0.8468668460845947, 0.874787449836731, 0.9027080535888672, 0.9306286573410034]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 6.0, 3.0, 9.0, 18.0, 28.0, 22.0, 39.0, 40.0, 45.0, 37.0, 52.0, 55.0, 53.0, 56.0, 67.0, 64.0, 74.0, 55.0, 41.0, 38.0, 41.0, 40.0, 20.0, 22.0, 18.0, 18.0, 14.0, 10.0, 6.0, 7.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5382129549980164, -0.5204073190689087, -0.502601683139801, -0.48479604721069336, -0.4669904112815857, -0.449184775352478, -0.43137913942337036, -0.4135735034942627, -0.39576786756515503, -0.37796223163604736, -0.3601565957069397, -0.34235095977783203, -0.32454532384872437, -0.3067396879196167, -0.28893405199050903, -0.27112841606140137, -0.2533227801322937, -0.23551714420318604, -0.21771150827407837, -0.1999058723449707, -0.18210023641586304, -0.16429460048675537, -0.1464889645576477, -0.12868332862854004, -0.11087769269943237, -0.09307205677032471, -0.07526642084121704, -0.057460784912109375, -0.03965514898300171, -0.021849513053894043, -0.004043877124786377, 0.013761758804321289, 0.03156733512878418, 0.049372971057891846, 0.06717860698699951, 0.08498424291610718, 0.10278987884521484, 0.12059551477432251, 0.13840115070343018, 0.15620678663253784, 0.1740124225616455, 0.19181805849075317, 0.20962369441986084, 0.2274293303489685, 0.24523496627807617, 0.26304060220718384, 0.2808462381362915, 0.29865187406539917, 0.31645750999450684, 0.3342631459236145, 0.35206878185272217, 0.36987441778182983, 0.3876800537109375, 0.40548568964004517, 0.42329132556915283, 0.4410969614982605, 0.45890259742736816, 0.47670823335647583, 0.4945138692855835, 0.5123195052146912, 0.5301251411437988, 0.5479307770729065, 0.5657364130020142, 0.5835420489311218, 0.6013476848602295]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 7.0, 10.0, 18.0, 16.0, 22.0, 43.0, 44.0, 97.0, 126.0, 261.0, 407.0, 837.0, 1887.0, 5746.0, 31308.0, 494774.0, 473879.0, 29713.0, 5504.0, 1917.0, 821.0, 451.0, 253.0, 138.0, 96.0, 55.0, 46.0, 29.0, 14.0, 9.0, 8.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89599609375, -0.8679885864257812, -0.8399810791015625, -0.8119735717773438, -0.783966064453125, -0.7559585571289062, -0.7279510498046875, -0.6999435424804688, -0.67193603515625, -0.6439285278320312, -0.6159210205078125, -0.5879135131835938, -0.559906005859375, -0.5318984985351562, -0.5038909912109375, -0.47588348388671875, -0.4478759765625, -0.41986846923828125, -0.3918609619140625, -0.36385345458984375, -0.335845947265625, -0.30783843994140625, -0.2798309326171875, -0.25182342529296875, -0.22381591796875, -0.19580841064453125, -0.1678009033203125, -0.13979339599609375, -0.111785888671875, -0.08377838134765625, -0.0557708740234375, -0.02776336669921875, 0.000244140625, 0.02825164794921875, 0.0562591552734375, 0.08426666259765625, 0.112274169921875, 0.14028167724609375, 0.1682891845703125, 0.19629669189453125, 0.22430419921875, 0.25231170654296875, 0.2803192138671875, 0.30832672119140625, 0.336334228515625, 0.36434173583984375, 0.3923492431640625, 0.42035675048828125, 0.4483642578125, 0.47637176513671875, 0.5043792724609375, 0.5323867797851562, 0.560394287109375, 0.5884017944335938, 0.6164093017578125, 0.6444168090820312, 0.67242431640625, 0.7004318237304688, 0.7284393310546875, 0.7564468383789062, 0.784454345703125, 0.8124618530273438, 0.8404693603515625, 0.8684768676757812, 0.896484375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 9.0, 7.0, 10.0, 24.0, 28.0, 43.0, 68.0, 114.0, 125.0, 112.0, 113.0, 98.0, 83.0, 62.0, 48.0, 19.0, 15.0, 8.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.200927734375, -0.1951160430908203, -0.18930435180664062, -0.18349266052246094, -0.17768096923828125, -0.17186927795410156, -0.16605758666992188, -0.1602458953857422, -0.1544342041015625, -0.1486225128173828, -0.14281082153320312, -0.13699913024902344, -0.13118743896484375, -0.12537574768066406, -0.11956405639648438, -0.11375236511230469, -0.107940673828125, -0.10212898254394531, -0.09631729125976562, -0.09050559997558594, -0.08469390869140625, -0.07888221740722656, -0.07307052612304688, -0.06725883483886719, -0.0614471435546875, -0.05563545227050781, -0.049823760986328125, -0.04401206970214844, -0.03820037841796875, -0.03238868713378906, -0.026576995849609375, -0.020765304565429688, -0.01495361328125, -0.009141921997070312, -0.003330230712890625, 0.0024814605712890625, 0.00829315185546875, 0.014104843139648438, 0.019916534423828125, 0.025728225708007812, 0.0315399169921875, 0.03735160827636719, 0.043163299560546875, 0.04897499084472656, 0.05478668212890625, 0.06059837341308594, 0.06641006469726562, 0.07222175598144531, 0.078033447265625, 0.08384513854980469, 0.08965682983398438, 0.09546852111816406, 0.10128021240234375, 0.10709190368652344, 0.11290359497070312, 0.11871528625488281, 0.1245269775390625, 0.1303386688232422, 0.13615036010742188, 0.14196205139160156, 0.14777374267578125, 0.15358543395996094, 0.15939712524414062, 0.1652088165283203, 0.1710205078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 4.0, 5.0, 8.0, 19.0, 16.0, 27.0, 36.0, 43.0, 57.0, 87.0, 124.0, 167.0, 258.0, 350.0, 558.0, 847.0, 1424.0, 2541.0, 4704.0, 9531.0, 20049.0, 44897.0, 107053.0, 244265.0, 320629.0, 163189.0, 69107.0, 29906.0, 13477.0, 6598.0, 3501.0, 1832.0, 1151.0, 713.0, 453.0, 297.0, 182.0, 109.0, 82.0, 66.0, 46.0, 51.0, 26.0, 22.0, 12.0, 13.0, 7.0, 6.0, 9.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.2734375, -0.2652130126953125, -0.256988525390625, -0.2487640380859375, -0.24053955078125, -0.2323150634765625, -0.224090576171875, -0.2158660888671875, -0.2076416015625, -0.1994171142578125, -0.191192626953125, -0.1829681396484375, -0.17474365234375, -0.1665191650390625, -0.158294677734375, -0.1500701904296875, -0.141845703125, -0.1336212158203125, -0.125396728515625, -0.1171722412109375, -0.10894775390625, -0.1007232666015625, -0.092498779296875, -0.0842742919921875, -0.0760498046875, -0.0678253173828125, -0.059600830078125, -0.0513763427734375, -0.04315185546875, -0.0349273681640625, -0.026702880859375, -0.0184783935546875, -0.01025390625, -0.0020294189453125, 0.006195068359375, 0.0144195556640625, 0.02264404296875, 0.0308685302734375, 0.039093017578125, 0.0473175048828125, 0.0555419921875, 0.0637664794921875, 0.071990966796875, 0.0802154541015625, 0.08843994140625, 0.0966644287109375, 0.104888916015625, 0.1131134033203125, 0.121337890625, 0.1295623779296875, 0.137786865234375, 0.1460113525390625, 0.15423583984375, 0.1624603271484375, 0.170684814453125, 0.1789093017578125, 0.1871337890625, 0.1953582763671875, 0.203582763671875, 0.2118072509765625, 0.22003173828125, 0.2282562255859375, 0.236480712890625, 0.2447052001953125, 0.2529296875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 2.0, 3.0, 4.0, 3.0, 9.0, 11.0, 12.0, 16.0, 16.0, 22.0, 21.0, 23.0, 18.0, 33.0, 27.0, 34.0, 40.0, 37.0, 46.0, 43.0, 34.0, 45.0, 37.0, 57.0, 35.0, 35.0, 36.0, 37.0, 41.0, 38.0, 24.0, 15.0, 19.0, 27.0, 19.0, 13.0, 19.0, 8.0, 9.0, 4.0, 9.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.387939453125, -0.3761177062988281, -0.36429595947265625, -0.3524742126464844, -0.3406524658203125, -0.3288307189941406, -0.31700897216796875, -0.3051872253417969, -0.293365478515625, -0.2815437316894531, -0.26972198486328125, -0.2579002380371094, -0.2460784912109375, -0.23425674438476562, -0.22243499755859375, -0.21061325073242188, -0.19879150390625, -0.18696975708007812, -0.17514801025390625, -0.16332626342773438, -0.1515045166015625, -0.13968276977539062, -0.12786102294921875, -0.11603927612304688, -0.104217529296875, -0.09239578247070312, -0.08057403564453125, -0.06875228881835938, -0.0569305419921875, -0.045108795166015625, -0.03328704833984375, -0.021465301513671875, -0.0096435546875, 0.002178192138671875, 0.01399993896484375, 0.025821685791015625, 0.0376434326171875, 0.049465179443359375, 0.06128692626953125, 0.07310867309570312, 0.084930419921875, 0.09675216674804688, 0.10857391357421875, 0.12039566040039062, 0.1322174072265625, 0.14403915405273438, 0.15586090087890625, 0.16768264770507812, 0.17950439453125, 0.19132614135742188, 0.20314788818359375, 0.21496963500976562, 0.2267913818359375, 0.23861312866210938, 0.25043487548828125, 0.2622566223144531, 0.274078369140625, 0.2859001159667969, 0.29772186279296875, 0.3095436096191406, 0.3213653564453125, 0.3331871032714844, 0.34500885009765625, 0.3568305969238281, 0.36865234375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 8.0, 9.0, 5.0, 16.0, 35.0, 44.0, 65.0, 131.0, 242.0, 488.0, 983.0, 2409.0, 7462.0, 40318.0, 619894.0, 340885.0, 26191.0, 5680.0, 1947.0, 779.0, 432.0, 209.0, 121.0, 70.0, 39.0, 30.0, 15.0, 14.0, 6.0, 5.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.333251953125, -0.3231201171875, -0.31298828125, -0.3028564453125, -0.292724609375, -0.2825927734375, -0.2724609375, -0.2623291015625, -0.252197265625, -0.2420654296875, -0.23193359375, -0.2218017578125, -0.211669921875, -0.2015380859375, -0.19140625, -0.1812744140625, -0.171142578125, -0.1610107421875, -0.15087890625, -0.1407470703125, -0.130615234375, -0.1204833984375, -0.1103515625, -0.1002197265625, -0.090087890625, -0.0799560546875, -0.06982421875, -0.0596923828125, -0.049560546875, -0.0394287109375, -0.029296875, -0.0191650390625, -0.009033203125, 0.0010986328125, 0.01123046875, 0.0213623046875, 0.031494140625, 0.0416259765625, 0.0517578125, 0.0618896484375, 0.072021484375, 0.0821533203125, 0.09228515625, 0.1024169921875, 0.112548828125, 0.1226806640625, 0.1328125, 0.1429443359375, 0.153076171875, 0.1632080078125, 0.17333984375, 0.1834716796875, 0.193603515625, 0.2037353515625, 0.2138671875, 0.2239990234375, 0.234130859375, 0.2442626953125, 0.25439453125, 0.2645263671875, 0.274658203125, 0.2847900390625, 0.294921875, 0.3050537109375, 0.315185546875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 0.0, 4.0, 7.0, 10.0, 14.0, 17.0, 17.0, 22.0, 28.0, 34.0, 41.0, 52.0, 65.0, 79.0, 114.0, 105.0, 76.0, 54.0, 60.0, 34.0, 28.0, 20.0, 26.0, 22.0, 20.0, 9.0, 11.0, 10.0, 9.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010508298873901367, -0.00010134372860193253, -9.760446846485138e-05, -9.386520832777023e-05, -9.012594819068909e-05, -8.638668805360794e-05, -8.26474279165268e-05, -7.890816777944565e-05, -7.51689076423645e-05, -7.142964750528336e-05, -6.769038736820221e-05, -6.395112723112106e-05, -6.021186709403992e-05, -5.647260695695877e-05, -5.2733346819877625e-05, -4.899408668279648e-05, -4.525482654571533e-05, -4.1515566408634186e-05, -3.777630627155304e-05, -3.403704613447189e-05, -3.0297785997390747e-05, -2.65585258603096e-05, -2.2819265723228455e-05, -1.908000558614731e-05, -1.5340745449066162e-05, -1.1601485311985016e-05, -7.86222517490387e-06, -4.122965037822723e-06, -3.8370490074157715e-07, 3.355555236339569e-06, 7.094815373420715e-06, 1.0834075510501862e-05, 1.4573335647583008e-05, 1.8312595784664154e-05, 2.20518559217453e-05, 2.5791116058826447e-05, 2.9530376195907593e-05, 3.326963633298874e-05, 3.7008896470069885e-05, 4.074815660715103e-05, 4.448741674423218e-05, 4.8226676881313324e-05, 5.196593701839447e-05, 5.5705197155475616e-05, 5.944445729255676e-05, 6.318371742963791e-05, 6.692297756671906e-05, 7.06622377038002e-05, 7.440149784088135e-05, 7.81407579779625e-05, 8.188001811504364e-05, 8.561927825212479e-05, 8.935853838920593e-05, 9.309779852628708e-05, 9.683705866336823e-05, 0.00010057631880044937, 0.00010431557893753052, 0.00010805483907461166, 0.00011179409921169281, 0.00011553335934877396, 0.0001192726194858551, 0.00012301187962293625, 0.0001267511397600174, 0.00013049039989709854, 0.0001342296600341797]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 5.0, 12.0, 24.0, 30.0, 47.0, 85.0, 132.0, 272.0, 646.0, 1640.0, 5252.0, 21809.0, 194329.0, 739852.0, 68070.0, 11178.0, 3122.0, 1104.0, 470.0, 210.0, 98.0, 68.0, 31.0, 24.0, 14.0, 6.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.331298828125, -0.3199882507324219, -0.30867767333984375, -0.2973670959472656, -0.2860565185546875, -0.2747459411621094, -0.26343536376953125, -0.2521247863769531, -0.240814208984375, -0.22950363159179688, -0.21819305419921875, -0.20688247680664062, -0.1955718994140625, -0.18426132202148438, -0.17295074462890625, -0.16164016723632812, -0.15032958984375, -0.13901901245117188, -0.12770843505859375, -0.11639785766601562, -0.1050872802734375, -0.09377670288085938, -0.08246612548828125, -0.07115554809570312, -0.059844970703125, -0.048534393310546875, -0.03722381591796875, -0.025913238525390625, -0.0146026611328125, -0.003292083740234375, 0.00801849365234375, 0.019329071044921875, 0.0306396484375, 0.041950225830078125, 0.05326080322265625, 0.06457138061523438, 0.0758819580078125, 0.08719253540039062, 0.09850311279296875, 0.10981369018554688, 0.121124267578125, 0.13243484497070312, 0.14374542236328125, 0.15505599975585938, 0.1663665771484375, 0.17767715454101562, 0.18898773193359375, 0.20029830932617188, 0.21160888671875, 0.22291946411132812, 0.23423004150390625, 0.24554061889648438, 0.2568511962890625, 0.2681617736816406, 0.27947235107421875, 0.2907829284667969, 0.302093505859375, 0.3134040832519531, 0.32471466064453125, 0.3360252380371094, 0.3473358154296875, 0.3586463928222656, 0.36995697021484375, 0.3812675476074219, 0.392578125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 6.0, 0.0, 5.0, 5.0, 10.0, 11.0, 14.0, 29.0, 27.0, 27.0, 52.0, 62.0, 73.0, 98.0, 119.0, 118.0, 74.0, 55.0, 53.0, 38.0, 22.0, 16.0, 16.0, 16.0, 8.0, 7.0, 5.0, 3.0, 5.0, 6.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2379150390625, -0.22928810119628906, -0.22066116333007812, -0.2120342254638672, -0.20340728759765625, -0.1947803497314453, -0.18615341186523438, -0.17752647399902344, -0.1688995361328125, -0.16027259826660156, -0.15164566040039062, -0.1430187225341797, -0.13439178466796875, -0.1257648468017578, -0.11713790893554688, -0.10851097106933594, -0.099884033203125, -0.09125709533691406, -0.08263015747070312, -0.07400321960449219, -0.06537628173828125, -0.05674934387207031, -0.048122406005859375, -0.03949546813964844, -0.0308685302734375, -0.022241592407226562, -0.013614654541015625, -0.0049877166748046875, 0.00363922119140625, 0.012266159057617188, 0.020893096923828125, 0.029520034790039062, 0.03814697265625, 0.04677391052246094, 0.055400848388671875, 0.06402778625488281, 0.07265472412109375, 0.08128166198730469, 0.08990859985351562, 0.09853553771972656, 0.1071624755859375, 0.11578941345214844, 0.12441635131835938, 0.1330432891845703, 0.14167022705078125, 0.1502971649169922, 0.15892410278320312, 0.16755104064941406, 0.176177978515625, 0.18480491638183594, 0.19343185424804688, 0.2020587921142578, 0.21068572998046875, 0.2193126678466797, 0.22793960571289062, 0.23656654357910156, 0.2451934814453125, 0.25382041931152344, 0.2624473571777344, 0.2710742950439453, 0.27970123291015625, 0.2883281707763672, 0.2969551086425781, 0.30558204650878906, 0.314208984375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 10.0, 30.0, 69.0, 168.0, 265.0, 203.0, 132.0, 69.0, 20.0, 15.0, 11.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.605701446533203, -6.420915126800537, -6.236128807067871, -6.051342487335205, -5.866556167602539, -5.681770324707031, -5.496984004974365, -5.312197685241699, -5.127411365509033, -4.942625045776367, -4.757838726043701, -4.573052406311035, -4.388266563415527, -4.203480243682861, -4.018693923950195, -3.8339076042175293, -3.6491212844848633, -3.4643349647521973, -3.2795486450195312, -3.0947625637054443, -2.9099762439727783, -2.7251899242401123, -2.5404038429260254, -2.3556175231933594, -2.1708312034606934, -1.9860448837280273, -1.8012586832046509, -1.6164724826812744, -1.4316861629486084, -1.2468998432159424, -1.062113642692566, -0.8773274421691895, -0.6925411224365234, -0.5077548623085022, -0.32296860218048096, -0.13818234205245972, 0.04660391807556152, 0.23139017820358276, 0.416176438331604, 0.6009626388549805, 0.7857489585876465, 0.9705352187156677, 1.155321478843689, 1.3401076793670654, 1.5248939990997314, 1.7096803188323975, 1.894466519355774, 2.0792527198791504, 2.2640390396118164, 2.4488253593444824, 2.6336116790771484, 2.8183977603912354, 3.0031840801239014, 3.1879703998565674, 3.3727564811706543, 3.5575428009033203, 3.7423291206359863, 3.9271154403686523, 4.111901760101318, 4.296688079833984, 4.481473922729492, 4.666260242462158, 4.851046562194824, 5.03583288192749, 5.220619201660156]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 5.0, 6.0, 2.0, 12.0, 14.0, 13.0, 18.0, 12.0, 16.0, 10.0, 30.0, 24.0, 31.0, 45.0, 34.0, 29.0, 25.0, 34.0, 35.0, 41.0, 43.0, 44.0, 52.0, 50.0, 45.0, 47.0, 42.0, 32.0, 24.0, 25.0, 14.0, 24.0, 17.0, 23.0, 17.0, 16.0, 8.0, 8.0, 8.0, 4.0, 4.0, 6.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.5272819995880127, -2.450314521789551, -2.373347043991089, -2.296379566192627, -2.219412326812744, -2.1424448490142822, -2.0654773712158203, -1.9885098934173584, -1.9115424156188965, -1.8345749378204346, -1.7576075792312622, -1.6806401014328003, -1.6036726236343384, -1.526705265045166, -1.449737787246704, -1.3727703094482422, -1.2958029508590698, -1.218835473060608, -1.1418681144714355, -1.0649006366729736, -0.9879331588745117, -0.9109657406806946, -0.8339983224868774, -0.7570308446884155, -0.6800634264945984, -0.6030960083007812, -0.5261285305023193, -0.4491611123085022, -0.37219366431236267, -0.29522621631622314, -0.218258798122406, -0.1412913203239441, -0.06432390213012695, 0.012643538415431976, 0.0896109789609909, 0.16657841205596924, 0.24354586005210876, 0.3205133080482483, 0.39748072624206543, 0.47444820404052734, 0.5514156222343445, 0.6283830404281616, 0.7053505182266235, 0.7823179364204407, 0.8592853546142578, 0.9362528324127197, 1.0132203102111816, 1.0901877880096436, 1.167155146598816, 1.2441226243972778, 1.3210899829864502, 1.398057460784912, 1.475024938583374, 1.551992416381836, 1.6289597749710083, 1.7059272527694702, 1.7828946113586426, 1.8598620891571045, 1.9368294477462769, 2.013796806335449, 2.090764284133911, 2.167731761932373, 2.244699239730835, 2.321666717529297, 2.398634195327759]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 6.0, 4.0, 6.0, 7.0, 7.0, 8.0, 13.0, 22.0, 24.0, 36.0, 50.0, 78.0, 90.0, 135.0, 215.0, 347.0, 586.0, 1099.0, 2250.0, 5237.0, 17048.0, 108258.0, 3815733.0, 207743.0, 23667.0, 6447.0, 2551.0, 1222.0, 598.0, 297.0, 174.0, 102.0, 75.0, 46.0, 32.0, 20.0, 14.0, 10.0, 7.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47802734375, -0.4642143249511719, -0.45040130615234375, -0.4365882873535156, -0.4227752685546875, -0.4089622497558594, -0.39514923095703125, -0.3813362121582031, -0.367523193359375, -0.3537101745605469, -0.33989715576171875, -0.3260841369628906, -0.3122711181640625, -0.2984580993652344, -0.28464508056640625, -0.2708320617675781, -0.25701904296875, -0.24320602416992188, -0.22939300537109375, -0.21557998657226562, -0.2017669677734375, -0.18795394897460938, -0.17414093017578125, -0.16032791137695312, -0.146514892578125, -0.13270187377929688, -0.11888885498046875, -0.10507583618164062, -0.0912628173828125, -0.07744979858398438, -0.06363677978515625, -0.049823760986328125, -0.0360107421875, -0.022197723388671875, -0.00838470458984375, 0.005428314208984375, 0.0192413330078125, 0.033054351806640625, 0.04686737060546875, 0.060680389404296875, 0.074493408203125, 0.08830642700195312, 0.10211944580078125, 0.11593246459960938, 0.1297454833984375, 0.14355850219726562, 0.15737152099609375, 0.17118453979492188, 0.18499755859375, 0.19881057739257812, 0.21262359619140625, 0.22643661499023438, 0.2402496337890625, 0.2540626525878906, 0.26787567138671875, 0.2816886901855469, 0.295501708984375, 0.3093147277832031, 0.32312774658203125, 0.3369407653808594, 0.3507537841796875, 0.3645668029785156, 0.37837982177734375, 0.3921928405761719, 0.406005859375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 6.0, 14.0, 14.0, 18.0, 26.0, 31.0, 62.0, 105.0, 99.0, 105.0, 116.0, 104.0, 67.0, 78.0, 52.0, 29.0, 28.0, 24.0, 6.0, 3.0, 7.0, 0.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.199462890625, -0.19361114501953125, -0.1877593994140625, -0.18190765380859375, -0.176055908203125, -0.17020416259765625, -0.1643524169921875, -0.15850067138671875, -0.15264892578125, -0.14679718017578125, -0.1409454345703125, -0.13509368896484375, -0.129241943359375, -0.12339019775390625, -0.1175384521484375, -0.11168670654296875, -0.1058349609375, -0.09998321533203125, -0.0941314697265625, -0.08827972412109375, -0.082427978515625, -0.07657623291015625, -0.0707244873046875, -0.06487274169921875, -0.05902099609375, -0.05316925048828125, -0.0473175048828125, -0.04146575927734375, -0.035614013671875, -0.02976226806640625, -0.0239105224609375, -0.01805877685546875, -0.01220703125, -0.00635528564453125, -0.0005035400390625, 0.00534820556640625, 0.011199951171875, 0.01705169677734375, 0.0229034423828125, 0.02875518798828125, 0.03460693359375, 0.04045867919921875, 0.0463104248046875, 0.05216217041015625, 0.058013916015625, 0.06386566162109375, 0.0697174072265625, 0.07556915283203125, 0.0814208984375, 0.08727264404296875, 0.0931243896484375, 0.09897613525390625, 0.104827880859375, 0.11067962646484375, 0.1165313720703125, 0.12238311767578125, 0.12823486328125, 0.13408660888671875, 0.1399383544921875, 0.14579010009765625, 0.151641845703125, 0.15749359130859375, 0.1633453369140625, 0.16919708251953125, 0.175048828125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 13.0, 18.0, 44.0, 76.0, 142.0, 287.0, 607.0, 1702.0, 5340.0, 23075.0, 258867.0, 3787604.0, 96602.0, 13999.0, 3648.0, 1289.0, 524.0, 218.0, 103.0, 55.0, 31.0, 16.0, 13.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57080078125, -0.5541801452636719, -0.5375595092773438, -0.5209388732910156, -0.5043182373046875, -0.4876976013183594, -0.47107696533203125, -0.4544563293457031, -0.437835693359375, -0.4212150573730469, -0.40459442138671875, -0.3879737854003906, -0.3713531494140625, -0.3547325134277344, -0.33811187744140625, -0.3214912414550781, -0.30487060546875, -0.2882499694824219, -0.27162933349609375, -0.2550086975097656, -0.2383880615234375, -0.22176742553710938, -0.20514678955078125, -0.18852615356445312, -0.171905517578125, -0.15528488159179688, -0.13866424560546875, -0.12204360961914062, -0.1054229736328125, -0.08880233764648438, -0.07218170166015625, -0.055561065673828125, -0.0389404296875, -0.022319793701171875, -0.00569915771484375, 0.010921478271484375, 0.0275421142578125, 0.044162750244140625, 0.06078338623046875, 0.07740402221679688, 0.094024658203125, 0.11064529418945312, 0.12726593017578125, 0.14388656616210938, 0.1605072021484375, 0.17712783813476562, 0.19374847412109375, 0.21036911010742188, 0.22698974609375, 0.24361038208007812, 0.26023101806640625, 0.2768516540527344, 0.2934722900390625, 0.3100929260253906, 0.32671356201171875, 0.3433341979980469, 0.359954833984375, 0.3765754699707031, 0.39319610595703125, 0.4098167419433594, 0.4264373779296875, 0.4430580139160156, 0.45967864990234375, 0.4762992858886719, 0.492919921875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 10.0, 21.0, 23.0, 30.0, 54.0, 99.0, 235.0, 919.0, 1868.0, 461.0, 145.0, 72.0, 40.0, 24.0, 14.0, 17.0, 11.0, 8.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.253173828125, -0.24578475952148438, -0.23839569091796875, -0.23100662231445312, -0.2236175537109375, -0.21622848510742188, -0.20883941650390625, -0.20145034790039062, -0.194061279296875, -0.18667221069335938, -0.17928314208984375, -0.17189407348632812, -0.1645050048828125, -0.15711593627929688, -0.14972686767578125, -0.14233779907226562, -0.13494873046875, -0.12755966186523438, -0.12017059326171875, -0.11278152465820312, -0.1053924560546875, -0.09800338745117188, -0.09061431884765625, -0.08322525024414062, -0.075836181640625, -0.06844711303710938, -0.06105804443359375, -0.053668975830078125, -0.0462799072265625, -0.038890838623046875, -0.03150177001953125, -0.024112701416015625, -0.0167236328125, -0.009334564208984375, -0.00194549560546875, 0.005443572998046875, 0.0128326416015625, 0.020221710205078125, 0.02761077880859375, 0.034999847412109375, 0.042388916015625, 0.049777984619140625, 0.05716705322265625, 0.06455612182617188, 0.0719451904296875, 0.07933425903320312, 0.08672332763671875, 0.09411239624023438, 0.10150146484375, 0.10889053344726562, 0.11627960205078125, 0.12366867065429688, 0.1310577392578125, 0.13844680786132812, 0.14583587646484375, 0.15322494506835938, 0.160614013671875, 0.16800308227539062, 0.17539215087890625, 0.18278121948242188, 0.1901702880859375, 0.19755935668945312, 0.20494842529296875, 0.21233749389648438, 0.2197265625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 2.0, 5.0, 14.0, 46.0, 100.0, 169.0, 213.0, 208.0, 132.0, 67.0, 27.0, 7.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8922836780548096, -0.8475372195243835, -0.8027907013893127, -0.7580442428588867, -0.7132977247238159, -0.6685512661933899, -0.6238048076629639, -0.5790582895278931, -0.534311830997467, -0.48956534266471863, -0.4448188543319702, -0.4000723958015442, -0.3553259074687958, -0.31057941913604736, -0.26583296060562134, -0.22108647227287292, -0.1763399839401245, -0.1315934956073761, -0.08684702217578888, -0.04210054874420166, 0.002645939588546753, 0.047392427921295166, 0.09213888645172119, 0.1368853747844696, 0.18163186311721802, 0.22637835144996643, 0.27112483978271484, 0.31587129831314087, 0.3606177866458893, 0.4053642749786377, 0.4501107335090637, 0.49485722184181213, 0.5396037101745605, 0.5843501687049866, 0.6290966868400574, 0.6738431453704834, 0.7185896635055542, 0.7633361220359802, 0.8080825805664062, 0.852829098701477, 0.8975755572319031, 0.9423220157623291, 0.9870685338973999, 1.0318150520324707, 1.076561450958252, 1.1213079690933228, 1.1660544872283936, 1.2108008861541748, 1.2555474042892456, 1.3002939224243164, 1.3450403213500977, 1.3897868394851685, 1.4345333576202393, 1.4792797565460205, 1.5240262746810913, 1.568772792816162, 1.6135191917419434, 1.6582657098770142, 1.7030121088027954, 1.7477586269378662, 1.792505145072937, 1.8372516632080078, 1.881998062133789, 1.9267445802688599, 1.9714910984039307]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 9.0, 14.0, 14.0, 10.0, 26.0, 17.0, 29.0, 35.0, 31.0, 39.0, 36.0, 33.0, 42.0, 52.0, 43.0, 43.0, 49.0, 50.0, 48.0, 50.0, 57.0, 49.0, 37.0, 33.0, 15.0, 19.0, 28.0, 20.0, 11.0, 10.0, 10.0, 5.0, 11.0, 3.0, 9.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5624531507492065, -0.5436984896659851, -0.5249438285827637, -0.5061891674995422, -0.4874345064163208, -0.46867984533309937, -0.44992515444755554, -0.4311704933643341, -0.41241583228111267, -0.39366117119789124, -0.3749065101146698, -0.35615184903144836, -0.33739715814590454, -0.3186424970626831, -0.29988783597946167, -0.28113317489624023, -0.2623785138130188, -0.24362385272979736, -0.22486919164657593, -0.2061145156621933, -0.18735985457897186, -0.16860519349575043, -0.1498505175113678, -0.13109585642814636, -0.11234119534492493, -0.09358653426170349, -0.07483186572790146, -0.056077200919389725, -0.03732253611087799, -0.018567875027656555, 0.0001867935061454773, 0.01894146203994751, 0.037696123123168945, 0.05645078793168068, 0.07520545274019241, 0.09396012127399445, 0.11271478235721588, 0.13146944344043732, 0.15022411942481995, 0.16897878050804138, 0.18773344159126282, 0.20648810267448425, 0.2252427637577057, 0.24399743974208832, 0.26275211572647095, 0.2815067768096924, 0.3002614378929138, 0.31901609897613525, 0.3377707600593567, 0.3565254211425781, 0.37528008222579956, 0.394034743309021, 0.41278940439224243, 0.43154406547546387, 0.4502987563610077, 0.4690534174442291, 0.48780807852745056, 0.5065627694129944, 0.5253174304962158, 0.5440720915794373, 0.5628267526626587, 0.5815814137458801, 0.6003360748291016, 0.619090735912323, 0.6378453969955444]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 14.0, 7.0, 16.0, 15.0, 21.0, 39.0, 35.0, 46.0, 71.0, 94.0, 155.0, 230.0, 390.0, 762.0, 1566.0, 3695.0, 13368.0, 75603.0, 748983.0, 170434.0, 22911.0, 5631.0, 2165.0, 960.0, 491.0, 276.0, 185.0, 125.0, 83.0, 59.0, 38.0, 20.0, 21.0, 12.0, 11.0, 0.0, 1.0, 9.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.537109375, -0.5161895751953125, -0.495269775390625, -0.4743499755859375, -0.45343017578125, -0.4325103759765625, -0.411590576171875, -0.3906707763671875, -0.3697509765625, -0.3488311767578125, -0.327911376953125, -0.3069915771484375, -0.28607177734375, -0.2651519775390625, -0.244232177734375, -0.2233123779296875, -0.202392578125, -0.1814727783203125, -0.160552978515625, -0.1396331787109375, -0.11871337890625, -0.0977935791015625, -0.076873779296875, -0.0559539794921875, -0.0350341796875, -0.0141143798828125, 0.006805419921875, 0.0277252197265625, 0.04864501953125, 0.0695648193359375, 0.090484619140625, 0.1114044189453125, 0.13232421875, 0.1532440185546875, 0.174163818359375, 0.1950836181640625, 0.21600341796875, 0.2369232177734375, 0.257843017578125, 0.2787628173828125, 0.2996826171875, 0.3206024169921875, 0.341522216796875, 0.3624420166015625, 0.38336181640625, 0.4042816162109375, 0.425201416015625, 0.4461212158203125, 0.467041015625, 0.4879608154296875, 0.508880615234375, 0.5298004150390625, 0.55072021484375, 0.5716400146484375, 0.592559814453125, 0.6134796142578125, 0.6343994140625, 0.6553192138671875, 0.676239013671875, 0.6971588134765625, 0.71807861328125, 0.7389984130859375, 0.759918212890625, 0.7808380126953125, 0.8017578125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 9.0, 11.0, 18.0, 14.0, 34.0, 39.0, 75.0, 97.0, 111.0, 97.0, 120.0, 95.0, 76.0, 68.0, 42.0, 30.0, 22.0, 18.0, 9.0, 2.0, 6.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1949462890625, -0.189178466796875, -0.18341064453125, -0.177642822265625, -0.171875, -0.166107177734375, -0.16033935546875, -0.154571533203125, -0.1488037109375, -0.143035888671875, -0.13726806640625, -0.131500244140625, -0.125732421875, -0.119964599609375, -0.11419677734375, -0.108428955078125, -0.1026611328125, -0.096893310546875, -0.09112548828125, -0.085357666015625, -0.07958984375, -0.073822021484375, -0.06805419921875, -0.062286376953125, -0.0565185546875, -0.050750732421875, -0.04498291015625, -0.039215087890625, -0.033447265625, -0.027679443359375, -0.02191162109375, -0.016143798828125, -0.0103759765625, -0.004608154296875, 0.00115966796875, 0.006927490234375, 0.0126953125, 0.018463134765625, 0.02423095703125, 0.029998779296875, 0.0357666015625, 0.041534423828125, 0.04730224609375, 0.053070068359375, 0.058837890625, 0.064605712890625, 0.07037353515625, 0.076141357421875, 0.0819091796875, 0.087677001953125, 0.09344482421875, 0.099212646484375, 0.10498046875, 0.110748291015625, 0.11651611328125, 0.122283935546875, 0.1280517578125, 0.133819580078125, 0.13958740234375, 0.145355224609375, 0.151123046875, 0.156890869140625, 0.16265869140625, 0.168426513671875, 0.1741943359375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 2.0, 9.0, 14.0, 5.0, 14.0, 16.0, 29.0, 37.0, 62.0, 107.0, 183.0, 330.0, 682.0, 1718.0, 4863.0, 16035.0, 73973.0, 676244.0, 227313.0, 33204.0, 8682.0, 2823.0, 1130.0, 461.0, 225.0, 132.0, 88.0, 52.0, 37.0, 27.0, 15.0, 13.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56982421875, -0.5506744384765625, -0.531524658203125, -0.5123748779296875, -0.49322509765625, -0.4740753173828125, -0.454925537109375, -0.4357757568359375, -0.4166259765625, -0.3974761962890625, -0.378326416015625, -0.3591766357421875, -0.34002685546875, -0.3208770751953125, -0.301727294921875, -0.2825775146484375, -0.263427734375, -0.2442779541015625, -0.225128173828125, -0.2059783935546875, -0.18682861328125, -0.1676788330078125, -0.148529052734375, -0.1293792724609375, -0.1102294921875, -0.0910797119140625, -0.071929931640625, -0.0527801513671875, -0.03363037109375, -0.0144805908203125, 0.004669189453125, 0.0238189697265625, 0.04296875, 0.0621185302734375, 0.081268310546875, 0.1004180908203125, 0.11956787109375, 0.1387176513671875, 0.157867431640625, 0.1770172119140625, 0.1961669921875, 0.2153167724609375, 0.234466552734375, 0.2536163330078125, 0.27276611328125, 0.2919158935546875, 0.311065673828125, 0.3302154541015625, 0.349365234375, 0.3685150146484375, 0.387664794921875, 0.4068145751953125, 0.42596435546875, 0.4451141357421875, 0.464263916015625, 0.4834136962890625, 0.5025634765625, 0.5217132568359375, 0.540863037109375, 0.5600128173828125, 0.57916259765625, 0.5983123779296875, 0.617462158203125, 0.6366119384765625, 0.65576171875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 4.0, 4.0, 0.0, 7.0, 9.0, 8.0, 11.0, 13.0, 12.0, 8.0, 21.0, 19.0, 20.0, 33.0, 18.0, 27.0, 27.0, 33.0, 33.0, 45.0, 44.0, 46.0, 44.0, 46.0, 42.0, 39.0, 41.0, 46.0, 30.0, 30.0, 38.0, 22.0, 26.0, 31.0, 23.0, 13.0, 23.0, 10.0, 10.0, 11.0, 9.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.362060546875, -0.34989166259765625, -0.3377227783203125, -0.32555389404296875, -0.313385009765625, -0.30121612548828125, -0.2890472412109375, -0.27687835693359375, -0.26470947265625, -0.25254058837890625, -0.2403717041015625, -0.22820281982421875, -0.216033935546875, -0.20386505126953125, -0.1916961669921875, -0.17952728271484375, -0.1673583984375, -0.15518951416015625, -0.1430206298828125, -0.13085174560546875, -0.118682861328125, -0.10651397705078125, -0.0943450927734375, -0.08217620849609375, -0.07000732421875, -0.05783843994140625, -0.0456695556640625, -0.03350067138671875, -0.021331787109375, -0.00916290283203125, 0.0030059814453125, 0.01517486572265625, 0.02734375, 0.03951263427734375, 0.0516815185546875, 0.06385040283203125, 0.076019287109375, 0.08818817138671875, 0.1003570556640625, 0.11252593994140625, 0.12469482421875, 0.13686370849609375, 0.1490325927734375, 0.16120147705078125, 0.173370361328125, 0.18553924560546875, 0.1977081298828125, 0.20987701416015625, 0.2220458984375, 0.23421478271484375, 0.2463836669921875, 0.25855255126953125, 0.270721435546875, 0.28289031982421875, 0.2950592041015625, 0.30722808837890625, 0.31939697265625, 0.33156585693359375, 0.3437347412109375, 0.35590362548828125, 0.368072509765625, 0.38024139404296875, 0.3924102783203125, 0.40457916259765625, 0.416748046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 3.0, 8.0, 11.0, 8.0, 21.0, 24.0, 54.0, 56.0, 120.0, 250.0, 601.0, 2414.0, 17587.0, 527373.0, 479672.0, 16921.0, 2300.0, 564.0, 276.0, 105.0, 75.0, 39.0, 25.0, 12.0, 9.0, 7.0, 8.0, 3.0, 2.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34619140625, -0.33464813232421875, -0.3231048583984375, -0.31156158447265625, -0.300018310546875, -0.28847503662109375, -0.2769317626953125, -0.26538848876953125, -0.25384521484375, -0.24230194091796875, -0.2307586669921875, -0.21921539306640625, -0.207672119140625, -0.19612884521484375, -0.1845855712890625, -0.17304229736328125, -0.1614990234375, -0.14995574951171875, -0.1384124755859375, -0.12686920166015625, -0.115325927734375, -0.10378265380859375, -0.0922393798828125, -0.08069610595703125, -0.06915283203125, -0.05760955810546875, -0.0460662841796875, -0.03452301025390625, -0.022979736328125, -0.01143646240234375, 0.0001068115234375, 0.01165008544921875, 0.023193359375, 0.03473663330078125, 0.0462799072265625, 0.05782318115234375, 0.069366455078125, 0.08090972900390625, 0.0924530029296875, 0.10399627685546875, 0.11553955078125, 0.12708282470703125, 0.1386260986328125, 0.15016937255859375, 0.161712646484375, 0.17325592041015625, 0.1847991943359375, 0.19634246826171875, 0.2078857421875, 0.21942901611328125, 0.2309722900390625, 0.24251556396484375, 0.254058837890625, 0.26560211181640625, 0.2771453857421875, 0.28868865966796875, 0.30023193359375, 0.31177520751953125, 0.3233184814453125, 0.33486175537109375, 0.346405029296875, 0.35794830322265625, 0.3694915771484375, 0.38103485107421875, 0.392578125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 14.0, 35.0, 76.0, 156.0, 296.0, 207.0, 90.0, 52.0, 33.0, 10.0, 9.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00030112266540527344, -0.0002894066274166107, -0.000277690589427948, -0.0002659745514392853, -0.00025425851345062256, -0.00024254247546195984, -0.00023082643747329712, -0.0002191103994846344, -0.00020739436149597168, -0.00019567832350730896, -0.00018396228551864624, -0.00017224624752998352, -0.0001605302095413208, -0.00014881417155265808, -0.00013709813356399536, -0.00012538209557533264, -0.00011366605758666992, -0.0001019500195980072, -9.023398160934448e-05, -7.851794362068176e-05, -6.680190563201904e-05, -5.508586764335632e-05, -4.3369829654693604e-05, -3.1653791666030884e-05, -1.9937753677368164e-05, -8.221715688705444e-06, 3.4943222999572754e-06, 1.5210360288619995e-05, 2.6926398277282715e-05, 3.8642436265945435e-05, 5.0358474254608154e-05, 6.207451224327087e-05, 7.37905502319336e-05, 8.550658822059631e-05, 9.722262620925903e-05, 0.00010893866419792175, 0.00012065470218658447, 0.0001323707401752472, 0.0001440867781639099, 0.00015580281615257263, 0.00016751885414123535, 0.00017923489212989807, 0.0001909509301185608, 0.0002026669681072235, 0.00021438300609588623, 0.00022609904408454895, 0.00023781508207321167, 0.0002495311200618744, 0.0002612471580505371, 0.00027296319603919983, 0.00028467923402786255, 0.00029639527201652527, 0.000308111310005188, 0.0003198273479938507, 0.00033154338598251343, 0.00034325942397117615, 0.00035497546195983887, 0.0003666914999485016, 0.0003784075379371643, 0.000390123575925827, 0.00040183961391448975, 0.00041355565190315247, 0.0004252716898918152, 0.0004369877278804779, 0.0004487037658691406]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 4.0, 5.0, 15.0, 14.0, 13.0, 25.0, 41.0, 69.0, 106.0, 157.0, 329.0, 1005.0, 4916.0, 68406.0, 921447.0, 46524.0, 3839.0, 871.0, 334.0, 149.0, 99.0, 57.0, 48.0, 22.0, 20.0, 9.0, 9.0, 6.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.51318359375, -0.49828338623046875, -0.4833831787109375, -0.46848297119140625, -0.453582763671875, -0.43868255615234375, -0.4237823486328125, -0.40888214111328125, -0.39398193359375, -0.37908172607421875, -0.3641815185546875, -0.34928131103515625, -0.334381103515625, -0.31948089599609375, -0.3045806884765625, -0.28968048095703125, -0.2747802734375, -0.25988006591796875, -0.2449798583984375, -0.23007965087890625, -0.215179443359375, -0.20027923583984375, -0.1853790283203125, -0.17047882080078125, -0.15557861328125, -0.14067840576171875, -0.1257781982421875, -0.11087799072265625, -0.095977783203125, -0.08107757568359375, -0.0661773681640625, -0.05127716064453125, -0.036376953125, -0.02147674560546875, -0.0065765380859375, 0.00832366943359375, 0.023223876953125, 0.03812408447265625, 0.0530242919921875, 0.06792449951171875, 0.08282470703125, 0.09772491455078125, 0.1126251220703125, 0.12752532958984375, 0.142425537109375, 0.15732574462890625, 0.1722259521484375, 0.18712615966796875, 0.2020263671875, 0.21692657470703125, 0.2318267822265625, 0.24672698974609375, 0.261627197265625, 0.27652740478515625, 0.2914276123046875, 0.30632781982421875, 0.32122802734375, 0.33612823486328125, 0.3510284423828125, 0.36592864990234375, 0.380828857421875, 0.39572906494140625, 0.4106292724609375, 0.42552947998046875, 0.4404296875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 2.0, 4.0, 3.0, 13.0, 10.0, 16.0, 25.0, 36.0, 43.0, 54.0, 57.0, 120.0, 118.0, 122.0, 99.0, 66.0, 43.0, 32.0, 22.0, 15.0, 19.0, 13.0, 13.0, 8.0, 6.0, 4.0, 4.0, 5.0, 5.0, 3.0, 0.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.185546875, -0.17972183227539062, -0.17389678955078125, -0.16807174682617188, -0.1622467041015625, -0.15642166137695312, -0.15059661865234375, -0.14477157592773438, -0.138946533203125, -0.13312149047851562, -0.12729644775390625, -0.12147140502929688, -0.1156463623046875, -0.10982131958007812, -0.10399627685546875, -0.09817123413085938, -0.09234619140625, -0.08652114868164062, -0.08069610595703125, -0.07487106323242188, -0.0690460205078125, -0.06322097778320312, -0.05739593505859375, -0.051570892333984375, -0.045745849609375, -0.039920806884765625, -0.03409576416015625, -0.028270721435546875, -0.0224456787109375, -0.016620635986328125, -0.01079559326171875, -0.004970550537109375, 0.0008544921875, 0.006679534912109375, 0.01250457763671875, 0.018329620361328125, 0.0241546630859375, 0.029979705810546875, 0.03580474853515625, 0.041629791259765625, 0.047454833984375, 0.053279876708984375, 0.05910491943359375, 0.06492996215820312, 0.0707550048828125, 0.07658004760742188, 0.08240509033203125, 0.08823013305664062, 0.09405517578125, 0.09988021850585938, 0.10570526123046875, 0.11153030395507812, 0.1173553466796875, 0.12318038940429688, 0.12900543212890625, 0.13483047485351562, 0.140655517578125, 0.14648056030273438, 0.15230560302734375, 0.15813064575195312, 0.1639556884765625, 0.16978073120117188, 0.17560577392578125, 0.18143081665039062, 0.187255859375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 9.0, 15.0, 39.0, 75.0, 172.0, 232.0, 211.0, 102.0, 78.0, 30.0, 20.0, 8.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16450572013855, -2.0163140296936035, -1.8681225776672363, -1.71993088722229, -1.5717393159866333, -1.4235477447509766, -1.2753560543060303, -1.1271644830703735, -0.9789729118347168, -0.8307813405990601, -0.6825897097587585, -0.534398078918457, -0.3862065076828003, -0.23801493644714355, -0.08982330560684204, 0.05836832523345947, 0.2065598964691162, 0.35475149750709534, 0.5029430985450745, 0.651134729385376, 0.7993263006210327, 0.9475178718566895, 1.0957095623016357, 1.2439011335372925, 1.3920927047729492, 1.540284276008606, 1.6884758472442627, 1.836667537689209, 1.9848591089248657, 2.1330506801605225, 2.2812423706054688, 2.429433822631836, 2.5776257514953613, 2.7258174419403076, 2.874008893966675, 3.022200584411621, 3.1703920364379883, 3.3185837268829346, 3.466775417327881, 3.614966869354248, 3.7631585597991943, 3.9113502502441406, 4.059541702270508, 4.207733154296875, 4.3559250831604, 4.504116535186768, 4.652307987213135, 4.80049991607666, 4.948691368103027, 5.0968828201293945, 5.24507474899292, 5.393266201019287, 5.541457653045654, 5.68964958190918, 5.837841033935547, 5.986032485961914, 6.134223937988281, 6.282415390014648, 6.430607318878174, 6.578798770904541, 6.726990222930908, 6.875182151794434, 7.023373603820801, 7.171565055847168, 7.319756984710693]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 11.0, 8.0, 7.0, 18.0, 13.0, 16.0, 26.0, 24.0, 21.0, 32.0, 29.0, 28.0, 37.0, 39.0, 43.0, 46.0, 58.0, 53.0, 37.0, 51.0, 33.0, 55.0, 37.0, 36.0, 40.0, 40.0, 33.0, 17.0, 22.0, 23.0, 13.0, 14.0, 11.0, 6.0, 6.0, 8.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4904160499572754, -2.4153387546539307, -2.340261459350586, -2.2651844024658203, -2.1901071071624756, -2.115029811859131, -2.0399527549743652, -1.9648754596710205, -1.8897981643676758, -1.814720869064331, -1.7396436929702759, -1.6645665168762207, -1.589489221572876, -1.5144119262695312, -1.439334750175476, -1.364257574081421, -1.2891802787780762, -1.2141029834747314, -1.1390258073806763, -1.063948631286621, -0.9888713359832764, -0.9137941002845764, -0.8387168645858765, -0.7636396288871765, -0.6885623931884766, -0.6134851574897766, -0.5384079217910767, -0.4633306860923767, -0.38825345039367676, -0.3131762146949768, -0.23809897899627686, -0.1630217432975769, -0.08794450759887695, -0.012867271900177002, 0.06220996379852295, 0.1372871994972229, 0.21236443519592285, 0.2874416708946228, 0.36251890659332275, 0.4375961422920227, 0.5126733779907227, 0.5877506136894226, 0.6628278493881226, 0.7379050850868225, 0.8129823207855225, 0.8880595564842224, 0.9631367921829224, 1.0382139682769775, 1.1132912635803223, 1.188368558883667, 1.2634457349777222, 1.3385229110717773, 1.413600206375122, 1.4886775016784668, 1.563754677772522, 1.6388318538665771, 1.7139091491699219, 1.7889864444732666, 1.8640636205673218, 1.939140796661377, 2.0142180919647217, 2.0892953872680664, 2.164372444152832, 2.2394497394561768, 2.3145270347595215]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 1.0, 8.0, 6.0, 10.0, 8.0, 17.0, 18.0, 31.0, 49.0, 66.0, 108.0, 178.0, 404.0, 973.0, 2672.0, 11006.0, 145461.0, 3989187.0, 35628.0, 5721.0, 1621.0, 573.0, 215.0, 139.0, 76.0, 31.0, 30.0, 20.0, 13.0, 3.0, 7.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8212890625, -0.7966156005859375, -0.771942138671875, -0.7472686767578125, -0.72259521484375, -0.6979217529296875, -0.673248291015625, -0.6485748291015625, -0.6239013671875, -0.5992279052734375, -0.574554443359375, -0.5498809814453125, -0.52520751953125, -0.5005340576171875, -0.475860595703125, -0.4511871337890625, -0.426513671875, -0.4018402099609375, -0.377166748046875, -0.3524932861328125, -0.32781982421875, -0.3031463623046875, -0.278472900390625, -0.2537994384765625, -0.2291259765625, -0.2044525146484375, -0.179779052734375, -0.1551055908203125, -0.13043212890625, -0.1057586669921875, -0.081085205078125, -0.0564117431640625, -0.03173828125, -0.0070648193359375, 0.017608642578125, 0.0422821044921875, 0.06695556640625, 0.0916290283203125, 0.116302490234375, 0.1409759521484375, 0.1656494140625, 0.1903228759765625, 0.214996337890625, 0.2396697998046875, 0.26434326171875, 0.2890167236328125, 0.313690185546875, 0.3383636474609375, 0.363037109375, 0.3877105712890625, 0.412384033203125, 0.4370574951171875, 0.46173095703125, 0.4864044189453125, 0.511077880859375, 0.5357513427734375, 0.5604248046875, 0.5850982666015625, 0.609771728515625, 0.6344451904296875, 0.65911865234375, 0.6837921142578125, 0.708465576171875, 0.7331390380859375, 0.7578125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 10.0, 12.0, 13.0, 23.0, 24.0, 38.0, 61.0, 74.0, 113.0, 114.0, 118.0, 93.0, 77.0, 64.0, 52.0, 33.0, 28.0, 21.0, 16.0, 4.0, 4.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2017822265625, -0.19587135314941406, -0.18996047973632812, -0.1840496063232422, -0.17813873291015625, -0.1722278594970703, -0.16631698608398438, -0.16040611267089844, -0.1544952392578125, -0.14858436584472656, -0.14267349243164062, -0.1367626190185547, -0.13085174560546875, -0.12494087219238281, -0.11902999877929688, -0.11311912536621094, -0.107208251953125, -0.10129737854003906, -0.09538650512695312, -0.08947563171386719, -0.08356475830078125, -0.07765388488769531, -0.07174301147460938, -0.06583213806152344, -0.0599212646484375, -0.05401039123535156, -0.048099517822265625, -0.04218864440917969, -0.03627777099609375, -0.030366897583007812, -0.024456024169921875, -0.018545150756835938, -0.01263427734375, -0.0067234039306640625, -0.000812530517578125, 0.0050983428955078125, 0.01100921630859375, 0.016920089721679688, 0.022830963134765625, 0.028741836547851562, 0.0346527099609375, 0.04056358337402344, 0.046474456787109375, 0.05238533020019531, 0.05829620361328125, 0.06420707702636719, 0.07011795043945312, 0.07602882385253906, 0.081939697265625, 0.08785057067871094, 0.09376144409179688, 0.09967231750488281, 0.10558319091796875, 0.11149406433105469, 0.11740493774414062, 0.12331581115722656, 0.1292266845703125, 0.13513755798339844, 0.14104843139648438, 0.1469593048095703, 0.15287017822265625, 0.1587810516357422, 0.16469192504882812, 0.17060279846191406, 0.176513671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 9.0, 14.0, 17.0, 42.0, 68.0, 129.0, 290.0, 688.0, 1921.0, 7144.0, 40909.0, 3666554.0, 447909.0, 21551.0, 4660.0, 1422.0, 512.0, 227.0, 89.0, 57.0, 27.0, 17.0, 14.0, 7.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84375, -0.8220291137695312, -0.8003082275390625, -0.7785873413085938, -0.756866455078125, -0.7351455688476562, -0.7134246826171875, -0.6917037963867188, -0.66998291015625, -0.6482620239257812, -0.6265411376953125, -0.6048202514648438, -0.583099365234375, -0.5613784790039062, -0.5396575927734375, -0.5179367065429688, -0.4962158203125, -0.47449493408203125, -0.4527740478515625, -0.43105316162109375, -0.409332275390625, -0.38761138916015625, -0.3658905029296875, -0.34416961669921875, -0.32244873046875, -0.30072784423828125, -0.2790069580078125, -0.25728607177734375, -0.235565185546875, -0.21384429931640625, -0.1921234130859375, -0.17040252685546875, -0.148681640625, -0.12696075439453125, -0.1052398681640625, -0.08351898193359375, -0.061798095703125, -0.04007720947265625, -0.0183563232421875, 0.00336456298828125, 0.02508544921875, 0.04680633544921875, 0.0685272216796875, 0.09024810791015625, 0.111968994140625, 0.13368988037109375, 0.1554107666015625, 0.17713165283203125, 0.1988525390625, 0.22057342529296875, 0.2422943115234375, 0.26401519775390625, 0.285736083984375, 0.30745697021484375, 0.3291778564453125, 0.35089874267578125, 0.37261962890625, 0.39434051513671875, 0.4160614013671875, 0.43778228759765625, 0.459503173828125, 0.48122406005859375, 0.5029449462890625, 0.5246658325195312, 0.54638671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 10.0, 10.0, 19.0, 26.0, 54.0, 108.0, 338.0, 2523.0, 687.0, 147.0, 63.0, 35.0, 18.0, 10.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.4140625, -0.40499305725097656, -0.3959236145019531, -0.3868541717529297, -0.37778472900390625, -0.3687152862548828, -0.3596458435058594, -0.35057640075683594, -0.3415069580078125, -0.33243751525878906, -0.3233680725097656, -0.3142986297607422, -0.30522918701171875, -0.2961597442626953, -0.2870903015136719, -0.27802085876464844, -0.268951416015625, -0.25988197326660156, -0.2508125305175781, -0.2417430877685547, -0.23267364501953125, -0.2236042022705078, -0.21453475952148438, -0.20546531677246094, -0.1963958740234375, -0.18732643127441406, -0.17825698852539062, -0.1691875457763672, -0.16011810302734375, -0.1510486602783203, -0.14197921752929688, -0.13290977478027344, -0.12384033203125, -0.11477088928222656, -0.10570144653320312, -0.09663200378417969, -0.08756256103515625, -0.07849311828613281, -0.06942367553710938, -0.06035423278808594, -0.0512847900390625, -0.04221534729003906, -0.033145904541015625, -0.024076461791992188, -0.01500701904296875, -0.0059375762939453125, 0.003131866455078125, 0.012201309204101562, 0.021270751953125, 0.030340194702148438, 0.039409637451171875, 0.04847908020019531, 0.05754852294921875, 0.06661796569824219, 0.07568740844726562, 0.08475685119628906, 0.0938262939453125, 0.10289573669433594, 0.11196517944335938, 0.12103462219238281, 0.13010406494140625, 0.1391735076904297, 0.14824295043945312, 0.15731239318847656, 0.1663818359375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 4.0, 7.0, 9.0, 8.0, 20.0, 45.0, 69.0, 90.0, 100.0, 149.0, 137.0, 109.0, 107.0, 54.0, 30.0, 21.0, 13.0, 9.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6373927593231201, -0.6108295321464539, -0.5842663645744324, -0.5577031373977661, -0.5311399698257446, -0.5045767426490784, -0.4780135154724121, -0.45145031809806824, -0.42488712072372437, -0.3983239233493805, -0.3717607259750366, -0.34519749879837036, -0.3186343014240265, -0.2920711040496826, -0.26550787687301636, -0.23894467949867249, -0.2123814821243286, -0.18581828474998474, -0.15925507247447968, -0.1326918601989746, -0.10612866282463074, -0.07956546545028687, -0.0530022531747818, -0.026439040899276733, 0.00012415647506713867, 0.026687361299991608, 0.05325056612491608, 0.07981377094984055, 0.10637697577476501, 0.1329401731491089, 0.15950338542461395, 0.18606659770011902, 0.2126297950744629, 0.23919299244880676, 0.26575618982315063, 0.2923194169998169, 0.31888261437416077, 0.34544581174850464, 0.3720090389251709, 0.39857223629951477, 0.42513543367385864, 0.4516986310482025, 0.4782618284225464, 0.5048250555992126, 0.5313882827758789, 0.5579514503479004, 0.5845146775245667, 0.6110779047012329, 0.6376410722732544, 0.6642042994499207, 0.6907674670219421, 0.7173306941986084, 0.7438938617706299, 0.7704570889472961, 0.7970203161239624, 0.8235834836959839, 0.8501467108726501, 0.8767099380493164, 0.9032731056213379, 0.9298363327980042, 0.9563995599746704, 0.9829627275466919, 1.0095258951187134, 1.0360891819000244, 1.062652349472046]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 10.0, 6.0, 15.0, 25.0, 27.0, 42.0, 37.0, 61.0, 56.0, 63.0, 59.0, 65.0, 79.0, 72.0, 69.0, 66.0, 55.0, 47.0, 42.0, 33.0, 22.0, 22.0, 14.0, 12.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5507141351699829, -0.524960994720459, -0.49920785427093506, -0.4734547436237335, -0.4477016031742096, -0.42194846272468567, -0.39619535207748413, -0.3704422116279602, -0.3446890711784363, -0.31893593072891235, -0.2931827902793884, -0.2674296796321869, -0.24167653918266296, -0.21592339873313904, -0.1901702731847763, -0.16441714763641357, -0.13866400718688965, -0.11291087418794632, -0.08715774118900299, -0.06140460819005966, -0.03565147519111633, -0.009898334741592407, 0.015854790806770325, 0.04160791635513306, 0.06736105680465698, 0.09311418980360031, 0.11886732280254364, 0.14462044835090637, 0.1703735888004303, 0.19612672924995422, 0.22187985479831696, 0.2476329803466797, 0.2733861207962036, 0.29913926124572754, 0.32489240169525146, 0.350645512342453, 0.37639865279197693, 0.40215179324150085, 0.4279049038887024, 0.4536580443382263, 0.47941118478775024, 0.5051643252372742, 0.5309174656867981, 0.556670606136322, 0.5824236869812012, 0.6081768274307251, 0.633929967880249, 0.659683108329773, 0.6854362487792969, 0.7111893892288208, 0.7369425296783447, 0.7626956701278687, 0.7884488105773926, 0.8142019510269165, 0.8399550318717957, 0.8657081723213196, 0.8914613127708435, 0.9172144532203674, 0.9429675936698914, 0.9687207341194153, 0.9944738149642944, 1.0202269554138184, 1.0459800958633423, 1.0717332363128662, 1.0974863767623901]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 5.0, 6.0, 7.0, 11.0, 8.0, 9.0, 18.0, 24.0, 32.0, 37.0, 52.0, 80.0, 111.0, 198.0, 267.0, 463.0, 774.0, 1424.0, 2947.0, 7766.0, 27805.0, 137210.0, 642753.0, 176569.0, 33839.0, 8966.0, 3337.0, 1517.0, 821.0, 518.0, 302.0, 209.0, 143.0, 93.0, 64.0, 53.0, 24.0, 29.0, 26.0, 12.0, 4.0, 4.0, 4.0, 7.0, 4.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.464599609375, -0.4488868713378906, -0.43317413330078125, -0.4174613952636719, -0.4017486572265625, -0.3860359191894531, -0.37032318115234375, -0.3546104431152344, -0.338897705078125, -0.3231849670410156, -0.30747222900390625, -0.2917594909667969, -0.2760467529296875, -0.2603340148925781, -0.24462127685546875, -0.22890853881835938, -0.21319580078125, -0.19748306274414062, -0.18177032470703125, -0.16605758666992188, -0.1503448486328125, -0.13463211059570312, -0.11891937255859375, -0.10320663452148438, -0.087493896484375, -0.07178115844726562, -0.05606842041015625, -0.040355682373046875, -0.0246429443359375, -0.008930206298828125, 0.00678253173828125, 0.022495269775390625, 0.0382080078125, 0.053920745849609375, 0.06963348388671875, 0.08534622192382812, 0.1010589599609375, 0.11677169799804688, 0.13248443603515625, 0.14819717407226562, 0.163909912109375, 0.17962265014648438, 0.19533538818359375, 0.21104812622070312, 0.2267608642578125, 0.24247360229492188, 0.25818634033203125, 0.2738990783691406, 0.28961181640625, 0.3053245544433594, 0.32103729248046875, 0.3367500305175781, 0.3524627685546875, 0.3681755065917969, 0.38388824462890625, 0.3996009826660156, 0.415313720703125, 0.4310264587402344, 0.44673919677734375, 0.4624519348144531, 0.4781646728515625, 0.4938774108886719, 0.5095901489257812, 0.5253028869628906, 0.541015625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 11.0, 15.0, 18.0, 26.0, 29.0, 59.0, 71.0, 81.0, 117.0, 101.0, 112.0, 101.0, 67.0, 54.0, 33.0, 32.0, 25.0, 15.0, 8.0, 10.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19677734375, -0.19091224670410156, -0.18504714965820312, -0.1791820526123047, -0.17331695556640625, -0.1674518585205078, -0.16158676147460938, -0.15572166442871094, -0.1498565673828125, -0.14399147033691406, -0.13812637329101562, -0.1322612762451172, -0.12639617919921875, -0.12053108215332031, -0.11466598510742188, -0.10880088806152344, -0.102935791015625, -0.09707069396972656, -0.09120559692382812, -0.08534049987792969, -0.07947540283203125, -0.07361030578613281, -0.06774520874023438, -0.06188011169433594, -0.0560150146484375, -0.05014991760253906, -0.044284820556640625, -0.03841972351074219, -0.03255462646484375, -0.026689529418945312, -0.020824432373046875, -0.014959335327148438, -0.00909423828125, -0.0032291412353515625, 0.002635955810546875, 0.008501052856445312, 0.01436614990234375, 0.020231246948242188, 0.026096343994140625, 0.03196144104003906, 0.0378265380859375, 0.04369163513183594, 0.049556732177734375, 0.05542182922363281, 0.06128692626953125, 0.06715202331542969, 0.07301712036132812, 0.07888221740722656, 0.084747314453125, 0.09061241149902344, 0.09647750854492188, 0.10234260559082031, 0.10820770263671875, 0.11407279968261719, 0.11993789672851562, 0.12580299377441406, 0.1316680908203125, 0.13753318786621094, 0.14339828491210938, 0.1492633819580078, 0.15512847900390625, 0.1609935760498047, 0.16685867309570312, 0.17272377014160156, 0.1785888671875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 4.0, 8.0, 21.0, 21.0, 28.0, 41.0, 55.0, 103.0, 169.0, 298.0, 529.0, 1104.0, 2767.0, 7286.0, 23083.0, 92014.0, 554815.0, 288529.0, 53864.0, 14962.0, 5016.0, 1946.0, 832.0, 409.0, 221.0, 143.0, 99.0, 67.0, 36.0, 26.0, 21.0, 4.0, 9.0, 11.0, 6.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.470947265625, -0.456146240234375, -0.44134521484375, -0.426544189453125, -0.4117431640625, -0.396942138671875, -0.38214111328125, -0.367340087890625, -0.3525390625, -0.337738037109375, -0.32293701171875, -0.308135986328125, -0.2933349609375, -0.278533935546875, -0.26373291015625, -0.248931884765625, -0.234130859375, -0.219329833984375, -0.20452880859375, -0.189727783203125, -0.1749267578125, -0.160125732421875, -0.14532470703125, -0.130523681640625, -0.11572265625, -0.100921630859375, -0.08612060546875, -0.071319580078125, -0.0565185546875, -0.041717529296875, -0.02691650390625, -0.012115478515625, 0.002685546875, 0.017486572265625, 0.03228759765625, 0.047088623046875, 0.0618896484375, 0.076690673828125, 0.09149169921875, 0.106292724609375, 0.12109375, 0.135894775390625, 0.15069580078125, 0.165496826171875, 0.1802978515625, 0.195098876953125, 0.20989990234375, 0.224700927734375, 0.239501953125, 0.254302978515625, 0.26910400390625, 0.283905029296875, 0.2987060546875, 0.313507080078125, 0.32830810546875, 0.343109130859375, 0.35791015625, 0.372711181640625, 0.38751220703125, 0.402313232421875, 0.4171142578125, 0.431915283203125, 0.44671630859375, 0.461517333984375, 0.476318359375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 6.0, 7.0, 17.0, 9.0, 16.0, 20.0, 25.0, 30.0, 25.0, 34.0, 34.0, 35.0, 45.0, 47.0, 41.0, 43.0, 51.0, 36.0, 49.0, 48.0, 33.0, 45.0, 53.0, 36.0, 32.0, 32.0, 33.0, 17.0, 10.0, 18.0, 17.0, 10.0, 7.0, 3.0, 7.0, 5.0, 3.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.447998046875, -0.4348602294921875, -0.421722412109375, -0.4085845947265625, -0.39544677734375, -0.3823089599609375, -0.369171142578125, -0.3560333251953125, -0.3428955078125, -0.3297576904296875, -0.316619873046875, -0.3034820556640625, -0.29034423828125, -0.2772064208984375, -0.264068603515625, -0.2509307861328125, -0.23779296875, -0.2246551513671875, -0.211517333984375, -0.1983795166015625, -0.18524169921875, -0.1721038818359375, -0.158966064453125, -0.1458282470703125, -0.1326904296875, -0.1195526123046875, -0.106414794921875, -0.0932769775390625, -0.08013916015625, -0.0670013427734375, -0.053863525390625, -0.0407257080078125, -0.027587890625, -0.0144500732421875, -0.001312255859375, 0.0118255615234375, 0.02496337890625, 0.0381011962890625, 0.051239013671875, 0.0643768310546875, 0.0775146484375, 0.0906524658203125, 0.103790283203125, 0.1169281005859375, 0.13006591796875, 0.1432037353515625, 0.156341552734375, 0.1694793701171875, 0.1826171875, 0.1957550048828125, 0.208892822265625, 0.2220306396484375, 0.23516845703125, 0.2483062744140625, 0.261444091796875, 0.2745819091796875, 0.2877197265625, 0.3008575439453125, 0.313995361328125, 0.3271331787109375, 0.34027099609375, 0.3534088134765625, 0.366546630859375, 0.3796844482421875, 0.392822265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 9.0, 11.0, 31.0, 64.0, 133.0, 407.0, 1990.0, 53512.0, 968821.0, 21660.0, 1377.0, 354.0, 103.0, 45.0, 23.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.492919921875, -0.4772224426269531, -0.46152496337890625, -0.4458274841308594, -0.4301300048828125, -0.4144325256347656, -0.39873504638671875, -0.3830375671386719, -0.367340087890625, -0.3516426086425781, -0.33594512939453125, -0.3202476501464844, -0.3045501708984375, -0.2888526916503906, -0.27315521240234375, -0.2574577331542969, -0.24176025390625, -0.22606277465820312, -0.21036529541015625, -0.19466781616210938, -0.1789703369140625, -0.16327285766601562, -0.14757537841796875, -0.13187789916992188, -0.116180419921875, -0.10048294067382812, -0.08478546142578125, -0.06908798217773438, -0.0533905029296875, -0.037693023681640625, -0.02199554443359375, -0.006298065185546875, 0.0093994140625, 0.025096893310546875, 0.04079437255859375, 0.056491851806640625, 0.0721893310546875, 0.08788681030273438, 0.10358428955078125, 0.11928176879882812, 0.134979248046875, 0.15067672729492188, 0.16637420654296875, 0.18207168579101562, 0.1977691650390625, 0.21346664428710938, 0.22916412353515625, 0.24486160278320312, 0.26055908203125, 0.2762565612792969, 0.29195404052734375, 0.3076515197753906, 0.3233489990234375, 0.3390464782714844, 0.35474395751953125, 0.3704414367675781, 0.386138916015625, 0.4018363952636719, 0.41753387451171875, 0.4332313537597656, 0.4489288330078125, 0.4646263122558594, 0.48032379150390625, 0.4960212707519531, 0.51171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 7.0, 19.0, 26.0, 54.0, 68.0, 93.0, 179.0, 196.0, 148.0, 82.0, 54.0, 28.0, 19.0, 17.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003497600555419922, -0.0003398619592189789, -0.0003299638628959656, -0.00032006576657295227, -0.00031016767024993896, -0.00030026957392692566, -0.00029037147760391235, -0.00028047338128089905, -0.00027057528495788574, -0.00026067718863487244, -0.00025077909231185913, -0.00024088099598884583, -0.00023098289966583252, -0.00022108480334281921, -0.0002111867070198059, -0.0002012886106967926, -0.0001913905143737793, -0.000181492418050766, -0.00017159432172775269, -0.00016169622540473938, -0.00015179812908172607, -0.00014190003275871277, -0.00013200193643569946, -0.00012210384011268616, -0.00011220574378967285, -0.00010230764746665955, -9.240955114364624e-05, -8.251145482063293e-05, -7.261335849761963e-05, -6.271526217460632e-05, -5.281716585159302e-05, -4.291906952857971e-05, -3.3020973205566406e-05, -2.31228768825531e-05, -1.3224780559539795e-05, -3.3266842365264893e-06, 6.571412086486816e-06, 1.6469508409500122e-05, 2.6367604732513428e-05, 3.6265701055526733e-05, 4.616379737854004e-05, 5.6061893701553345e-05, 6.595999002456665e-05, 7.585808634757996e-05, 8.575618267059326e-05, 9.565427899360657e-05, 0.00010555237531661987, 0.00011545047163963318, 0.00012534856796264648, 0.0001352466642856598, 0.0001451447606086731, 0.0001550428569316864, 0.0001649409532546997, 0.000174839049577713, 0.00018473714590072632, 0.00019463524222373962, 0.00020453333854675293, 0.00021443143486976624, 0.00022432953119277954, 0.00023422762751579285, 0.00024412572383880615, 0.00025402382016181946, 0.00026392191648483276, 0.00027382001280784607, 0.0002837181091308594]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 4.0, 8.0, 5.0, 14.0, 31.0, 53.0, 95.0, 175.0, 393.0, 1259.0, 4324.0, 33017.0, 738515.0, 251076.0, 15433.0, 2665.0, 821.0, 338.0, 142.0, 88.0, 48.0, 20.0, 13.0, 11.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.279541015625, -0.270172119140625, -0.26080322265625, -0.251434326171875, -0.2420654296875, -0.232696533203125, -0.22332763671875, -0.213958740234375, -0.20458984375, -0.195220947265625, -0.18585205078125, -0.176483154296875, -0.1671142578125, -0.157745361328125, -0.14837646484375, -0.139007568359375, -0.129638671875, -0.120269775390625, -0.11090087890625, -0.101531982421875, -0.0921630859375, -0.082794189453125, -0.07342529296875, -0.064056396484375, -0.0546875, -0.045318603515625, -0.03594970703125, -0.026580810546875, -0.0172119140625, -0.007843017578125, 0.00152587890625, 0.010894775390625, 0.020263671875, 0.029632568359375, 0.03900146484375, 0.048370361328125, 0.0577392578125, 0.067108154296875, 0.07647705078125, 0.085845947265625, 0.09521484375, 0.104583740234375, 0.11395263671875, 0.123321533203125, 0.1326904296875, 0.142059326171875, 0.15142822265625, 0.160797119140625, 0.170166015625, 0.179534912109375, 0.18890380859375, 0.198272705078125, 0.2076416015625, 0.217010498046875, 0.22637939453125, 0.235748291015625, 0.2451171875, 0.254486083984375, 0.26385498046875, 0.273223876953125, 0.2825927734375, 0.291961669921875, 0.30133056640625, 0.310699462890625, 0.320068359375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 8.0, 9.0, 9.0, 17.0, 24.0, 23.0, 61.0, 81.0, 131.0, 176.0, 167.0, 105.0, 68.0, 30.0, 34.0, 24.0, 9.0, 8.0, 8.0, 7.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2391357421875, -0.23110389709472656, -0.22307205200195312, -0.2150402069091797, -0.20700836181640625, -0.1989765167236328, -0.19094467163085938, -0.18291282653808594, -0.1748809814453125, -0.16684913635253906, -0.15881729125976562, -0.1507854461669922, -0.14275360107421875, -0.1347217559814453, -0.12668991088867188, -0.11865806579589844, -0.110626220703125, -0.10259437561035156, -0.09456253051757812, -0.08653068542480469, -0.07849884033203125, -0.07046699523925781, -0.062435150146484375, -0.05440330505371094, -0.0463714599609375, -0.03833961486816406, -0.030307769775390625, -0.022275924682617188, -0.01424407958984375, -0.0062122344970703125, 0.001819610595703125, 0.009851455688476562, 0.01788330078125, 0.025915145874023438, 0.033946990966796875, 0.04197883605957031, 0.05001068115234375, 0.05804252624511719, 0.06607437133789062, 0.07410621643066406, 0.0821380615234375, 0.09016990661621094, 0.09820175170898438, 0.10623359680175781, 0.11426544189453125, 0.12229728698730469, 0.13032913208007812, 0.13836097717285156, 0.146392822265625, 0.15442466735839844, 0.16245651245117188, 0.1704883575439453, 0.17852020263671875, 0.1865520477294922, 0.19458389282226562, 0.20261573791503906, 0.2106475830078125, 0.21867942810058594, 0.22671127319335938, 0.2347431182861328, 0.24277496337890625, 0.2508068084716797, 0.2588386535644531, 0.26687049865722656, 0.27490234375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 16.0, 82.0, 635.0, 252.0, 25.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.62903594970703, -18.192445755004883, -17.7558536529541, -17.319263458251953, -16.882673263549805, -16.446081161499023, -16.009490966796875, -15.572900772094727, -15.136309623718262, -14.699718475341797, -14.263128280639648, -13.826537132263184, -13.389945983886719, -12.95335578918457, -12.516764640808105, -12.08017349243164, -11.643583297729492, -11.206992149353027, -10.770401954650879, -10.333810806274414, -9.89721965789795, -9.4606294631958, -9.024038314819336, -8.587448120117188, -8.150856018066406, -7.7142653465271, -7.277674198150635, -6.841083526611328, -6.4044928550720215, -5.967902183532715, -5.53131103515625, -5.094720363616943, -4.658129692077637, -4.22153902053833, -3.7849481105804443, -3.3483572006225586, -2.911766529083252, -2.475175619125366, -2.0385847091674805, -1.6019940376281738, -1.165403127670288, -0.7288123369216919, -0.2922214865684509, 0.14436936378479004, 0.5809601545333862, 1.0175509452819824, 1.4541418552398682, 1.8907325267791748, 2.3273234367370605, 2.7639143466949463, 3.200505018234253, 3.6370959281921387, 4.073686599731445, 4.51027774810791, 4.946868419647217, 5.383459091186523, 5.820050239562988, 6.256640911102295, 6.69323205947876, 7.129822731018066, 7.566413402557373, 8.00300407409668, 8.439595222473145, 8.87618637084961, 9.312776565551758]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 2.0, 6.0, 8.0, 10.0, 13.0, 16.0, 18.0, 13.0, 18.0, 27.0, 18.0, 29.0, 23.0, 39.0, 33.0, 44.0, 36.0, 50.0, 47.0, 49.0, 42.0, 49.0, 35.0, 34.0, 45.0, 42.0, 38.0, 37.0, 26.0, 22.0, 25.0, 28.0, 16.0, 16.0, 13.0, 6.0, 8.0, 5.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7476615905761719, -1.6891059875488281, -1.6305503845214844, -1.5719947814941406, -1.5134391784667969, -1.4548835754394531, -1.3963279724121094, -1.337772250175476, -1.2792166471481323, -1.2206610441207886, -1.1621054410934448, -1.103549838066101, -1.0449942350387573, -0.9864385724067688, -0.927882969379425, -0.8693273067474365, -0.8107717633247375, -0.7522161602973938, -0.69366055727005, -0.6351048946380615, -0.5765492916107178, -0.517993688583374, -0.4594380855560303, -0.40088245272636414, -0.3423268496990204, -0.28377124667167664, -0.2252156138420105, -0.16666001081466675, -0.1081043928861618, -0.04954877495765686, 0.00900682806968689, 0.06756246089935303, 0.12611806392669678, 0.18467368185520172, 0.24322929978370667, 0.3017849028110504, 0.36034053564071655, 0.4188961386680603, 0.47745174169540405, 0.5360074043273926, 0.5945630073547363, 0.6531186103820801, 0.7116742134094238, 0.7702298164367676, 0.8287854790687561, 0.8873410820960999, 0.9458966851234436, 1.0044523477554321, 1.0630078315734863, 1.12156343460083, 1.1801190376281738, 1.2386746406555176, 1.2972302436828613, 1.355785846710205, 1.4143414497375488, 1.4728971719741821, 1.5314527750015259, 1.5900083780288696, 1.6485639810562134, 1.7071195840835571, 1.7656751871109009, 1.8242309093475342, 1.882786512374878, 1.9413421154022217, 1.9998977184295654]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 5.0, 9.0, 7.0, 12.0, 6.0, 23.0, 18.0, 26.0, 36.0, 50.0, 58.0, 96.0, 162.0, 231.0, 340.0, 613.0, 1171.0, 2613.0, 6687.0, 23795.0, 345878.0, 3749003.0, 46584.0, 9962.0, 3515.0, 1534.0, 744.0, 393.0, 237.0, 131.0, 86.0, 77.0, 52.0, 22.0, 19.0, 18.0, 15.0, 10.0, 5.0, 3.0, 5.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.91552734375, -0.8879318237304688, -0.8603363037109375, -0.8327407836914062, -0.805145263671875, -0.7775497436523438, -0.7499542236328125, -0.7223587036132812, -0.69476318359375, -0.6671676635742188, -0.6395721435546875, -0.6119766235351562, -0.584381103515625, -0.5567855834960938, -0.5291900634765625, -0.5015945434570312, -0.4739990234375, -0.44640350341796875, -0.4188079833984375, -0.39121246337890625, -0.363616943359375, -0.33602142333984375, -0.3084259033203125, -0.28083038330078125, -0.25323486328125, -0.22563934326171875, -0.1980438232421875, -0.17044830322265625, -0.142852783203125, -0.11525726318359375, -0.0876617431640625, -0.06006622314453125, -0.032470703125, -0.00487518310546875, 0.0227203369140625, 0.05031585693359375, 0.077911376953125, 0.10550689697265625, 0.1331024169921875, 0.16069793701171875, 0.18829345703125, 0.21588897705078125, 0.2434844970703125, 0.27108001708984375, 0.298675537109375, 0.32627105712890625, 0.3538665771484375, 0.38146209716796875, 0.4090576171875, 0.43665313720703125, 0.4642486572265625, 0.49184417724609375, 0.519439697265625, 0.5470352172851562, 0.5746307373046875, 0.6022262573242188, 0.62982177734375, 0.6574172973632812, 0.6850128173828125, 0.7126083374023438, 0.740203857421875, 0.7677993774414062, 0.7953948974609375, 0.8229904174804688, 0.8505859375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 9.0, 10.0, 14.0, 21.0, 24.0, 30.0, 53.0, 70.0, 92.0, 108.0, 114.0, 112.0, 83.0, 71.0, 49.0, 40.0, 27.0, 32.0, 11.0, 7.0, 11.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1995849609375, -0.193634033203125, -0.18768310546875, -0.181732177734375, -0.17578125, -0.169830322265625, -0.16387939453125, -0.157928466796875, -0.1519775390625, -0.146026611328125, -0.14007568359375, -0.134124755859375, -0.128173828125, -0.122222900390625, -0.11627197265625, -0.110321044921875, -0.1043701171875, -0.098419189453125, -0.09246826171875, -0.086517333984375, -0.08056640625, -0.074615478515625, -0.06866455078125, -0.062713623046875, -0.0567626953125, -0.050811767578125, -0.04486083984375, -0.038909912109375, -0.032958984375, -0.027008056640625, -0.02105712890625, -0.015106201171875, -0.0091552734375, -0.003204345703125, 0.00274658203125, 0.008697509765625, 0.0146484375, 0.020599365234375, 0.02655029296875, 0.032501220703125, 0.0384521484375, 0.044403076171875, 0.05035400390625, 0.056304931640625, 0.062255859375, 0.068206787109375, 0.07415771484375, 0.080108642578125, 0.0860595703125, 0.092010498046875, 0.09796142578125, 0.103912353515625, 0.10986328125, 0.115814208984375, 0.12176513671875, 0.127716064453125, 0.1336669921875, 0.139617919921875, 0.14556884765625, 0.151519775390625, 0.157470703125, 0.163421630859375, 0.16937255859375, 0.175323486328125, 0.1812744140625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 5.0, 9.0, 9.0, 18.0, 27.0, 39.0, 51.0, 112.0, 153.0, 265.0, 495.0, 1037.0, 2149.0, 5449.0, 15375.0, 69342.0, 3384822.0, 651371.0, 44000.0, 11492.0, 4286.0, 1892.0, 826.0, 469.0, 235.0, 130.0, 87.0, 63.0, 31.0, 17.0, 10.0, 6.0, 9.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7802734375, -0.7602005004882812, -0.7401275634765625, -0.7200546264648438, -0.699981689453125, -0.6799087524414062, -0.6598358154296875, -0.6397628784179688, -0.61968994140625, -0.5996170043945312, -0.5795440673828125, -0.5594711303710938, -0.539398193359375, -0.5193252563476562, -0.4992523193359375, -0.47917938232421875, -0.4591064453125, -0.43903350830078125, -0.4189605712890625, -0.39888763427734375, -0.378814697265625, -0.35874176025390625, -0.3386688232421875, -0.31859588623046875, -0.29852294921875, -0.27845001220703125, -0.2583770751953125, -0.23830413818359375, -0.218231201171875, -0.19815826416015625, -0.1780853271484375, -0.15801239013671875, -0.137939453125, -0.11786651611328125, -0.0977935791015625, -0.07772064208984375, -0.057647705078125, -0.03757476806640625, -0.0175018310546875, 0.00257110595703125, 0.02264404296875, 0.04271697998046875, 0.0627899169921875, 0.08286285400390625, 0.102935791015625, 0.12300872802734375, 0.1430816650390625, 0.16315460205078125, 0.1832275390625, 0.20330047607421875, 0.2233734130859375, 0.24344635009765625, 0.263519287109375, 0.28359222412109375, 0.3036651611328125, 0.32373809814453125, 0.34381103515625, 0.36388397216796875, 0.3839569091796875, 0.40402984619140625, 0.424102783203125, 0.44417572021484375, 0.4642486572265625, 0.48432159423828125, 0.50439453125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 11.0, 6.0, 5.0, 12.0, 13.0, 18.0, 50.0, 54.0, 117.0, 360.0, 2359.0, 673.0, 166.0, 86.0, 42.0, 19.0, 22.0, 17.0, 7.0, 6.0, 6.0, 7.0, 2.0, 3.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35302734375, -0.3445549011230469, -0.33608245849609375, -0.3276100158691406, -0.3191375732421875, -0.3106651306152344, -0.30219268798828125, -0.2937202453613281, -0.285247802734375, -0.2767753601074219, -0.26830291748046875, -0.2598304748535156, -0.2513580322265625, -0.24288558959960938, -0.23441314697265625, -0.22594070434570312, -0.21746826171875, -0.20899581909179688, -0.20052337646484375, -0.19205093383789062, -0.1835784912109375, -0.17510604858398438, -0.16663360595703125, -0.15816116333007812, -0.149688720703125, -0.14121627807617188, -0.13274383544921875, -0.12427139282226562, -0.1157989501953125, -0.10732650756835938, -0.09885406494140625, -0.09038162231445312, -0.0819091796875, -0.07343673706054688, -0.06496429443359375, -0.056491851806640625, -0.0480194091796875, -0.039546966552734375, -0.03107452392578125, -0.022602081298828125, -0.014129638671875, -0.005657196044921875, 0.00281524658203125, 0.011287689208984375, 0.0197601318359375, 0.028232574462890625, 0.03670501708984375, 0.045177459716796875, 0.05364990234375, 0.062122344970703125, 0.07059478759765625, 0.07906723022460938, 0.0875396728515625, 0.09601211547851562, 0.10448455810546875, 0.11295700073242188, 0.121429443359375, 0.12990188598632812, 0.13837432861328125, 0.14684677124023438, 0.1553192138671875, 0.16379165649414062, 0.17226409912109375, 0.18073654174804688, 0.189208984375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 17.0, 98.0, 306.0, 358.0, 168.0, 33.0, 11.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9152201414108276, -0.8144505620002747, -0.7136809825897217, -0.6129114031791687, -0.5121418237686157, -0.41137224435806274, -0.31060266494750977, -0.2098330855369568, -0.10906350612640381, -0.00829392671585083, 0.09247565269470215, 0.19324523210525513, 0.2940148115158081, 0.3947843909263611, 0.49555397033691406, 0.596323549747467, 0.69709312915802, 0.797862708568573, 0.898632287979126, 0.999401867389679, 1.100171446800232, 1.2009410858154297, 1.301710605621338, 1.402480125427246, 1.5032497644424438, 1.6040194034576416, 1.7047889232635498, 1.805558443069458, 1.9063280820846558, 2.0070977210998535, 2.1078672409057617, 2.20863676071167, 2.309406280517578, 2.4101758003234863, 2.5109453201293945, 2.611715078353882, 2.71248459815979, 2.8132541179656982, 2.9140238761901855, 3.0147933959960938, 3.115562915802002, 3.21633243560791, 3.3171019554138184, 3.4178717136383057, 3.518641233444214, 3.619410753250122, 3.7201805114746094, 3.8209500312805176, 3.921719551086426, 4.022489070892334, 4.123258590698242, 4.22402811050415, 4.324797630310059, 4.425567626953125, 4.526337146759033, 4.627106666564941, 4.72787618637085, 4.828645706176758, 4.929415225982666, 5.030184745788574, 5.130954742431641, 5.231724262237549, 5.332493782043457, 5.433263301849365, 5.534032821655273]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 11.0, 13.0, 19.0, 14.0, 25.0, 30.0, 36.0, 32.0, 37.0, 60.0, 55.0, 45.0, 60.0, 70.0, 55.0, 41.0, 42.0, 57.0, 48.0, 44.0, 35.0, 30.0, 31.0, 23.0, 16.0, 18.0, 19.0, 10.0, 8.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7623158693313599, -0.7360689640045166, -0.7098220586776733, -0.6835751533508301, -0.6573282480239868, -0.6310813426971436, -0.6048344373703003, -0.5785874724388123, -0.552340567111969, -0.5260936617851257, -0.49984675645828247, -0.4735998511314392, -0.44735291600227356, -0.4211060106754303, -0.39485910534858704, -0.3686121702194214, -0.3423652946949005, -0.31611838936805725, -0.289871484041214, -0.26362454891204834, -0.23737764358520508, -0.21113073825836182, -0.18488383293151855, -0.1586369127035141, -0.13239000737667084, -0.10614309459924698, -0.07989618182182312, -0.05364927649497986, -0.027402363717556, -0.0011554509401321411, 0.02509145438671112, 0.051338374614715576, 0.07758527994155884, 0.1038321927189827, 0.13007910549640656, 0.15632601082324982, 0.18257293105125427, 0.20881983637809753, 0.2350667417049408, 0.26131367683410645, 0.2875605821609497, 0.31380748748779297, 0.34005439281463623, 0.3663012981414795, 0.39254823327064514, 0.4187951385974884, 0.44504204392433167, 0.4712889790534973, 0.4975358545780182, 0.5237827897071838, 0.5500296950340271, 0.5762766003608704, 0.6025235056877136, 0.6287704110145569, 0.6550173163414001, 0.6812642216682434, 0.7075111269950867, 0.7337580323219299, 0.7600049376487732, 0.7862518429756165, 0.8124987483024597, 0.8387457132339478, 0.864992618560791, 0.8912395238876343, 0.9174864292144775]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 5.0, 9.0, 14.0, 19.0, 28.0, 33.0, 37.0, 60.0, 107.0, 130.0, 172.0, 317.0, 547.0, 996.0, 2115.0, 5057.0, 16600.0, 86867.0, 601249.0, 279293.0, 38637.0, 9451.0, 3328.0, 1569.0, 731.0, 417.0, 224.0, 163.0, 112.0, 60.0, 47.0, 33.0, 31.0, 24.0, 20.0, 7.0, 9.0, 7.0, 5.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.068359375, -1.0384979248046875, -1.008636474609375, -0.9787750244140625, -0.94891357421875, -0.9190521240234375, -0.889190673828125, -0.8593292236328125, -0.8294677734375, -0.7996063232421875, -0.769744873046875, -0.7398834228515625, -0.71002197265625, -0.6801605224609375, -0.650299072265625, -0.6204376220703125, -0.590576171875, -0.5607147216796875, -0.530853271484375, -0.5009918212890625, -0.47113037109375, -0.4412689208984375, -0.411407470703125, -0.3815460205078125, -0.3516845703125, -0.3218231201171875, -0.291961669921875, -0.2621002197265625, -0.23223876953125, -0.2023773193359375, -0.172515869140625, -0.1426544189453125, -0.11279296875, -0.0829315185546875, -0.053070068359375, -0.0232086181640625, 0.00665283203125, 0.0365142822265625, 0.066375732421875, 0.0962371826171875, 0.1260986328125, 0.1559600830078125, 0.185821533203125, 0.2156829833984375, 0.24554443359375, 0.2754058837890625, 0.305267333984375, 0.3351287841796875, 0.364990234375, 0.3948516845703125, 0.424713134765625, 0.4545745849609375, 0.48443603515625, 0.5142974853515625, 0.544158935546875, 0.5740203857421875, 0.6038818359375, 0.6337432861328125, 0.663604736328125, 0.6934661865234375, 0.72332763671875, 0.7531890869140625, 0.783050537109375, 0.8129119873046875, 0.8427734375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 6.0, 13.0, 16.0, 25.0, 30.0, 36.0, 63.0, 73.0, 120.0, 99.0, 115.0, 95.0, 86.0, 56.0, 43.0, 37.0, 28.0, 24.0, 11.0, 4.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1993408203125, -0.19330787658691406, -0.18727493286132812, -0.1812419891357422, -0.17520904541015625, -0.1691761016845703, -0.16314315795898438, -0.15711021423339844, -0.1510772705078125, -0.14504432678222656, -0.13901138305664062, -0.1329784393310547, -0.12694549560546875, -0.12091255187988281, -0.11487960815429688, -0.10884666442871094, -0.102813720703125, -0.09678077697753906, -0.09074783325195312, -0.08471488952636719, -0.07868194580078125, -0.07264900207519531, -0.06661605834960938, -0.06058311462402344, -0.0545501708984375, -0.04851722717285156, -0.042484283447265625, -0.03645133972167969, -0.03041839599609375, -0.024385452270507812, -0.018352508544921875, -0.012319564819335938, -0.00628662109375, -0.0002536773681640625, 0.005779266357421875, 0.011812210083007812, 0.01784515380859375, 0.023878097534179688, 0.029911041259765625, 0.03594398498535156, 0.0419769287109375, 0.04800987243652344, 0.054042816162109375, 0.06007575988769531, 0.06610870361328125, 0.07214164733886719, 0.07817459106445312, 0.08420753479003906, 0.090240478515625, 0.09627342224121094, 0.10230636596679688, 0.10833930969238281, 0.11437225341796875, 0.12040519714355469, 0.12643814086914062, 0.13247108459472656, 0.1385040283203125, 0.14453697204589844, 0.15056991577148438, 0.1566028594970703, 0.16263580322265625, 0.1686687469482422, 0.17470169067382812, 0.18073463439941406, 0.186767578125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 9.0, 1.0, 5.0, 6.0, 8.0, 14.0, 26.0, 34.0, 41.0, 77.0, 127.0, 215.0, 371.0, 640.0, 1247.0, 2815.0, 7517.0, 26193.0, 156663.0, 679098.0, 137075.0, 23723.0, 7143.0, 2801.0, 1175.0, 611.0, 343.0, 201.0, 140.0, 58.0, 65.0, 34.0, 25.0, 13.0, 12.0, 11.0, 6.0, 8.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78125, -0.7547378540039062, -0.7282257080078125, -0.7017135620117188, -0.675201416015625, -0.6486892700195312, -0.6221771240234375, -0.5956649780273438, -0.56915283203125, -0.5426406860351562, -0.5161285400390625, -0.48961639404296875, -0.463104248046875, -0.43659210205078125, -0.4100799560546875, -0.38356781005859375, -0.3570556640625, -0.33054351806640625, -0.3040313720703125, -0.27751922607421875, -0.251007080078125, -0.22449493408203125, -0.1979827880859375, -0.17147064208984375, -0.14495849609375, -0.11844635009765625, -0.0919342041015625, -0.06542205810546875, -0.038909912109375, -0.01239776611328125, 0.0141143798828125, 0.04062652587890625, 0.067138671875, 0.09365081787109375, 0.1201629638671875, 0.14667510986328125, 0.173187255859375, 0.19969940185546875, 0.2262115478515625, 0.25272369384765625, 0.27923583984375, 0.30574798583984375, 0.3322601318359375, 0.35877227783203125, 0.385284423828125, 0.41179656982421875, 0.4383087158203125, 0.46482086181640625, 0.4913330078125, 0.5178451538085938, 0.5443572998046875, 0.5708694458007812, 0.597381591796875, 0.6238937377929688, 0.6504058837890625, 0.6769180297851562, 0.70343017578125, 0.7299423217773438, 0.7564544677734375, 0.7829666137695312, 0.809478759765625, 0.8359909057617188, 0.8625030517578125, 0.8890151977539062, 0.91552734375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 3.0, 7.0, 6.0, 10.0, 14.0, 14.0, 11.0, 35.0, 28.0, 41.0, 52.0, 60.0, 59.0, 66.0, 85.0, 75.0, 78.0, 59.0, 51.0, 38.0, 49.0, 34.0, 26.0, 22.0, 19.0, 14.0, 13.0, 11.0, 7.0, 4.0, 3.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5595703125, -0.5363311767578125, -0.513092041015625, -0.4898529052734375, -0.46661376953125, -0.4433746337890625, -0.420135498046875, -0.3968963623046875, -0.3736572265625, -0.3504180908203125, -0.327178955078125, -0.3039398193359375, -0.28070068359375, -0.2574615478515625, -0.234222412109375, -0.2109832763671875, -0.187744140625, -0.1645050048828125, -0.141265869140625, -0.1180267333984375, -0.09478759765625, -0.0715484619140625, -0.048309326171875, -0.0250701904296875, -0.0018310546875, 0.0214080810546875, 0.044647216796875, 0.0678863525390625, 0.09112548828125, 0.1143646240234375, 0.137603759765625, 0.1608428955078125, 0.18408203125, 0.2073211669921875, 0.230560302734375, 0.2537994384765625, 0.27703857421875, 0.3002777099609375, 0.323516845703125, 0.3467559814453125, 0.3699951171875, 0.3932342529296875, 0.416473388671875, 0.4397125244140625, 0.46295166015625, 0.4861907958984375, 0.509429931640625, 0.5326690673828125, 0.555908203125, 0.5791473388671875, 0.602386474609375, 0.6256256103515625, 0.64886474609375, 0.6721038818359375, 0.695343017578125, 0.7185821533203125, 0.7418212890625, 0.7650604248046875, 0.788299560546875, 0.8115386962890625, 0.83477783203125, 0.8580169677734375, 0.881256103515625, 0.9044952392578125, 0.927734375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 10.0, 12.0, 16.0, 50.0, 99.0, 225.0, 564.0, 2404.0, 21323.0, 1003062.0, 17679.0, 2160.0, 539.0, 217.0, 92.0, 38.0, 23.0, 13.0, 4.0, 1.0, 7.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.337890625, -2.252777099609375, -2.16766357421875, -2.082550048828125, -1.9974365234375, -1.912322998046875, -1.82720947265625, -1.742095947265625, -1.656982421875, -1.571868896484375, -1.48675537109375, -1.401641845703125, -1.3165283203125, -1.231414794921875, -1.14630126953125, -1.061187744140625, -0.97607421875, -0.890960693359375, -0.80584716796875, -0.720733642578125, -0.6356201171875, -0.550506591796875, -0.46539306640625, -0.380279541015625, -0.295166015625, -0.210052490234375, -0.12493896484375, -0.039825439453125, 0.0452880859375, 0.130401611328125, 0.21551513671875, 0.300628662109375, 0.3857421875, 0.470855712890625, 0.55596923828125, 0.641082763671875, 0.7261962890625, 0.811309814453125, 0.89642333984375, 0.981536865234375, 1.066650390625, 1.151763916015625, 1.23687744140625, 1.321990966796875, 1.4071044921875, 1.492218017578125, 1.57733154296875, 1.662445068359375, 1.74755859375, 1.832672119140625, 1.91778564453125, 2.002899169921875, 2.0880126953125, 2.173126220703125, 2.25823974609375, 2.343353271484375, 2.428466796875, 2.513580322265625, 2.59869384765625, 2.683807373046875, 2.7689208984375, 2.854034423828125, 2.93914794921875, 3.024261474609375, 3.109375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 7.0, 12.0, 20.0, 26.0, 32.0, 59.0, 61.0, 89.0, 185.0, 145.0, 90.0, 76.0, 63.0, 36.0, 27.0, 23.0, 20.0, 11.0, 4.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0], "bins": [-0.0003962516784667969, -0.0003879815340042114, -0.000379711389541626, -0.00037144124507904053, -0.0003631711006164551, -0.00035490095615386963, -0.0003466308116912842, -0.00033836066722869873, -0.0003300905227661133, -0.00032182037830352783, -0.0003135502338409424, -0.00030528008937835693, -0.0002970099449157715, -0.00028873980045318604, -0.0002804696559906006, -0.00027219951152801514, -0.0002639293670654297, -0.00025565922260284424, -0.0002473890781402588, -0.00023911893367767334, -0.0002308487892150879, -0.00022257864475250244, -0.000214308500289917, -0.00020603835582733154, -0.0001977682113647461, -0.00018949806690216064, -0.0001812279224395752, -0.00017295777797698975, -0.0001646876335144043, -0.00015641748905181885, -0.0001481473445892334, -0.00013987720012664795, -0.0001316070556640625, -0.00012333691120147705, -0.0001150667667388916, -0.00010679662227630615, -9.85264778137207e-05, -9.025633335113525e-05, -8.19861888885498e-05, -7.371604442596436e-05, -6.54458999633789e-05, -5.717575550079346e-05, -4.890561103820801e-05, -4.063546657562256e-05, -3.236532211303711e-05, -2.409517765045166e-05, -1.582503318786621e-05, -7.554888725280762e-06, 7.152557373046875e-07, 8.985400199890137e-06, 1.7255544662475586e-05, 2.5525689125061035e-05, 3.3795833587646484e-05, 4.2065978050231934e-05, 5.033612251281738e-05, 5.860626697540283e-05, 6.687641143798828e-05, 7.514655590057373e-05, 8.341670036315918e-05, 9.168684482574463e-05, 9.995698928833008e-05, 0.00010822713375091553, 0.00011649727821350098, 0.00012476742267608643, 0.00013303756713867188]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 3.0, 2.0, 10.0, 17.0, 44.0, 92.0, 195.0, 408.0, 1117.0, 4942.0, 128589.0, 900524.0, 10029.0, 1581.0, 554.0, 238.0, 108.0, 39.0, 25.0, 15.0, 5.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.107421875, -2.0536041259765625, -1.999786376953125, -1.9459686279296875, -1.89215087890625, -1.8383331298828125, -1.784515380859375, -1.7306976318359375, -1.6768798828125, -1.6230621337890625, -1.569244384765625, -1.5154266357421875, -1.46160888671875, -1.4077911376953125, -1.353973388671875, -1.3001556396484375, -1.246337890625, -1.1925201416015625, -1.138702392578125, -1.0848846435546875, -1.03106689453125, -0.9772491455078125, -0.923431396484375, -0.8696136474609375, -0.8157958984375, -0.7619781494140625, -0.708160400390625, -0.6543426513671875, -0.60052490234375, -0.5467071533203125, -0.492889404296875, -0.4390716552734375, -0.38525390625, -0.3314361572265625, -0.277618408203125, -0.2238006591796875, -0.16998291015625, -0.1161651611328125, -0.062347412109375, -0.0085296630859375, 0.0452880859375, 0.0991058349609375, 0.152923583984375, 0.2067413330078125, 0.26055908203125, 0.3143768310546875, 0.368194580078125, 0.4220123291015625, 0.475830078125, 0.5296478271484375, 0.583465576171875, 0.6372833251953125, 0.69110107421875, 0.7449188232421875, 0.798736572265625, 0.8525543212890625, 0.9063720703125, 0.9601898193359375, 1.014007568359375, 1.0678253173828125, 1.12164306640625, 1.1754608154296875, 1.229278564453125, 1.2830963134765625, 1.3369140625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 4.0, 3.0, 5.0, 8.0, 11.0, 23.0, 29.0, 82.0, 165.0, 381.0, 151.0, 60.0, 20.0, 13.0, 11.0, 5.0, 5.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.611328125, -1.5733261108398438, -1.5353240966796875, -1.4973220825195312, -1.459320068359375, -1.4213180541992188, -1.3833160400390625, -1.3453140258789062, -1.30731201171875, -1.2693099975585938, -1.2313079833984375, -1.1933059692382812, -1.155303955078125, -1.1173019409179688, -1.0792999267578125, -1.0412979125976562, -1.0032958984375, -0.9652938842773438, -0.9272918701171875, -0.8892898559570312, -0.851287841796875, -0.8132858276367188, -0.7752838134765625, -0.7372817993164062, -0.69927978515625, -0.6612777709960938, -0.6232757568359375, -0.5852737426757812, -0.547271728515625, -0.5092697143554688, -0.4712677001953125, -0.43326568603515625, -0.395263671875, -0.35726165771484375, -0.3192596435546875, -0.28125762939453125, -0.243255615234375, -0.20525360107421875, -0.1672515869140625, -0.12924957275390625, -0.09124755859375, -0.05324554443359375, -0.0152435302734375, 0.02275848388671875, 0.060760498046875, 0.09876251220703125, 0.1367645263671875, 0.17476654052734375, 0.2127685546875, 0.25077056884765625, 0.2887725830078125, 0.32677459716796875, 0.364776611328125, 0.40277862548828125, 0.4407806396484375, 0.47878265380859375, 0.51678466796875, 0.5547866821289062, 0.5927886962890625, 0.6307907104492188, 0.668792724609375, 0.7067947387695312, 0.7447967529296875, 0.7827987670898438, 0.82080078125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 7.0, 18.0, 41.0, 88.0, 178.0, 263.0, 200.0, 110.0, 48.0, 30.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.211750030517578, -15.74354362487793, -15.275337219238281, -14.807130813598633, -14.338924407958984, -13.870718002319336, -13.402511596679688, -12.934305191040039, -12.46609878540039, -11.997892379760742, -11.529685974121094, -11.061479568481445, -10.593273162841797, -10.125066757202148, -9.6568603515625, -9.188653945922852, -8.720446586608887, -8.252240180969238, -7.78403377532959, -7.315827369689941, -6.847620964050293, -6.3794145584106445, -5.911207675933838, -5.4430012702941895, -4.974794864654541, -4.506588459014893, -4.038382053375244, -3.5701754093170166, -3.101969003677368, -2.6337625980377197, -2.165555953979492, -1.6973495483398438, -1.2291440963745117, -0.7609376311302185, -0.2927311658859253, 0.1754753589630127, 0.6436817646026611, 1.1118881702423096, 1.580094814300537, 2.0483012199401855, 2.516507625579834, 2.9847140312194824, 3.452920436859131, 3.9211270809173584, 4.389333724975586, 4.857540130615234, 5.325746536254883, 5.793952941894531, 6.26215934753418, 6.730365753173828, 7.198572158813477, 7.666778564453125, 8.134984970092773, 8.603191375732422, 9.07139778137207, 9.539604187011719, 10.007810592651367, 10.476016998291016, 10.944223403930664, 11.412429809570312, 11.880636215209961, 12.34884262084961, 12.817049026489258, 13.285255432128906, 13.753462791442871]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 6.0, 7.0, 11.0, 12.0, 16.0, 26.0, 19.0, 26.0, 35.0, 34.0, 35.0, 45.0, 48.0, 42.0, 58.0, 64.0, 67.0, 50.0, 65.0, 51.0, 51.0, 47.0, 46.0, 26.0, 26.0, 24.0, 13.0, 13.0, 12.0, 13.0, 6.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.072422504425049, -5.903326034545898, -5.73422908782959, -5.5651326179504395, -5.396036148071289, -5.2269392013549805, -5.05784273147583, -4.88874626159668, -4.719649314880371, -4.550552845001221, -4.381455898284912, -4.212359428405762, -4.043262958526611, -3.8741660118103027, -3.7050695419311523, -3.535972833633423, -3.3668763637542725, -3.197779655456543, -3.0286831855773926, -2.859586477279663, -2.6904897689819336, -2.521393299102783, -2.3522965908050537, -2.183199882507324, -2.014103412628174, -1.8450068235397339, -1.6759101152420044, -1.5068135261535645, -1.337716817855835, -1.168620228767395, -0.9995236396789551, -0.8304269313812256, -0.6613302230834961, -0.4922335743904114, -0.32313695549964905, -0.15404033660888672, 0.015056312084197998, 0.18415296077728271, 0.35324954986572266, 0.5223462581634521, 0.6914428472518921, 0.8605394959449768, 1.0296361446380615, 1.1987327337265015, 1.3678293228149414, 1.536926031112671, 1.7060226202011108, 1.8751193284988403, 2.0442159175872803, 2.2133126258850098, 2.38240909576416, 2.5515058040618896, 2.720602512359619, 2.8896989822387695, 3.058795690536499, 3.2278923988342285, 3.396988868713379, 3.5660855770111084, 3.735182046890259, 3.9042787551879883, 4.073375225067139, 4.242472171783447, 4.411568641662598, 4.580665588378906, 4.749762058258057]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 5.0, 9.0, 6.0, 7.0, 13.0, 20.0, 26.0, 24.0, 40.0, 76.0, 108.0, 135.0, 257.0, 411.0, 683.0, 1219.0, 2363.0, 4969.0, 12908.0, 45721.0, 491541.0, 3501123.0, 98106.0, 20818.0, 7063.0, 3094.0, 1498.0, 777.0, 501.0, 291.0, 173.0, 86.0, 84.0, 37.0, 29.0, 14.0, 16.0, 6.0, 6.0, 0.0, 3.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.77197265625, -0.7472381591796875, -0.722503662109375, -0.6977691650390625, -0.67303466796875, -0.6483001708984375, -0.623565673828125, -0.5988311767578125, -0.5740966796875, -0.5493621826171875, -0.524627685546875, -0.4998931884765625, -0.47515869140625, -0.4504241943359375, -0.425689697265625, -0.4009552001953125, -0.376220703125, -0.3514862060546875, -0.326751708984375, -0.3020172119140625, -0.27728271484375, -0.2525482177734375, -0.227813720703125, -0.2030792236328125, -0.1783447265625, -0.1536102294921875, -0.128875732421875, -0.1041412353515625, -0.07940673828125, -0.0546722412109375, -0.029937744140625, -0.0052032470703125, 0.01953125, 0.0442657470703125, 0.069000244140625, 0.0937347412109375, 0.11846923828125, 0.1432037353515625, 0.167938232421875, 0.1926727294921875, 0.2174072265625, 0.2421417236328125, 0.266876220703125, 0.2916107177734375, 0.31634521484375, 0.3410797119140625, 0.365814208984375, 0.3905487060546875, 0.415283203125, 0.4400177001953125, 0.464752197265625, 0.4894866943359375, 0.51422119140625, 0.5389556884765625, 0.563690185546875, 0.5884246826171875, 0.6131591796875, 0.6378936767578125, 0.662628173828125, 0.6873626708984375, 0.71209716796875, 0.7368316650390625, 0.761566162109375, 0.7863006591796875, 0.81103515625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 13.0, 8.0, 14.0, 26.0, 22.0, 30.0, 40.0, 43.0, 65.0, 71.0, 82.0, 94.0, 78.0, 83.0, 76.0, 58.0, 51.0, 37.0, 32.0, 23.0, 14.0, 11.0, 7.0, 3.0, 4.0, 2.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2034912109375, -0.19744491577148438, -0.19139862060546875, -0.18535232543945312, -0.1793060302734375, -0.17325973510742188, -0.16721343994140625, -0.16116714477539062, -0.155120849609375, -0.14907455444335938, -0.14302825927734375, -0.13698196411132812, -0.1309356689453125, -0.12488937377929688, -0.11884307861328125, -0.11279678344726562, -0.10675048828125, -0.10070419311523438, -0.09465789794921875, -0.08861160278320312, -0.0825653076171875, -0.07651901245117188, -0.07047271728515625, -0.06442642211914062, -0.058380126953125, -0.052333831787109375, -0.04628753662109375, -0.040241241455078125, -0.0341949462890625, -0.028148651123046875, -0.02210235595703125, -0.016056060791015625, -0.010009765625, -0.003963470458984375, 0.00208282470703125, 0.008129119873046875, 0.0141754150390625, 0.020221710205078125, 0.02626800537109375, 0.032314300537109375, 0.038360595703125, 0.044406890869140625, 0.05045318603515625, 0.056499481201171875, 0.0625457763671875, 0.06859207153320312, 0.07463836669921875, 0.08068466186523438, 0.08673095703125, 0.09277725219726562, 0.09882354736328125, 0.10486984252929688, 0.1109161376953125, 0.11696243286132812, 0.12300872802734375, 0.12905502319335938, 0.135101318359375, 0.14114761352539062, 0.14719390869140625, 0.15324020385742188, 0.1592864990234375, 0.16533279418945312, 0.17137908935546875, 0.17742538452148438, 0.1834716796875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 9.0, 11.0, 12.0, 14.0, 19.0, 39.0, 40.0, 74.0, 84.0, 96.0, 153.0, 217.0, 339.0, 486.0, 766.0, 1296.0, 2682.0, 6343.0, 18375.0, 91674.0, 3406612.0, 597014.0, 46198.0, 12085.0, 4525.0, 2018.0, 1086.0, 636.0, 416.0, 280.0, 201.0, 140.0, 95.0, 72.0, 44.0, 45.0, 19.0, 19.0, 11.0, 13.0, 8.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.84619140625, -0.8187332153320312, -0.7912750244140625, -0.7638168334960938, -0.736358642578125, -0.7089004516601562, -0.6814422607421875, -0.6539840698242188, -0.62652587890625, -0.5990676879882812, -0.5716094970703125, -0.5441513061523438, -0.516693115234375, -0.48923492431640625, -0.4617767333984375, -0.43431854248046875, -0.4068603515625, -0.37940216064453125, -0.3519439697265625, -0.32448577880859375, -0.297027587890625, -0.26956939697265625, -0.2421112060546875, -0.21465301513671875, -0.18719482421875, -0.15973663330078125, -0.1322784423828125, -0.10482025146484375, -0.077362060546875, -0.04990386962890625, -0.0224456787109375, 0.00501251220703125, 0.032470703125, 0.05992889404296875, 0.0873870849609375, 0.11484527587890625, 0.142303466796875, 0.16976165771484375, 0.1972198486328125, 0.22467803955078125, 0.25213623046875, 0.27959442138671875, 0.3070526123046875, 0.33451080322265625, 0.361968994140625, 0.38942718505859375, 0.4168853759765625, 0.44434356689453125, 0.4718017578125, 0.49925994873046875, 0.5267181396484375, 0.5541763305664062, 0.581634521484375, 0.6090927124023438, 0.6365509033203125, 0.6640090942382812, 0.69146728515625, 0.7189254760742188, 0.7463836669921875, 0.7738418579101562, 0.801300048828125, 0.8287582397460938, 0.8562164306640625, 0.8836746215820312, 0.9111328125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 12.0, 8.0, 11.0, 26.0, 40.0, 96.0, 232.0, 1739.0, 1460.0, 239.0, 87.0, 40.0, 22.0, 14.0, 9.0, 8.0, 4.0, 9.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57080078125, -0.5503997802734375, -0.529998779296875, -0.5095977783203125, -0.48919677734375, -0.4687957763671875, -0.448394775390625, -0.4279937744140625, -0.4075927734375, -0.3871917724609375, -0.366790771484375, -0.3463897705078125, -0.32598876953125, -0.3055877685546875, -0.285186767578125, -0.2647857666015625, -0.244384765625, -0.2239837646484375, -0.203582763671875, -0.1831817626953125, -0.16278076171875, -0.1423797607421875, -0.121978759765625, -0.1015777587890625, -0.0811767578125, -0.0607757568359375, -0.040374755859375, -0.0199737548828125, 0.00042724609375, 0.0208282470703125, 0.041229248046875, 0.0616302490234375, 0.08203125, 0.1024322509765625, 0.122833251953125, 0.1432342529296875, 0.16363525390625, 0.1840362548828125, 0.204437255859375, 0.2248382568359375, 0.2452392578125, 0.2656402587890625, 0.286041259765625, 0.3064422607421875, 0.32684326171875, 0.3472442626953125, 0.367645263671875, 0.3880462646484375, 0.408447265625, 0.4288482666015625, 0.449249267578125, 0.4696502685546875, 0.49005126953125, 0.5104522705078125, 0.530853271484375, 0.5512542724609375, 0.5716552734375, 0.5920562744140625, 0.612457275390625, 0.6328582763671875, 0.65325927734375, 0.6736602783203125, 0.694061279296875, 0.7144622802734375, 0.73486328125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 11.0, 21.0, 45.0, 72.0, 115.0, 159.0, 194.0, 152.0, 82.0, 64.0, 35.0, 20.0, 9.0, 13.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.5355024337768555, -4.439301490783691, -4.343100547790527, -4.246899604797363, -4.150698661804199, -4.054497718811035, -3.958296775817871, -3.862095832824707, -3.765894889831543, -3.669693946838379, -3.573493003845215, -3.477292060852051, -3.3810911178588867, -3.2848901748657227, -3.1886892318725586, -3.0924882888793945, -2.9962873458862305, -2.9000864028930664, -2.8038854598999023, -2.7076845169067383, -2.611483573913574, -2.51528263092041, -2.419081687927246, -2.322880744934082, -2.226679801940918, -2.130478858947754, -2.03427791595459, -1.9380769729614258, -1.8418760299682617, -1.7456750869750977, -1.6494741439819336, -1.5532732009887695, -1.4570720195770264, -1.3608710765838623, -1.2646701335906982, -1.1684691905975342, -1.0722682476043701, -0.976067304611206, -0.879866361618042, -0.7836654186248779, -0.6874644756317139, -0.5912635326385498, -0.49506258964538574, -0.3988616466522217, -0.3026607036590576, -0.20645976066589355, -0.11025881767272949, -0.01405787467956543, 0.08214306831359863, 0.1783440113067627, 0.27454495429992676, 0.3707458972930908, 0.4669468402862549, 0.563147783279419, 0.659348726272583, 0.7555496692657471, 0.8517506122589111, 0.9479515552520752, 1.0441524982452393, 1.1403534412384033, 1.2365543842315674, 1.3327553272247314, 1.4289562702178955, 1.5251572132110596, 1.6213581562042236]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 0.0, 2.0, 6.0, 5.0, 7.0, 10.0, 17.0, 15.0, 19.0, 29.0, 28.0, 29.0, 24.0, 32.0, 36.0, 35.0, 41.0, 41.0, 35.0, 45.0, 45.0, 62.0, 56.0, 50.0, 48.0, 45.0, 43.0, 30.0, 33.0, 29.0, 16.0, 9.0, 18.0, 13.0, 17.0, 8.0, 5.0, 5.0, 5.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.5683906078338623, -1.5192416906356812, -1.4700926542282104, -1.4209437370300293, -1.3717948198318481, -1.3226457834243774, -1.2734968662261963, -1.2243478298187256, -1.1751989126205444, -1.1260499954223633, -1.0769009590148926, -1.0277520418167114, -0.9786030650138855, -0.9294540882110596, -0.8803051710128784, -0.8311561942100525, -0.7820072770118713, -0.7328583002090454, -0.6837093830108643, -0.6345604062080383, -0.5854114294052124, -0.5362625122070312, -0.4871135354042053, -0.4379645586013794, -0.38881561160087585, -0.3396666646003723, -0.2905176877975464, -0.24136874079704285, -0.1922197788953781, -0.14307081699371338, -0.09392186999320984, -0.04477289319038391, 0.004376053810119629, 0.053525011986494064, 0.1026739701628685, 0.15182292461395264, 0.20097188651561737, 0.2501208484172821, 0.29926979541778564, 0.3484187722206116, 0.3975677192211151, 0.44671666622161865, 0.4958656430244446, 0.5450146198272705, 0.5941635370254517, 0.6433125138282776, 0.6924614906311035, 0.7416104078292847, 0.7907593846321106, 0.8399083614349365, 0.8890572786331177, 0.9382062554359436, 0.9873552322387695, 1.0365041494369507, 1.0856530666351318, 1.1348021030426025, 1.1839510202407837, 1.2330999374389648, 1.2822489738464355, 1.3313978910446167, 1.3805468082427979, 1.4296958446502686, 1.4788447618484497, 1.5279936790466309, 1.5771427154541016]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 7.0, 11.0, 13.0, 24.0, 29.0, 42.0, 74.0, 129.0, 166.0, 298.0, 473.0, 895.0, 1823.0, 4058.0, 10510.0, 31580.0, 121796.0, 451201.0, 316282.0, 74322.0, 21097.0, 7441.0, 3064.0, 1441.0, 752.0, 378.0, 253.0, 120.0, 85.0, 57.0, 35.0, 33.0, 16.0, 15.0, 13.0, 6.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74755859375, -0.7206954956054688, -0.6938323974609375, -0.6669692993164062, -0.640106201171875, -0.6132431030273438, -0.5863800048828125, -0.5595169067382812, -0.53265380859375, -0.5057907104492188, -0.4789276123046875, -0.45206451416015625, -0.425201416015625, -0.39833831787109375, -0.3714752197265625, -0.34461212158203125, -0.3177490234375, -0.29088592529296875, -0.2640228271484375, -0.23715972900390625, -0.210296630859375, -0.18343353271484375, -0.1565704345703125, -0.12970733642578125, -0.10284423828125, -0.07598114013671875, -0.0491180419921875, -0.02225494384765625, 0.004608154296875, 0.03147125244140625, 0.0583343505859375, 0.08519744873046875, 0.112060546875, 0.13892364501953125, 0.1657867431640625, 0.19264984130859375, 0.219512939453125, 0.24637603759765625, 0.2732391357421875, 0.30010223388671875, 0.32696533203125, 0.35382843017578125, 0.3806915283203125, 0.40755462646484375, 0.434417724609375, 0.46128082275390625, 0.4881439208984375, 0.5150070190429688, 0.5418701171875, 0.5687332153320312, 0.5955963134765625, 0.6224594116210938, 0.649322509765625, 0.6761856079101562, 0.7030487060546875, 0.7299118041992188, 0.75677490234375, 0.7836380004882812, 0.8105010986328125, 0.8373641967773438, 0.864227294921875, 0.8910903930664062, 0.9179534912109375, 0.9448165893554688, 0.9716796875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 6.0, 9.0, 8.0, 20.0, 25.0, 37.0, 35.0, 40.0, 64.0, 79.0, 68.0, 77.0, 80.0, 76.0, 74.0, 52.0, 70.0, 55.0, 29.0, 34.0, 22.0, 6.0, 7.0, 5.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.209228515625, -0.20291709899902344, -0.19660568237304688, -0.1902942657470703, -0.18398284912109375, -0.1776714324951172, -0.17136001586914062, -0.16504859924316406, -0.1587371826171875, -0.15242576599121094, -0.14611434936523438, -0.1398029327392578, -0.13349151611328125, -0.1271800994873047, -0.12086868286132812, -0.11455726623535156, -0.108245849609375, -0.10193443298339844, -0.09562301635742188, -0.08931159973144531, -0.08300018310546875, -0.07668876647949219, -0.07037734985351562, -0.06406593322753906, -0.0577545166015625, -0.05144309997558594, -0.045131683349609375, -0.03882026672363281, -0.03250885009765625, -0.026197433471679688, -0.019886016845703125, -0.013574600219726562, -0.00726318359375, -0.0009517669677734375, 0.005359649658203125, 0.011671066284179688, 0.01798248291015625, 0.024293899536132812, 0.030605316162109375, 0.03691673278808594, 0.0432281494140625, 0.04953956604003906, 0.055850982666015625, 0.06216239929199219, 0.06847381591796875, 0.07478523254394531, 0.08109664916992188, 0.08740806579589844, 0.093719482421875, 0.10003089904785156, 0.10634231567382812, 0.11265373229980469, 0.11896514892578125, 0.1252765655517578, 0.13158798217773438, 0.13789939880371094, 0.1442108154296875, 0.15052223205566406, 0.15683364868164062, 0.1631450653076172, 0.16945648193359375, 0.1757678985595703, 0.18207931518554688, 0.18839073181152344, 0.1947021484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 16.0, 7.0, 17.0, 21.0, 32.0, 51.0, 85.0, 105.0, 189.0, 326.0, 518.0, 917.0, 1919.0, 3869.0, 9382.0, 25890.0, 89283.0, 373691.0, 399859.0, 96816.0, 27295.0, 9890.0, 4076.0, 1912.0, 1015.0, 526.0, 321.0, 191.0, 114.0, 76.0, 41.0, 29.0, 24.0, 14.0, 10.0, 5.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8359375, -0.8098373413085938, -0.7837371826171875, -0.7576370239257812, -0.731536865234375, -0.7054367065429688, -0.6793365478515625, -0.6532363891601562, -0.62713623046875, -0.6010360717773438, -0.5749359130859375, -0.5488357543945312, -0.522735595703125, -0.49663543701171875, -0.4705352783203125, -0.44443511962890625, -0.4183349609375, -0.39223480224609375, -0.3661346435546875, -0.34003448486328125, -0.313934326171875, -0.28783416748046875, -0.2617340087890625, -0.23563385009765625, -0.20953369140625, -0.18343353271484375, -0.1573333740234375, -0.13123321533203125, -0.105133056640625, -0.07903289794921875, -0.0529327392578125, -0.02683258056640625, -0.000732421875, 0.02536773681640625, 0.0514678955078125, 0.07756805419921875, 0.103668212890625, 0.12976837158203125, 0.1558685302734375, 0.18196868896484375, 0.20806884765625, 0.23416900634765625, 0.2602691650390625, 0.28636932373046875, 0.312469482421875, 0.33856964111328125, 0.3646697998046875, 0.39076995849609375, 0.4168701171875, 0.44297027587890625, 0.4690704345703125, 0.49517059326171875, 0.521270751953125, 0.5473709106445312, 0.5734710693359375, 0.5995712280273438, 0.62567138671875, 0.6517715454101562, 0.6778717041015625, 0.7039718627929688, 0.730072021484375, 0.7561721801757812, 0.7822723388671875, 0.8083724975585938, 0.83447265625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 7.0, 3.0, 5.0, 6.0, 13.0, 11.0, 18.0, 25.0, 21.0, 30.0, 36.0, 52.0, 53.0, 59.0, 58.0, 52.0, 74.0, 57.0, 49.0, 53.0, 54.0, 52.0, 39.0, 36.0, 28.0, 21.0, 21.0, 13.0, 16.0, 15.0, 5.0, 6.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1806640625, -1.1495437622070312, -1.1184234619140625, -1.0873031616210938, -1.056182861328125, -1.0250625610351562, -0.9939422607421875, -0.9628219604492188, -0.93170166015625, -0.9005813598632812, -0.8694610595703125, -0.8383407592773438, -0.807220458984375, -0.7761001586914062, -0.7449798583984375, -0.7138595581054688, -0.6827392578125, -0.6516189575195312, -0.6204986572265625, -0.5893783569335938, -0.558258056640625, -0.5271377563476562, -0.4960174560546875, -0.46489715576171875, -0.43377685546875, -0.40265655517578125, -0.3715362548828125, -0.34041595458984375, -0.309295654296875, -0.27817535400390625, -0.2470550537109375, -0.21593475341796875, -0.184814453125, -0.15369415283203125, -0.1225738525390625, -0.09145355224609375, -0.060333251953125, -0.02921295166015625, 0.0019073486328125, 0.03302764892578125, 0.06414794921875, 0.09526824951171875, 0.1263885498046875, 0.15750885009765625, 0.188629150390625, 0.21974945068359375, 0.2508697509765625, 0.28199005126953125, 0.3131103515625, 0.34423065185546875, 0.3753509521484375, 0.40647125244140625, 0.437591552734375, 0.46871185302734375, 0.4998321533203125, 0.5309524536132812, 0.56207275390625, 0.5931930541992188, 0.6243133544921875, 0.6554336547851562, 0.686553955078125, 0.7176742553710938, 0.7487945556640625, 0.7799148559570312, 0.81103515625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 12.0, 19.0, 21.0, 31.0, 75.0, 133.0, 288.0, 773.0, 3429.0, 46658.0, 954680.0, 37961.0, 3158.0, 779.0, 266.0, 121.0, 61.0, 32.0, 19.0, 11.0, 7.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4638671875, -1.3987274169921875, -1.333587646484375, -1.2684478759765625, -1.20330810546875, -1.1381683349609375, -1.073028564453125, -1.0078887939453125, -0.9427490234375, -0.8776092529296875, -0.812469482421875, -0.7473297119140625, -0.68218994140625, -0.6170501708984375, -0.551910400390625, -0.4867706298828125, -0.421630859375, -0.3564910888671875, -0.291351318359375, -0.2262115478515625, -0.16107177734375, -0.0959320068359375, -0.030792236328125, 0.0343475341796875, 0.0994873046875, 0.1646270751953125, 0.229766845703125, 0.2949066162109375, 0.36004638671875, 0.4251861572265625, 0.490325927734375, 0.5554656982421875, 0.62060546875, 0.6857452392578125, 0.750885009765625, 0.8160247802734375, 0.88116455078125, 0.9463043212890625, 1.011444091796875, 1.0765838623046875, 1.1417236328125, 1.2068634033203125, 1.272003173828125, 1.3371429443359375, 1.40228271484375, 1.4674224853515625, 1.532562255859375, 1.5977020263671875, 1.662841796875, 1.7279815673828125, 1.793121337890625, 1.8582611083984375, 1.92340087890625, 1.9885406494140625, 2.053680419921875, 2.1188201904296875, 2.1839599609375, 2.2490997314453125, 2.314239501953125, 2.3793792724609375, 2.44451904296875, 2.5096588134765625, 2.574798583984375, 2.6399383544921875, 2.705078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 5.0, 9.0, 11.0, 13.0, 15.0, 31.0, 39.0, 54.0, 61.0, 65.0, 105.0, 90.0, 91.0, 84.0, 78.0, 56.0, 52.0, 30.0, 28.0, 24.0, 19.0, 8.0, 9.0, 10.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00022912025451660156, -0.00022213906049728394, -0.0002151578664779663, -0.00020817667245864868, -0.00020119547843933105, -0.00019421428442001343, -0.0001872330904006958, -0.00018025189638137817, -0.00017327070236206055, -0.00016628950834274292, -0.0001593083143234253, -0.00015232712030410767, -0.00014534592628479004, -0.0001383647322654724, -0.00013138353824615479, -0.00012440234422683716, -0.00011742115020751953, -0.0001104399561882019, -0.00010345876216888428, -9.647756814956665e-05, -8.949637413024902e-05, -8.25151801109314e-05, -7.553398609161377e-05, -6.855279207229614e-05, -6.157159805297852e-05, -5.459040403366089e-05, -4.760921001434326e-05, -4.0628015995025635e-05, -3.364682197570801e-05, -2.666562795639038e-05, -1.9684433937072754e-05, -1.2703239917755127e-05, -5.7220458984375e-06, 1.259148120880127e-06, 8.240342140197754e-06, 1.5221536159515381e-05, 2.2202730178833008e-05, 2.9183924198150635e-05, 3.616511821746826e-05, 4.314631223678589e-05, 5.0127506256103516e-05, 5.710870027542114e-05, 6.408989429473877e-05, 7.10710883140564e-05, 7.805228233337402e-05, 8.503347635269165e-05, 9.201467037200928e-05, 9.89958643913269e-05, 0.00010597705841064453, 0.00011295825242996216, 0.00011993944644927979, 0.0001269206404685974, 0.00013390183448791504, 0.00014088302850723267, 0.0001478642225265503, 0.00015484541654586792, 0.00016182661056518555, 0.00016880780458450317, 0.0001757889986038208, 0.00018277019262313843, 0.00018975138664245605, 0.00019673258066177368, 0.0002037137746810913, 0.00021069496870040894, 0.00021767616271972656]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 7.0, 6.0, 12.0, 6.0, 8.0, 12.0, 31.0, 30.0, 50.0, 66.0, 114.0, 163.0, 280.0, 443.0, 847.0, 1677.0, 3831.0, 11054.0, 42956.0, 290257.0, 591866.0, 78081.0, 16864.0, 5235.0, 2148.0, 1022.0, 541.0, 325.0, 192.0, 131.0, 78.0, 64.0, 49.0, 31.0, 24.0, 16.0, 12.0, 7.0, 7.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6748046875, -0.6538314819335938, -0.6328582763671875, -0.6118850708007812, -0.590911865234375, -0.5699386596679688, -0.5489654541015625, -0.5279922485351562, -0.50701904296875, -0.48604583740234375, -0.4650726318359375, -0.44409942626953125, -0.423126220703125, -0.40215301513671875, -0.3811798095703125, -0.36020660400390625, -0.3392333984375, -0.31826019287109375, -0.2972869873046875, -0.27631378173828125, -0.255340576171875, -0.23436737060546875, -0.2133941650390625, -0.19242095947265625, -0.17144775390625, -0.15047454833984375, -0.1295013427734375, -0.10852813720703125, -0.087554931640625, -0.06658172607421875, -0.0456085205078125, -0.02463531494140625, -0.003662109375, 0.01731109619140625, 0.0382843017578125, 0.05925750732421875, 0.080230712890625, 0.10120391845703125, 0.1221771240234375, 0.14315032958984375, 0.16412353515625, 0.18509674072265625, 0.2060699462890625, 0.22704315185546875, 0.248016357421875, 0.26898956298828125, 0.2899627685546875, 0.31093597412109375, 0.3319091796875, 0.35288238525390625, 0.3738555908203125, 0.39482879638671875, 0.415802001953125, 0.43677520751953125, 0.4577484130859375, 0.47872161865234375, 0.49969482421875, 0.5206680297851562, 0.5416412353515625, 0.5626144409179688, 0.583587646484375, 0.6045608520507812, 0.6255340576171875, 0.6465072631835938, 0.66748046875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 3.0, 4.0, 5.0, 10.0, 3.0, 12.0, 6.0, 18.0, 13.0, 21.0, 21.0, 29.0, 55.0, 63.0, 104.0, 144.0, 111.0, 82.0, 77.0, 40.0, 22.0, 27.0, 20.0, 16.0, 16.0, 13.0, 12.0, 8.0, 5.0, 3.0, 5.0, 5.0, 3.0, 3.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.74951171875, -0.7266616821289062, -0.7038116455078125, -0.6809616088867188, -0.658111572265625, -0.6352615356445312, -0.6124114990234375, -0.5895614624023438, -0.56671142578125, -0.5438613891601562, -0.5210113525390625, -0.49816131591796875, -0.475311279296875, -0.45246124267578125, -0.4296112060546875, -0.40676116943359375, -0.3839111328125, -0.36106109619140625, -0.3382110595703125, -0.31536102294921875, -0.292510986328125, -0.26966094970703125, -0.2468109130859375, -0.22396087646484375, -0.20111083984375, -0.17826080322265625, -0.1554107666015625, -0.13256072998046875, -0.109710693359375, -0.08686065673828125, -0.0640106201171875, -0.04116058349609375, -0.018310546875, 0.00453948974609375, 0.0273895263671875, 0.05023956298828125, 0.073089599609375, 0.09593963623046875, 0.1187896728515625, 0.14163970947265625, 0.16448974609375, 0.18733978271484375, 0.2101898193359375, 0.23303985595703125, 0.255889892578125, 0.27873992919921875, 0.3015899658203125, 0.32444000244140625, 0.3472900390625, 0.37014007568359375, 0.3929901123046875, 0.41584014892578125, 0.438690185546875, 0.46154022216796875, 0.4843902587890625, 0.5072402954101562, 0.53009033203125, 0.5529403686523438, 0.5757904052734375, 0.5986404418945312, 0.621490478515625, 0.6443405151367188, 0.6671905517578125, 0.6900405883789062, 0.712890625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 5.0, 11.0, 38.0, 78.0, 154.0, 201.0, 219.0, 154.0, 75.0, 30.0, 14.0, 12.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.661388397216797, -17.22071075439453, -16.780033111572266, -16.33935546875, -15.898676872253418, -15.457999229431152, -15.01732063293457, -14.576642990112305, -14.135965347290039, -13.695287704467773, -13.254610061645508, -12.813931465148926, -12.37325382232666, -11.932576179504395, -11.491897583007812, -11.051219940185547, -10.610542297363281, -10.169864654541016, -9.72918701171875, -9.288508415222168, -8.847830772399902, -8.407153129577637, -7.966475009918213, -7.525796890258789, -7.085119247436523, -6.644441604614258, -6.203763484954834, -5.76308536529541, -5.3224077224731445, -4.881730079650879, -4.441051959991455, -4.000373840332031, -3.559697151184082, -3.1190192699432373, -2.6783413887023926, -2.237663507461548, -1.7969856262207031, -1.3563077449798584, -0.9156298637390137, -0.47495198249816895, -0.03427410125732422, 0.4064037799835205, 0.8470816612243652, 1.28775954246521, 1.7284374237060547, 2.1691153049468994, 2.609793186187744, 3.050471067428589, 3.4911489486694336, 3.9318268299102783, 4.372504711151123, 4.813182830810547, 5.2538604736328125, 5.694538116455078, 6.135216236114502, 6.575894355773926, 7.016571998596191, 7.457249641418457, 7.897927761077881, 8.338605880737305, 8.77928352355957, 9.219961166381836, 9.660638809204102, 10.101317405700684, 10.54199504852295]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 9.0, 7.0, 8.0, 7.0, 8.0, 13.0, 17.0, 22.0, 18.0, 26.0, 26.0, 26.0, 46.0, 29.0, 31.0, 43.0, 42.0, 39.0, 52.0, 48.0, 47.0, 45.0, 48.0, 45.0, 37.0, 30.0, 28.0, 35.0, 28.0, 21.0, 12.0, 15.0, 13.0, 14.0, 13.0, 12.0, 13.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-5.533259391784668, -5.363619327545166, -5.193979263305664, -5.024339199066162, -4.85469913482666, -4.68505859375, -4.515418529510498, -4.345778465270996, -4.176138401031494, -4.006498336791992, -3.8368582725524902, -3.667217969894409, -3.4975779056549072, -3.3279378414154053, -3.158297538757324, -2.9886574745178223, -2.8190174102783203, -2.6493773460388184, -2.4797372817993164, -2.3100969791412354, -2.1404569149017334, -1.9708168506622314, -1.80117666721344, -1.6315364837646484, -1.4618964195251465, -1.2922563552856445, -1.122616171836853, -0.9529760479927063, -0.7833359241485596, -0.6136958003044128, -0.4440556764602661, -0.2744154930114746, -0.10477495193481445, 0.06486517190933228, 0.234505295753479, 0.40414541959762573, 0.5737855434417725, 0.7434256672859192, 0.9130657911300659, 1.0827059745788574, 1.2523460388183594, 1.4219861030578613, 1.5916262865066528, 1.7612664699554443, 1.9309065341949463, 2.1005465984344482, 2.2701869010925293, 2.4398269653320312, 2.609467029571533, 2.779107093811035, 2.948747158050537, 3.118387460708618, 3.28802752494812, 3.457667589187622, 3.627307891845703, 3.796947956085205, 3.966588020324707, 4.136228084564209, 4.305868148803711, 4.475508213043213, 4.645148277282715, 4.814788818359375, 4.984428882598877, 5.154068946838379, 5.323709011077881]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 3.0, 9.0, 17.0, 21.0, 34.0, 41.0, 59.0, 99.0, 112.0, 226.0, 370.0, 572.0, 1023.0, 1867.0, 3831.0, 8784.0, 24810.0, 111151.0, 3804409.0, 183680.0, 32801.0, 10750.0, 4537.0, 2207.0, 1135.0, 651.0, 393.0, 237.0, 149.0, 78.0, 70.0, 48.0, 30.0, 16.0, 11.0, 8.0, 8.0, 7.0, 2.0, 5.0, 6.0, 4.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83935546875, -0.81280517578125, -0.7862548828125, -0.75970458984375, -0.733154296875, -0.70660400390625, -0.6800537109375, -0.65350341796875, -0.626953125, -0.60040283203125, -0.5738525390625, -0.54730224609375, -0.520751953125, -0.49420166015625, -0.4676513671875, -0.44110107421875, -0.41455078125, -0.38800048828125, -0.3614501953125, -0.33489990234375, -0.308349609375, -0.28179931640625, -0.2552490234375, -0.22869873046875, -0.2021484375, -0.17559814453125, -0.1490478515625, -0.12249755859375, -0.095947265625, -0.06939697265625, -0.0428466796875, -0.01629638671875, 0.01025390625, 0.03680419921875, 0.0633544921875, 0.08990478515625, 0.116455078125, 0.14300537109375, 0.1695556640625, 0.19610595703125, 0.22265625, 0.24920654296875, 0.2757568359375, 0.30230712890625, 0.328857421875, 0.35540771484375, 0.3819580078125, 0.40850830078125, 0.43505859375, 0.46160888671875, 0.4881591796875, 0.51470947265625, 0.541259765625, 0.56781005859375, 0.5943603515625, 0.62091064453125, 0.6474609375, 0.67401123046875, 0.7005615234375, 0.72711181640625, 0.753662109375, 0.78021240234375, 0.8067626953125, 0.83331298828125, 0.85986328125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 4.0, 2.0, 3.0, 10.0, 8.0, 14.0, 16.0, 15.0, 21.0, 21.0, 42.0, 33.0, 54.0, 49.0, 67.0, 65.0, 75.0, 85.0, 47.0, 83.0, 44.0, 39.0, 42.0, 34.0, 37.0, 26.0, 15.0, 12.0, 6.0, 14.0, 8.0, 3.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23681640625, -0.23004531860351562, -0.22327423095703125, -0.21650314331054688, -0.2097320556640625, -0.20296096801757812, -0.19618988037109375, -0.18941879272460938, -0.182647705078125, -0.17587661743164062, -0.16910552978515625, -0.16233444213867188, -0.1555633544921875, -0.14879226684570312, -0.14202117919921875, -0.13525009155273438, -0.12847900390625, -0.12170791625976562, -0.11493682861328125, -0.10816574096679688, -0.1013946533203125, -0.09462356567382812, -0.08785247802734375, -0.08108139038085938, -0.074310302734375, -0.06753921508789062, -0.06076812744140625, -0.053997039794921875, -0.0472259521484375, -0.040454864501953125, -0.03368377685546875, -0.026912689208984375, -0.0201416015625, -0.013370513916015625, -0.00659942626953125, 0.000171661376953125, 0.0069427490234375, 0.013713836669921875, 0.02048492431640625, 0.027256011962890625, 0.034027099609375, 0.040798187255859375, 0.04756927490234375, 0.054340362548828125, 0.0611114501953125, 0.06788253784179688, 0.07465362548828125, 0.08142471313476562, 0.08819580078125, 0.09496688842773438, 0.10173797607421875, 0.10850906372070312, 0.1152801513671875, 0.12205123901367188, 0.12882232666015625, 0.13559341430664062, 0.142364501953125, 0.14913558959960938, 0.15590667724609375, 0.16267776489257812, 0.1694488525390625, 0.17621994018554688, 0.18299102783203125, 0.18976211547851562, 0.196533203125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 10.0, 10.0, 11.0, 23.0, 18.0, 29.0, 44.0, 68.0, 89.0, 147.0, 224.0, 334.0, 582.0, 968.0, 1761.0, 3852.0, 10062.0, 44058.0, 3535619.0, 546778.0, 33736.0, 8392.0, 3351.0, 1703.0, 920.0, 543.0, 345.0, 196.0, 130.0, 96.0, 63.0, 39.0, 34.0, 9.0, 9.0, 11.0, 8.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.3349609375, -1.2967376708984375, -1.258514404296875, -1.2202911376953125, -1.18206787109375, -1.1438446044921875, -1.105621337890625, -1.0673980712890625, -1.0291748046875, -0.9909515380859375, -0.952728271484375, -0.9145050048828125, -0.87628173828125, -0.8380584716796875, -0.799835205078125, -0.7616119384765625, -0.723388671875, -0.6851654052734375, -0.646942138671875, -0.6087188720703125, -0.57049560546875, -0.5322723388671875, -0.494049072265625, -0.4558258056640625, -0.4176025390625, -0.3793792724609375, -0.341156005859375, -0.3029327392578125, -0.26470947265625, -0.2264862060546875, -0.188262939453125, -0.1500396728515625, -0.11181640625, -0.0735931396484375, -0.035369873046875, 0.0028533935546875, 0.04107666015625, 0.0792999267578125, 0.117523193359375, 0.1557464599609375, 0.1939697265625, 0.2321929931640625, 0.270416259765625, 0.3086395263671875, 0.34686279296875, 0.3850860595703125, 0.423309326171875, 0.4615325927734375, 0.499755859375, 0.5379791259765625, 0.576202392578125, 0.6144256591796875, 0.65264892578125, 0.6908721923828125, 0.729095458984375, 0.7673187255859375, 0.8055419921875, 0.8437652587890625, 0.881988525390625, 0.9202117919921875, 0.95843505859375, 0.9966583251953125, 1.034881591796875, 1.0731048583984375, 1.111328125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 12.0, 6.0, 23.0, 44.0, 93.0, 328.0, 3125.0, 253.0, 66.0, 40.0, 26.0, 18.0, 8.0, 8.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3525390625, -0.3422966003417969, -0.33205413818359375, -0.3218116760253906, -0.3115692138671875, -0.3013267517089844, -0.29108428955078125, -0.2808418273925781, -0.270599365234375, -0.2603569030761719, -0.25011444091796875, -0.23987197875976562, -0.2296295166015625, -0.21938705444335938, -0.20914459228515625, -0.19890213012695312, -0.18865966796875, -0.17841720581054688, -0.16817474365234375, -0.15793228149414062, -0.1476898193359375, -0.13744735717773438, -0.12720489501953125, -0.11696243286132812, -0.106719970703125, -0.09647750854492188, -0.08623504638671875, -0.07599258422851562, -0.0657501220703125, -0.055507659912109375, -0.04526519775390625, -0.035022735595703125, -0.0247802734375, -0.014537811279296875, -0.00429534912109375, 0.005947113037109375, 0.0161895751953125, 0.026432037353515625, 0.03667449951171875, 0.046916961669921875, 0.057159423828125, 0.06740188598632812, 0.07764434814453125, 0.08788681030273438, 0.0981292724609375, 0.10837173461914062, 0.11861419677734375, 0.12885665893554688, 0.13909912109375, 0.14934158325195312, 0.15958404541015625, 0.16982650756835938, 0.1800689697265625, 0.19031143188476562, 0.20055389404296875, 0.21079635620117188, 0.221038818359375, 0.23128128051757812, 0.24152374267578125, 0.2517662048339844, 0.2620086669921875, 0.2722511291503906, 0.28249359130859375, 0.2927360534667969, 0.302978515625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 13.0, 17.0, 28.0, 37.0, 72.0, 94.0, 130.0, 131.0, 128.0, 127.0, 74.0, 52.0, 32.0, 25.0, 13.0, 6.0, 4.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.006881833076477, -0.9752042293548584, -0.9435266256332397, -0.9118490219116211, -0.8801714181900024, -0.8484938144683838, -0.8168161511421204, -0.7851385474205017, -0.7534609436988831, -0.7217833399772644, -0.6901057362556458, -0.6584281325340271, -0.6267504692077637, -0.595072865486145, -0.5633952617645264, -0.5317176580429077, -0.5000400543212891, -0.4683624505996704, -0.43668484687805176, -0.4050072133541107, -0.37332960963249207, -0.3416520059108734, -0.3099743723869324, -0.2782967686653137, -0.24661916494369507, -0.21494156122207642, -0.18326394259929657, -0.15158632397651672, -0.11990872025489807, -0.08823111653327942, -0.05655349791049957, -0.024875879287719727, 0.006801724433898926, 0.038479335606098175, 0.07015694677829742, 0.10183455795049667, 0.13351216912269592, 0.16518977284431458, 0.19686739146709442, 0.22854501008987427, 0.2602226138114929, 0.2919002175331116, 0.3235778212547302, 0.35525545477867126, 0.3869330585002899, 0.41861066222190857, 0.4502882957458496, 0.48196589946746826, 0.5136435031890869, 0.5453211069107056, 0.5769987106323242, 0.6086763143539429, 0.6403539180755615, 0.6720315217971802, 0.7037091851234436, 0.7353867888450623, 0.7670643925666809, 0.7987419962882996, 0.8304196000099182, 0.8620972037315369, 0.8937748670578003, 0.925452470779419, 0.9571300745010376, 0.9888076782226562, 1.020485281944275]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 7.0, 6.0, 3.0, 8.0, 10.0, 7.0, 14.0, 18.0, 25.0, 17.0, 16.0, 23.0, 40.0, 30.0, 30.0, 35.0, 39.0, 37.0, 44.0, 56.0, 27.0, 53.0, 48.0, 41.0, 41.0, 38.0, 37.0, 29.0, 29.0, 30.0, 24.0, 18.0, 14.0, 16.0, 22.0, 13.0, 9.0, 11.0, 6.0, 8.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5253311991691589, -0.5084941387176514, -0.4916570782661438, -0.4748200476169586, -0.45798298716545105, -0.4411459267139435, -0.4243088960647583, -0.40747183561325073, -0.39063477516174316, -0.3737977147102356, -0.356960654258728, -0.34012362360954285, -0.3232865631580353, -0.3064495027065277, -0.28961247205734253, -0.27277541160583496, -0.2559383511543274, -0.23910129070281982, -0.22226424515247345, -0.20542719960212708, -0.1885901391506195, -0.17175307869911194, -0.15491603314876556, -0.1380789875984192, -0.12124192714691162, -0.10440487414598465, -0.08756782114505768, -0.0707307681441307, -0.053893715143203735, -0.037056662142276764, -0.020219609141349792, -0.003382556140422821, 0.013454437255859375, 0.030291490256786346, 0.04712854325771332, 0.06396559625864029, 0.08080264925956726, 0.09763970226049423, 0.1144767552614212, 0.13131380081176758, 0.14815086126327515, 0.16498792171478271, 0.1818249672651291, 0.19866201281547546, 0.21549907326698303, 0.2323361337184906, 0.24917317926883698, 0.26601022481918335, 0.2828472852706909, 0.2996843457221985, 0.31652140617370605, 0.33335843682289124, 0.3501954972743988, 0.36703255772590637, 0.38386958837509155, 0.4007066488265991, 0.4175437092781067, 0.43438076972961426, 0.4512178301811218, 0.468054860830307, 0.4848919212818146, 0.5017289519309998, 0.5185660123825073, 0.5354030728340149, 0.5522401332855225]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 8.0, 9.0, 24.0, 40.0, 53.0, 99.0, 160.0, 282.0, 599.0, 1293.0, 2973.0, 8292.0, 27667.0, 121163.0, 459747.0, 327614.0, 70787.0, 17681.0, 5806.0, 2265.0, 937.0, 459.0, 230.0, 137.0, 78.0, 54.0, 37.0, 18.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.21875, -1.1827239990234375, -1.146697998046875, -1.1106719970703125, -1.07464599609375, -1.0386199951171875, -1.002593994140625, -0.9665679931640625, -0.9305419921875, -0.8945159912109375, -0.858489990234375, -0.8224639892578125, -0.78643798828125, -0.7504119873046875, -0.714385986328125, -0.6783599853515625, -0.642333984375, -0.6063079833984375, -0.570281982421875, -0.5342559814453125, -0.49822998046875, -0.4622039794921875, -0.426177978515625, -0.3901519775390625, -0.3541259765625, -0.3180999755859375, -0.282073974609375, -0.2460479736328125, -0.21002197265625, -0.1739959716796875, -0.137969970703125, -0.1019439697265625, -0.06591796875, -0.0298919677734375, 0.006134033203125, 0.0421600341796875, 0.07818603515625, 0.1142120361328125, 0.150238037109375, 0.1862640380859375, 0.2222900390625, 0.2583160400390625, 0.294342041015625, 0.3303680419921875, 0.36639404296875, 0.4024200439453125, 0.438446044921875, 0.4744720458984375, 0.510498046875, 0.5465240478515625, 0.582550048828125, 0.6185760498046875, 0.65460205078125, 0.6906280517578125, 0.726654052734375, 0.7626800537109375, 0.7987060546875, 0.8347320556640625, 0.870758056640625, 0.9067840576171875, 0.94281005859375, 0.9788360595703125, 1.014862060546875, 1.0508880615234375, 1.0869140625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 2.0, 4.0, 6.0, 9.0, 10.0, 12.0, 18.0, 19.0, 29.0, 34.0, 44.0, 40.0, 45.0, 49.0, 81.0, 51.0, 81.0, 54.0, 59.0, 60.0, 41.0, 32.0, 44.0, 33.0, 33.0, 23.0, 23.0, 17.0, 16.0, 12.0, 5.0, 6.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.250244140625, -0.24322128295898438, -0.23619842529296875, -0.22917556762695312, -0.2221527099609375, -0.21512985229492188, -0.20810699462890625, -0.20108413696289062, -0.194061279296875, -0.18703842163085938, -0.18001556396484375, -0.17299270629882812, -0.1659698486328125, -0.15894699096679688, -0.15192413330078125, -0.14490127563476562, -0.13787841796875, -0.13085556030273438, -0.12383270263671875, -0.11680984497070312, -0.1097869873046875, -0.10276412963867188, -0.09574127197265625, -0.08871841430664062, -0.081695556640625, -0.07467269897460938, -0.06764984130859375, -0.060626983642578125, -0.0536041259765625, -0.046581268310546875, -0.03955841064453125, -0.032535552978515625, -0.0255126953125, -0.018489837646484375, -0.01146697998046875, -0.004444122314453125, 0.0025787353515625, 0.009601593017578125, 0.01662445068359375, 0.023647308349609375, 0.030670166015625, 0.037693023681640625, 0.04471588134765625, 0.051738739013671875, 0.0587615966796875, 0.06578445434570312, 0.07280731201171875, 0.07983016967773438, 0.08685302734375, 0.09387588500976562, 0.10089874267578125, 0.10792160034179688, 0.1149444580078125, 0.12196731567382812, 0.12899017333984375, 0.13601303100585938, 0.143035888671875, 0.15005874633789062, 0.15708160400390625, 0.16410446166992188, 0.1711273193359375, 0.17815017700195312, 0.18517303466796875, 0.19219589233398438, 0.19921875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 7.0, 13.0, 16.0, 20.0, 31.0, 64.0, 87.0, 171.0, 304.0, 533.0, 1132.0, 2558.0, 6953.0, 25900.0, 155830.0, 645897.0, 169274.0, 27243.0, 7436.0, 2709.0, 1106.0, 537.0, 315.0, 150.0, 96.0, 65.0, 28.0, 28.0, 21.0, 12.0, 7.0, 2.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3134765625, -1.2718048095703125, -1.230133056640625, -1.1884613037109375, -1.14678955078125, -1.1051177978515625, -1.063446044921875, -1.0217742919921875, -0.9801025390625, -0.9384307861328125, -0.896759033203125, -0.8550872802734375, -0.81341552734375, -0.7717437744140625, -0.730072021484375, -0.6884002685546875, -0.646728515625, -0.6050567626953125, -0.563385009765625, -0.5217132568359375, -0.48004150390625, -0.4383697509765625, -0.396697998046875, -0.3550262451171875, -0.3133544921875, -0.2716827392578125, -0.230010986328125, -0.1883392333984375, -0.14666748046875, -0.1049957275390625, -0.063323974609375, -0.0216522216796875, 0.02001953125, 0.0616912841796875, 0.103363037109375, 0.1450347900390625, 0.18670654296875, 0.2283782958984375, 0.270050048828125, 0.3117218017578125, 0.3533935546875, 0.3950653076171875, 0.436737060546875, 0.4784088134765625, 0.52008056640625, 0.5617523193359375, 0.603424072265625, 0.6450958251953125, 0.686767578125, 0.7284393310546875, 0.770111083984375, 0.8117828369140625, 0.85345458984375, 0.8951263427734375, 0.936798095703125, 0.9784698486328125, 1.0201416015625, 1.0618133544921875, 1.103485107421875, 1.1451568603515625, 1.18682861328125, 1.2285003662109375, 1.270172119140625, 1.3118438720703125, 1.353515625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 6.0, 7.0, 4.0, 11.0, 9.0, 19.0, 21.0, 35.0, 36.0, 46.0, 50.0, 45.0, 65.0, 65.0, 68.0, 78.0, 42.0, 64.0, 48.0, 35.0, 36.0, 41.0, 35.0, 31.0, 25.0, 23.0, 11.0, 9.0, 11.0, 9.0, 8.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2158203125, -1.1701507568359375, -1.124481201171875, -1.0788116455078125, -1.03314208984375, -0.9874725341796875, -0.941802978515625, -0.8961334228515625, -0.8504638671875, -0.8047943115234375, -0.759124755859375, -0.7134552001953125, -0.66778564453125, -0.6221160888671875, -0.576446533203125, -0.5307769775390625, -0.485107421875, -0.4394378662109375, -0.393768310546875, -0.3480987548828125, -0.30242919921875, -0.2567596435546875, -0.211090087890625, -0.1654205322265625, -0.1197509765625, -0.0740814208984375, -0.028411865234375, 0.0172576904296875, 0.06292724609375, 0.1085968017578125, 0.154266357421875, 0.1999359130859375, 0.24560546875, 0.2912750244140625, 0.336944580078125, 0.3826141357421875, 0.42828369140625, 0.4739532470703125, 0.519622802734375, 0.5652923583984375, 0.6109619140625, 0.6566314697265625, 0.702301025390625, 0.7479705810546875, 0.79364013671875, 0.8393096923828125, 0.884979248046875, 0.9306488037109375, 0.976318359375, 1.0219879150390625, 1.067657470703125, 1.1133270263671875, 1.15899658203125, 1.2046661376953125, 1.250335693359375, 1.2960052490234375, 1.3416748046875, 1.3873443603515625, 1.433013916015625, 1.4786834716796875, 1.52435302734375, 1.5700225830078125, 1.615692138671875, 1.6613616943359375, 1.70703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 7.0, 12.0, 26.0, 32.0, 51.0, 81.0, 149.0, 255.0, 552.0, 1403.0, 5127.0, 47268.0, 929906.0, 55516.0, 5530.0, 1456.0, 534.0, 279.0, 141.0, 92.0, 48.0, 26.0, 14.0, 12.0, 11.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.841796875, -1.7833709716796875, -1.724945068359375, -1.6665191650390625, -1.60809326171875, -1.5496673583984375, -1.491241455078125, -1.4328155517578125, -1.3743896484375, -1.3159637451171875, -1.257537841796875, -1.1991119384765625, -1.14068603515625, -1.0822601318359375, -1.023834228515625, -0.9654083251953125, -0.906982421875, -0.8485565185546875, -0.790130615234375, -0.7317047119140625, -0.67327880859375, -0.6148529052734375, -0.556427001953125, -0.4980010986328125, -0.4395751953125, -0.3811492919921875, -0.322723388671875, -0.2642974853515625, -0.20587158203125, -0.1474456787109375, -0.089019775390625, -0.0305938720703125, 0.02783203125, 0.0862579345703125, 0.144683837890625, 0.2031097412109375, 0.26153564453125, 0.3199615478515625, 0.378387451171875, 0.4368133544921875, 0.4952392578125, 0.5536651611328125, 0.612091064453125, 0.6705169677734375, 0.72894287109375, 0.7873687744140625, 0.845794677734375, 0.9042205810546875, 0.962646484375, 1.0210723876953125, 1.079498291015625, 1.1379241943359375, 1.19635009765625, 1.2547760009765625, 1.313201904296875, 1.3716278076171875, 1.4300537109375, 1.4884796142578125, 1.546905517578125, 1.6053314208984375, 1.66375732421875, 1.7221832275390625, 1.780609130859375, 1.8390350341796875, 1.8974609375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 9.0, 16.0, 22.0, 36.0, 58.0, 108.0, 120.0, 144.0, 161.0, 110.0, 112.0, 47.0, 28.0, 15.0, 10.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0003917217254638672, -0.0003816969692707062, -0.00037167221307754517, -0.00036164745688438416, -0.00035162270069122314, -0.00034159794449806213, -0.0003315731883049011, -0.0003215484321117401, -0.0003115236759185791, -0.0003014989197254181, -0.0002914741635322571, -0.00028144940733909607, -0.00027142465114593506, -0.00026139989495277405, -0.00025137513875961304, -0.00024135038256645203, -0.00023132562637329102, -0.00022130087018013, -0.000211276113986969, -0.00020125135779380798, -0.00019122660160064697, -0.00018120184540748596, -0.00017117708921432495, -0.00016115233302116394, -0.00015112757682800293, -0.00014110282063484192, -0.0001310780644416809, -0.0001210533082485199, -0.00011102855205535889, -0.00010100379586219788, -9.097903966903687e-05, -8.095428347587585e-05, -7.092952728271484e-05, -6.090477108955383e-05, -5.088001489639282e-05, -4.085525870323181e-05, -3.08305025100708e-05, -2.080574631690979e-05, -1.078099012374878e-05, -7.562339305877686e-07, 9.268522262573242e-06, 1.9293278455734253e-05, 2.9318034648895264e-05, 3.9342790842056274e-05, 4.9367547035217285e-05, 5.9392303228378296e-05, 6.94170594215393e-05, 7.944181561470032e-05, 8.946657180786133e-05, 9.949132800102234e-05, 0.00010951608419418335, 0.00011954084038734436, 0.00012956559658050537, 0.00013959035277366638, 0.0001496151089668274, 0.0001596398651599884, 0.00016966462135314941, 0.00017968937754631042, 0.00018971413373947144, 0.00019973888993263245, 0.00020976364612579346, 0.00021978840231895447, 0.00022981315851211548, 0.0002398379147052765, 0.0002498626708984375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 5.0, 4.0, 8.0, 19.0, 12.0, 22.0, 34.0, 63.0, 96.0, 132.0, 268.0, 594.0, 1499.0, 5156.0, 36704.0, 840866.0, 148387.0, 10534.0, 2395.0, 838.0, 369.0, 204.0, 115.0, 59.0, 35.0, 36.0, 13.0, 22.0, 11.0, 14.0, 5.0, 5.0, 10.0, 3.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1259765625, -1.083831787109375, -1.04168701171875, -0.999542236328125, -0.9573974609375, -0.915252685546875, -0.87310791015625, -0.830963134765625, -0.788818359375, -0.746673583984375, -0.70452880859375, -0.662384033203125, -0.6202392578125, -0.578094482421875, -0.53594970703125, -0.493804931640625, -0.45166015625, -0.409515380859375, -0.36737060546875, -0.325225830078125, -0.2830810546875, -0.240936279296875, -0.19879150390625, -0.156646728515625, -0.114501953125, -0.072357177734375, -0.03021240234375, 0.011932373046875, 0.0540771484375, 0.096221923828125, 0.13836669921875, 0.180511474609375, 0.22265625, 0.264801025390625, 0.30694580078125, 0.349090576171875, 0.3912353515625, 0.433380126953125, 0.47552490234375, 0.517669677734375, 0.559814453125, 0.601959228515625, 0.64410400390625, 0.686248779296875, 0.7283935546875, 0.770538330078125, 0.81268310546875, 0.854827880859375, 0.89697265625, 0.939117431640625, 0.98126220703125, 1.023406982421875, 1.0655517578125, 1.107696533203125, 1.14984130859375, 1.191986083984375, 1.234130859375, 1.276275634765625, 1.31842041015625, 1.360565185546875, 1.4027099609375, 1.444854736328125, 1.48699951171875, 1.529144287109375, 1.5712890625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 1.0, 5.0, 3.0, 5.0, 9.0, 9.0, 16.0, 19.0, 35.0, 52.0, 79.0, 136.0, 218.0, 144.0, 78.0, 56.0, 39.0, 35.0, 14.0, 9.0, 8.0, 9.0, 3.0, 7.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6767578125, -1.6282806396484375, -1.579803466796875, -1.5313262939453125, -1.48284912109375, -1.4343719482421875, -1.385894775390625, -1.3374176025390625, -1.2889404296875, -1.2404632568359375, -1.191986083984375, -1.1435089111328125, -1.09503173828125, -1.0465545654296875, -0.998077392578125, -0.9496002197265625, -0.901123046875, -0.8526458740234375, -0.804168701171875, -0.7556915283203125, -0.70721435546875, -0.6587371826171875, -0.610260009765625, -0.5617828369140625, -0.5133056640625, -0.4648284912109375, -0.416351318359375, -0.3678741455078125, -0.31939697265625, -0.2709197998046875, -0.222442626953125, -0.1739654541015625, -0.12548828125, -0.0770111083984375, -0.028533935546875, 0.0199432373046875, 0.06842041015625, 0.1168975830078125, 0.165374755859375, 0.2138519287109375, 0.2623291015625, 0.3108062744140625, 0.359283447265625, 0.4077606201171875, 0.45623779296875, 0.5047149658203125, 0.553192138671875, 0.6016693115234375, 0.650146484375, 0.6986236572265625, 0.747100830078125, 0.7955780029296875, 0.84405517578125, 0.8925323486328125, 0.941009521484375, 0.9894866943359375, 1.0379638671875, 1.0864410400390625, 1.134918212890625, 1.1833953857421875, 1.23187255859375, 1.2803497314453125, 1.328826904296875, 1.3773040771484375, 1.42578125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 10.0, 40.0, 93.0, 266.0, 328.0, 172.0, 56.0, 23.0, 12.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.725555419921875, -37.84878158569336, -36.97201156616211, -36.095237731933594, -35.218467712402344, -34.34169387817383, -33.46492385864258, -32.58815002441406, -31.711380004882812, -30.83460807800293, -29.957836151123047, -29.081064224243164, -28.20429229736328, -27.3275203704834, -26.450748443603516, -25.573974609375, -24.697202682495117, -23.820430755615234, -22.94365882873535, -22.06688690185547, -21.190114974975586, -20.313343048095703, -19.436569213867188, -18.559799194335938, -17.683025360107422, -16.80625343322754, -15.929481506347656, -15.052709579467773, -14.17593765258789, -13.299165725708008, -12.422392845153809, -11.545620918273926, -10.668851852416992, -9.79207992553711, -8.915307998657227, -8.038536071777344, -7.161763668060303, -6.28499174118042, -5.408219337463379, -4.531447410583496, -3.6546754837036133, -2.7779035568237305, -1.9011313915252686, -1.0243592262268066, -0.14758729934692383, 0.729184627532959, 1.60595703125, 2.482728958129883, 3.3595008850097656, 4.236272811889648, 5.113044738769531, 5.989817142486572, 6.866589069366455, 7.743360996246338, 8.620133399963379, 9.496905326843262, 10.373677253723145, 11.250449180603027, 12.12722110748291, 13.00399398803711, 13.880765914916992, 14.757537841796875, 15.634309768676758, 16.51108169555664, 17.387853622436523]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 11.0, 3.0, 6.0, 15.0, 22.0, 20.0, 19.0, 30.0, 40.0, 39.0, 30.0, 44.0, 69.0, 49.0, 53.0, 60.0, 61.0, 48.0, 54.0, 41.0, 47.0, 35.0, 24.0, 34.0, 29.0, 23.0, 24.0, 15.0, 11.0, 10.0, 7.0, 4.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.49945068359375, -8.242652893066406, -7.985855579376221, -7.729058265686035, -7.47226095199585, -7.215463638305664, -6.95866584777832, -6.701868534088135, -6.445071220397949, -6.188273906707764, -5.93147611618042, -5.674678802490234, -5.417881488800049, -5.161084175109863, -4.9042863845825195, -4.647489070892334, -4.39069128036499, -4.133893966674805, -3.87709641456604, -3.6202988624572754, -3.36350154876709, -3.106703996658325, -2.8499064445495605, -2.593109130859375, -2.3363115787506104, -2.0795140266418457, -1.8227167129516602, -1.5659191608428955, -1.3091217279434204, -1.0523242950439453, -0.7955267429351807, -0.5387293100357056, -0.28193187713623047, -0.025134414434432983, 0.2316630482673645, 0.4884605407714844, 0.7452579736709595, 1.0020554065704346, 1.2588529586791992, 1.5156503915786743, 1.7724478244781494, 2.029245376586914, 2.2860426902770996, 2.5428402423858643, 2.799637794494629, 3.0564351081848145, 3.313232660293579, 3.5700302124023438, 3.8268275260925293, 4.083624839782715, 4.340422630310059, 4.597219944000244, 4.85401725769043, 5.110815048217773, 5.367612361907959, 5.6244096755981445, 5.881207466125488, 6.138004779815674, 6.394802570343018, 6.651599884033203, 6.908397197723389, 7.165194511413574, 7.421992301940918, 7.6787896156311035, 7.935586929321289]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 4.0, 8.0, 7.0, 5.0, 10.0, 22.0, 25.0, 38.0, 48.0, 80.0, 108.0, 184.0, 334.0, 523.0, 995.0, 2051.0, 5204.0, 17251.0, 111564.0, 3899512.0, 127724.0, 18574.0, 5412.0, 2103.0, 1049.0, 551.0, 310.0, 181.0, 113.0, 81.0, 62.0, 31.0, 24.0, 21.0, 23.0, 8.0, 8.0, 4.0, 9.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.439453125, -1.3907012939453125, -1.341949462890625, -1.2931976318359375, -1.24444580078125, -1.1956939697265625, -1.146942138671875, -1.0981903076171875, -1.0494384765625, -1.0006866455078125, -0.951934814453125, -0.9031829833984375, -0.85443115234375, -0.8056793212890625, -0.756927490234375, -0.7081756591796875, -0.659423828125, -0.6106719970703125, -0.561920166015625, -0.5131683349609375, -0.46441650390625, -0.4156646728515625, -0.366912841796875, -0.3181610107421875, -0.2694091796875, -0.2206573486328125, -0.171905517578125, -0.1231536865234375, -0.07440185546875, -0.0256500244140625, 0.023101806640625, 0.0718536376953125, 0.12060546875, 0.1693572998046875, 0.218109130859375, 0.2668609619140625, 0.31561279296875, 0.3643646240234375, 0.413116455078125, 0.4618682861328125, 0.5106201171875, 0.5593719482421875, 0.608123779296875, 0.6568756103515625, 0.70562744140625, 0.7543792724609375, 0.803131103515625, 0.8518829345703125, 0.900634765625, 0.9493865966796875, 0.998138427734375, 1.0468902587890625, 1.09564208984375, 1.1443939208984375, 1.193145751953125, 1.2418975830078125, 1.2906494140625, 1.3394012451171875, 1.388153076171875, 1.4369049072265625, 1.48565673828125, 1.5344085693359375, 1.583160400390625, 1.6319122314453125, 1.6806640625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 8.0, 5.0, 9.0, 16.0, 11.0, 10.0, 17.0, 24.0, 28.0, 36.0, 47.0, 50.0, 54.0, 72.0, 56.0, 75.0, 72.0, 71.0, 67.0, 66.0, 43.0, 29.0, 31.0, 22.0, 20.0, 10.0, 6.0, 10.0, 9.0, 9.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.33349609375, -0.3246021270751953, -0.3157081604003906, -0.30681419372558594, -0.29792022705078125, -0.28902626037597656, -0.2801322937011719, -0.2712383270263672, -0.2623443603515625, -0.2534503936767578, -0.24455642700195312, -0.23566246032714844, -0.22676849365234375, -0.21787452697753906, -0.20898056030273438, -0.2000865936279297, -0.191192626953125, -0.1822986602783203, -0.17340469360351562, -0.16451072692871094, -0.15561676025390625, -0.14672279357910156, -0.13782882690429688, -0.1289348602294922, -0.1200408935546875, -0.11114692687988281, -0.10225296020507812, -0.09335899353027344, -0.08446502685546875, -0.07557106018066406, -0.06667709350585938, -0.05778312683105469, -0.04888916015625, -0.03999519348144531, -0.031101226806640625, -0.022207260131835938, -0.01331329345703125, -0.0044193267822265625, 0.004474639892578125, 0.013368606567382812, 0.0222625732421875, 0.031156539916992188, 0.040050506591796875, 0.04894447326660156, 0.05783843994140625, 0.06673240661621094, 0.07562637329101562, 0.08452033996582031, 0.093414306640625, 0.10230827331542969, 0.11120223999023438, 0.12009620666503906, 0.12899017333984375, 0.13788414001464844, 0.14677810668945312, 0.1556720733642578, 0.1645660400390625, 0.1734600067138672, 0.18235397338867188, 0.19124794006347656, 0.20014190673828125, 0.20903587341308594, 0.21792984008789062, 0.2268238067626953, 0.2357177734375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 5.0, 8.0, 18.0, 30.0, 27.0, 34.0, 66.0, 101.0, 127.0, 191.0, 361.0, 654.0, 1242.0, 2750.0, 7687.0, 29712.0, 237143.0, 3777321.0, 108283.0, 18492.0, 5522.0, 2064.0, 1038.0, 565.0, 297.0, 159.0, 135.0, 76.0, 40.0, 42.0, 22.0, 11.0, 13.0, 13.0, 7.0, 10.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6884765625, -1.632843017578125, -1.57720947265625, -1.521575927734375, -1.4659423828125, -1.410308837890625, -1.35467529296875, -1.299041748046875, -1.243408203125, -1.187774658203125, -1.13214111328125, -1.076507568359375, -1.0208740234375, -0.965240478515625, -0.90960693359375, -0.853973388671875, -0.79833984375, -0.742706298828125, -0.68707275390625, -0.631439208984375, -0.5758056640625, -0.520172119140625, -0.46453857421875, -0.408905029296875, -0.353271484375, -0.297637939453125, -0.24200439453125, -0.186370849609375, -0.1307373046875, -0.075103759765625, -0.01947021484375, 0.036163330078125, 0.091796875, 0.147430419921875, 0.20306396484375, 0.258697509765625, 0.3143310546875, 0.369964599609375, 0.42559814453125, 0.481231689453125, 0.536865234375, 0.592498779296875, 0.64813232421875, 0.703765869140625, 0.7593994140625, 0.815032958984375, 0.87066650390625, 0.926300048828125, 0.98193359375, 1.037567138671875, 1.09320068359375, 1.148834228515625, 1.2044677734375, 1.260101318359375, 1.31573486328125, 1.371368408203125, 1.427001953125, 1.482635498046875, 1.53826904296875, 1.593902587890625, 1.6495361328125, 1.705169677734375, 1.76080322265625, 1.816436767578125, 1.8720703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 12.0, 15.0, 33.0, 73.0, 212.0, 2214.0, 1150.0, 171.0, 70.0, 48.0, 32.0, 13.0, 11.0, 6.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35888671875, -0.33892822265625, -0.3189697265625, -0.29901123046875, -0.279052734375, -0.25909423828125, -0.2391357421875, -0.21917724609375, -0.19921875, -0.17926025390625, -0.1593017578125, -0.13934326171875, -0.119384765625, -0.09942626953125, -0.0794677734375, -0.05950927734375, -0.03955078125, -0.01959228515625, 0.0003662109375, 0.02032470703125, 0.040283203125, 0.06024169921875, 0.0802001953125, 0.10015869140625, 0.1201171875, 0.14007568359375, 0.1600341796875, 0.17999267578125, 0.199951171875, 0.21990966796875, 0.2398681640625, 0.25982666015625, 0.27978515625, 0.29974365234375, 0.3197021484375, 0.33966064453125, 0.359619140625, 0.37957763671875, 0.3995361328125, 0.41949462890625, 0.439453125, 0.45941162109375, 0.4793701171875, 0.49932861328125, 0.519287109375, 0.53924560546875, 0.5592041015625, 0.57916259765625, 0.59912109375, 0.61907958984375, 0.6390380859375, 0.65899658203125, 0.678955078125, 0.69891357421875, 0.7188720703125, 0.73883056640625, 0.7587890625, 0.77874755859375, 0.7987060546875, 0.81866455078125, 0.838623046875, 0.85858154296875, 0.8785400390625, 0.89849853515625, 0.91845703125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 24.0, 43.0, 127.0, 206.0, 240.0, 163.0, 99.0, 50.0, 28.0, 9.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.364908695220947, -4.2325334548950195, -4.100157737731934, -3.9677822589874268, -3.83540678024292, -3.703031301498413, -3.5706558227539062, -3.4382803440093994, -3.3059048652648926, -3.1735293865203857, -3.041153907775879, -2.908778429031372, -2.7764029502868652, -2.6440274715423584, -2.5116519927978516, -2.3792765140533447, -2.246901035308838, -2.114525556564331, -1.9821500778198242, -1.8497745990753174, -1.7173991203308105, -1.5850236415863037, -1.4526481628417969, -1.32027268409729, -1.1878972053527832, -1.0555217266082764, -0.9231462478637695, -0.7907707691192627, -0.6583952903747559, -0.526019811630249, -0.3936443328857422, -0.26126885414123535, -0.12889385223388672, 0.003481626510620117, 0.13585710525512695, 0.2682325839996338, 0.4006080627441406, 0.5329835414886475, 0.6653590202331543, 0.7977344989776611, 0.930109977722168, 1.0624854564666748, 1.1948609352111816, 1.3272364139556885, 1.4596118927001953, 1.5919873714447021, 1.724362850189209, 1.8567383289337158, 1.9891138076782227, 2.1214892864227295, 2.2538647651672363, 2.386240243911743, 2.51861572265625, 2.650991201400757, 2.7833666801452637, 2.9157421588897705, 3.0481176376342773, 3.180493116378784, 3.312868595123291, 3.445244073867798, 3.5776195526123047, 3.7099950313568115, 3.8423705101013184, 3.974745988845825, 4.107121467590332]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 2.0, 5.0, 6.0, 9.0, 9.0, 21.0, 18.0, 25.0, 20.0, 24.0, 29.0, 38.0, 37.0, 32.0, 33.0, 43.0, 36.0, 47.0, 44.0, 41.0, 37.0, 33.0, 48.0, 33.0, 50.0, 39.0, 38.0, 38.0, 33.0, 28.0, 23.0, 21.0, 13.0, 10.0, 6.0, 8.0, 11.0, 9.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6801671981811523, -1.6221437454223633, -1.5641201734542847, -1.5060967206954956, -1.448073148727417, -1.390049695968628, -1.3320262432098389, -1.2740026712417603, -1.2159790992736816, -1.1579556465148926, -1.099932074546814, -1.041908621788025, -0.9838850498199463, -0.9258615970611572, -0.8678380846977234, -0.8098145723342896, -0.7517911195755005, -0.6937676072120667, -0.6357440948486328, -0.5777206420898438, -0.5196970701217651, -0.4616735875606537, -0.40365010499954224, -0.3456265926361084, -0.28760308027267456, -0.22957956790924072, -0.17155607044696808, -0.11353257298469543, -0.0555090606212616, 0.002514451742172241, 0.06053793430328369, 0.11856144666671753, 0.17658495903015137, 0.2346084713935852, 0.29263198375701904, 0.3506554663181305, 0.40867897868156433, 0.46670249104499817, 0.5247259736061096, 0.5827494859695435, 0.6407729983329773, 0.6987965106964111, 0.756820023059845, 0.8148435354232788, 0.8728669881820679, 0.9308905601501465, 0.9889140129089355, 1.0469374656677246, 1.1049610376358032, 1.1629844903945923, 1.221008062362671, 1.27903151512146, 1.3370550870895386, 1.3950785398483276, 1.4531021118164062, 1.5111255645751953, 1.5691490173339844, 1.6271724700927734, 1.685196042060852, 1.7432194948196411, 1.8012430667877197, 1.8592665195465088, 1.9172899723052979, 1.9753135442733765, 2.033337116241455]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 6.0, 11.0, 19.0, 31.0, 38.0, 53.0, 89.0, 165.0, 229.0, 416.0, 696.0, 1340.0, 2917.0, 6454.0, 17067.0, 51743.0, 174446.0, 410033.0, 261431.0, 79774.0, 24733.0, 8992.0, 3842.0, 1807.0, 957.0, 522.0, 281.0, 171.0, 84.0, 68.0, 39.0, 33.0, 27.0, 13.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.767578125, -0.740814208984375, -0.71405029296875, -0.687286376953125, -0.6605224609375, -0.633758544921875, -0.60699462890625, -0.580230712890625, -0.553466796875, -0.526702880859375, -0.49993896484375, -0.473175048828125, -0.4464111328125, -0.419647216796875, -0.39288330078125, -0.366119384765625, -0.33935546875, -0.312591552734375, -0.28582763671875, -0.259063720703125, -0.2322998046875, -0.205535888671875, -0.17877197265625, -0.152008056640625, -0.125244140625, -0.098480224609375, -0.07171630859375, -0.044952392578125, -0.0181884765625, 0.008575439453125, 0.03533935546875, 0.062103271484375, 0.0888671875, 0.115631103515625, 0.14239501953125, 0.169158935546875, 0.1959228515625, 0.222686767578125, 0.24945068359375, 0.276214599609375, 0.302978515625, 0.329742431640625, 0.35650634765625, 0.383270263671875, 0.4100341796875, 0.436798095703125, 0.46356201171875, 0.490325927734375, 0.51708984375, 0.543853759765625, 0.57061767578125, 0.597381591796875, 0.6241455078125, 0.650909423828125, 0.67767333984375, 0.704437255859375, 0.731201171875, 0.757965087890625, 0.78472900390625, 0.811492919921875, 0.8382568359375, 0.865020751953125, 0.89178466796875, 0.918548583984375, 0.9453125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 1.0, 5.0, 4.0, 6.0, 5.0, 4.0, 11.0, 18.0, 12.0, 17.0, 19.0, 23.0, 20.0, 32.0, 41.0, 41.0, 34.0, 36.0, 55.0, 65.0, 61.0, 62.0, 46.0, 44.0, 50.0, 55.0, 34.0, 31.0, 25.0, 24.0, 17.0, 23.0, 18.0, 11.0, 10.0, 7.0, 6.0, 12.0, 4.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.325439453125, -0.3160552978515625, -0.306671142578125, -0.2972869873046875, -0.28790283203125, -0.2785186767578125, -0.269134521484375, -0.2597503662109375, -0.2503662109375, -0.2409820556640625, -0.231597900390625, -0.2222137451171875, -0.21282958984375, -0.2034454345703125, -0.194061279296875, -0.1846771240234375, -0.17529296875, -0.1659088134765625, -0.156524658203125, -0.1471405029296875, -0.13775634765625, -0.1283721923828125, -0.118988037109375, -0.1096038818359375, -0.1002197265625, -0.0908355712890625, -0.081451416015625, -0.0720672607421875, -0.06268310546875, -0.0532989501953125, -0.043914794921875, -0.0345306396484375, -0.025146484375, -0.0157623291015625, -0.006378173828125, 0.0030059814453125, 0.01239013671875, 0.0217742919921875, 0.031158447265625, 0.0405426025390625, 0.0499267578125, 0.0593109130859375, 0.068695068359375, 0.0780792236328125, 0.08746337890625, 0.0968475341796875, 0.106231689453125, 0.1156158447265625, 0.125, 0.1343841552734375, 0.143768310546875, 0.1531524658203125, 0.16253662109375, 0.1719207763671875, 0.181304931640625, 0.1906890869140625, 0.2000732421875, 0.2094573974609375, 0.218841552734375, 0.2282257080078125, 0.23760986328125, 0.2469940185546875, 0.256378173828125, 0.2657623291015625, 0.275146484375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 3.0, 10.0, 6.0, 10.0, 13.0, 21.0, 32.0, 64.0, 103.0, 148.0, 355.0, 662.0, 1590.0, 4399.0, 23648.0, 495296.0, 491178.0, 23780.0, 4335.0, 1408.0, 680.0, 336.0, 167.0, 104.0, 81.0, 42.0, 23.0, 19.0, 12.0, 4.0, 8.0, 5.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.44921875, -2.370208740234375, -2.29119873046875, -2.212188720703125, -2.1331787109375, -2.054168701171875, -1.97515869140625, -1.896148681640625, -1.817138671875, -1.738128662109375, -1.65911865234375, -1.580108642578125, -1.5010986328125, -1.422088623046875, -1.34307861328125, -1.264068603515625, -1.18505859375, -1.106048583984375, -1.02703857421875, -0.948028564453125, -0.8690185546875, -0.790008544921875, -0.71099853515625, -0.631988525390625, -0.552978515625, -0.473968505859375, -0.39495849609375, -0.315948486328125, -0.2369384765625, -0.157928466796875, -0.07891845703125, 9.1552734375e-05, 0.0791015625, 0.158111572265625, 0.23712158203125, 0.316131591796875, 0.3951416015625, 0.474151611328125, 0.55316162109375, 0.632171630859375, 0.711181640625, 0.790191650390625, 0.86920166015625, 0.948211669921875, 1.0272216796875, 1.106231689453125, 1.18524169921875, 1.264251708984375, 1.34326171875, 1.422271728515625, 1.50128173828125, 1.580291748046875, 1.6593017578125, 1.738311767578125, 1.81732177734375, 1.896331787109375, 1.975341796875, 2.054351806640625, 2.13336181640625, 2.212371826171875, 2.2913818359375, 2.370391845703125, 2.44940185546875, 2.528411865234375, 2.607421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 10.0, 4.0, 13.0, 8.0, 20.0, 20.0, 29.0, 28.0, 30.0, 40.0, 49.0, 48.0, 70.0, 74.0, 79.0, 57.0, 69.0, 59.0, 56.0, 27.0, 41.0, 35.0, 24.0, 22.0, 24.0, 16.0, 13.0, 6.0, 4.0, 8.0, 7.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.951171875, -2.863861083984375, -2.77655029296875, -2.689239501953125, -2.6019287109375, -2.514617919921875, -2.42730712890625, -2.339996337890625, -2.252685546875, -2.165374755859375, -2.07806396484375, -1.990753173828125, -1.9034423828125, -1.816131591796875, -1.72882080078125, -1.641510009765625, -1.55419921875, -1.466888427734375, -1.37957763671875, -1.292266845703125, -1.2049560546875, -1.117645263671875, -1.03033447265625, -0.943023681640625, -0.855712890625, -0.768402099609375, -0.68109130859375, -0.593780517578125, -0.5064697265625, -0.419158935546875, -0.33184814453125, -0.244537353515625, -0.1572265625, -0.069915771484375, 0.01739501953125, 0.104705810546875, 0.1920166015625, 0.279327392578125, 0.36663818359375, 0.453948974609375, 0.541259765625, 0.628570556640625, 0.71588134765625, 0.803192138671875, 0.8905029296875, 0.977813720703125, 1.06512451171875, 1.152435302734375, 1.23974609375, 1.327056884765625, 1.41436767578125, 1.501678466796875, 1.5889892578125, 1.676300048828125, 1.76361083984375, 1.850921630859375, 1.938232421875, 2.025543212890625, 2.11285400390625, 2.200164794921875, 2.2874755859375, 2.374786376953125, 2.46209716796875, 2.549407958984375, 2.63671875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 3.0, 6.0, 12.0, 15.0, 14.0, 33.0, 48.0, 66.0, 137.0, 312.0, 770.0, 4061.0, 1024783.0, 16086.0, 1345.0, 462.0, 153.0, 93.0, 53.0, 35.0, 22.0, 12.0, 7.0, 6.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.609375, -8.3538818359375, -8.098388671875, -7.8428955078125, -7.58740234375, -7.3319091796875, -7.076416015625, -6.8209228515625, -6.5654296875, -6.3099365234375, -6.054443359375, -5.7989501953125, -5.54345703125, -5.2879638671875, -5.032470703125, -4.7769775390625, -4.521484375, -4.2659912109375, -4.010498046875, -3.7550048828125, -3.49951171875, -3.2440185546875, -2.988525390625, -2.7330322265625, -2.4775390625, -2.2220458984375, -1.966552734375, -1.7110595703125, -1.45556640625, -1.2000732421875, -0.944580078125, -0.6890869140625, -0.43359375, -0.1781005859375, 0.077392578125, 0.3328857421875, 0.58837890625, 0.8438720703125, 1.099365234375, 1.3548583984375, 1.6103515625, 1.8658447265625, 2.121337890625, 2.3768310546875, 2.63232421875, 2.8878173828125, 3.143310546875, 3.3988037109375, 3.654296875, 3.9097900390625, 4.165283203125, 4.4207763671875, 4.67626953125, 4.9317626953125, 5.187255859375, 5.4427490234375, 5.6982421875, 5.9537353515625, 6.209228515625, 6.4647216796875, 6.72021484375, 6.9757080078125, 7.231201171875, 7.4866943359375, 7.7421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 17.0, 20.0, 41.0, 102.0, 149.0, 212.0, 203.0, 130.0, 61.0, 33.0, 10.0, 12.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004134178161621094, -0.0004032682627439499, -0.0003931187093257904, -0.0003829691559076309, -0.00037281960248947144, -0.00036267004907131195, -0.00035252049565315247, -0.000342370942234993, -0.0003322213888168335, -0.000322071835398674, -0.0003119222819805145, -0.00030177272856235504, -0.00029162317514419556, -0.00028147362172603607, -0.0002713240683078766, -0.0002611745148897171, -0.0002510249614715576, -0.00024087540805339813, -0.00023072585463523865, -0.00022057630121707916, -0.00021042674779891968, -0.0002002771943807602, -0.0001901276409626007, -0.00017997808754444122, -0.00016982853412628174, -0.00015967898070812225, -0.00014952942728996277, -0.00013937987387180328, -0.0001292303204536438, -0.00011908076703548431, -0.00010893121361732483, -9.878166019916534e-05, -8.863210678100586e-05, -7.848255336284637e-05, -6.833299994468689e-05, -5.8183446526527405e-05, -4.803389310836792e-05, -3.7884339690208435e-05, -2.773478627204895e-05, -1.7585232853889465e-05, -7.4356794357299805e-06, 2.7138739824295044e-06, 1.286342740058899e-05, 2.3012980818748474e-05, 3.316253423690796e-05, 4.3312087655067444e-05, 5.346164107322693e-05, 6.361119449138641e-05, 7.37607479095459e-05, 8.391030132770538e-05, 9.405985474586487e-05, 0.00010420940816402435, 0.00011435896158218384, 0.00012450851500034332, 0.0001346580684185028, 0.0001448076218366623, 0.00015495717525482178, 0.00016510672867298126, 0.00017525628209114075, 0.00018540583550930023, 0.00019555538892745972, 0.0002057049423456192, 0.0002158544957637787, 0.00022600404918193817, 0.00023615360260009766]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 2.0, 14.0, 21.0, 31.0, 64.0, 114.0, 273.0, 753.0, 3655.0, 71098.0, 959598.0, 10669.0, 1491.0, 404.0, 172.0, 81.0, 29.0, 26.0, 11.0, 14.0, 14.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8828125, -4.758392333984375, -4.63397216796875, -4.509552001953125, -4.3851318359375, -4.260711669921875, -4.13629150390625, -4.011871337890625, -3.887451171875, -3.763031005859375, -3.63861083984375, -3.514190673828125, -3.3897705078125, -3.265350341796875, -3.14093017578125, -3.016510009765625, -2.89208984375, -2.767669677734375, -2.64324951171875, -2.518829345703125, -2.3944091796875, -2.269989013671875, -2.14556884765625, -2.021148681640625, -1.896728515625, -1.772308349609375, -1.64788818359375, -1.523468017578125, -1.3990478515625, -1.274627685546875, -1.15020751953125, -1.025787353515625, -0.9013671875, -0.776947021484375, -0.65252685546875, -0.528106689453125, -0.4036865234375, -0.279266357421875, -0.15484619140625, -0.030426025390625, 0.093994140625, 0.218414306640625, 0.34283447265625, 0.467254638671875, 0.5916748046875, 0.716094970703125, 0.84051513671875, 0.964935302734375, 1.08935546875, 1.213775634765625, 1.33819580078125, 1.462615966796875, 1.5870361328125, 1.711456298828125, 1.83587646484375, 1.960296630859375, 2.084716796875, 2.209136962890625, 2.33355712890625, 2.457977294921875, 2.5823974609375, 2.706817626953125, 2.83123779296875, 2.955657958984375, 3.080078125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 8.0, 6.0, 15.0, 47.0, 158.0, 406.0, 235.0, 61.0, 19.0, 9.0, 5.0, 2.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.51171875, -6.37213134765625, -6.2325439453125, -6.09295654296875, -5.953369140625, -5.81378173828125, -5.6741943359375, -5.53460693359375, -5.39501953125, -5.25543212890625, -5.1158447265625, -4.97625732421875, -4.836669921875, -4.69708251953125, -4.5574951171875, -4.41790771484375, -4.2783203125, -4.13873291015625, -3.9991455078125, -3.85955810546875, -3.719970703125, -3.58038330078125, -3.4407958984375, -3.30120849609375, -3.16162109375, -3.02203369140625, -2.8824462890625, -2.74285888671875, -2.603271484375, -2.46368408203125, -2.3240966796875, -2.18450927734375, -2.044921875, -1.90533447265625, -1.7657470703125, -1.62615966796875, -1.486572265625, -1.34698486328125, -1.2073974609375, -1.06781005859375, -0.92822265625, -0.78863525390625, -0.6490478515625, -0.50946044921875, -0.369873046875, -0.23028564453125, -0.0906982421875, 0.04888916015625, 0.1884765625, 0.32806396484375, 0.4676513671875, 0.60723876953125, 0.746826171875, 0.88641357421875, 1.0260009765625, 1.16558837890625, 1.30517578125, 1.44476318359375, 1.5843505859375, 1.72393798828125, 1.863525390625, 2.00311279296875, 2.1427001953125, 2.28228759765625, 2.421875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 38.0, 125.0, 353.0, 313.0, 116.0, 37.0, 16.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.729516983032227, -19.12299919128418, -17.516481399536133, -15.909964561462402, -14.303447723388672, -12.696929931640625, -11.090412139892578, -9.483895301818848, -7.877377510070801, -6.270860195159912, -4.664342880249023, -3.0578250885009766, -1.451307773590088, 0.15520954132080078, 1.7617273330688477, 3.368244171142578, 4.974761962890625, 6.581279277801514, 8.187796592712402, 9.79431438446045, 11.40083122253418, 13.007349014282227, 14.613866806030273, 16.220382690429688, 17.826900482177734, 19.43341827392578, 21.039936065673828, 22.646453857421875, 24.25296974182129, 25.859487533569336, 27.466005325317383, 29.072521209716797, 30.67904281616211, 32.285560607910156, 33.8920783996582, 35.49859619140625, 37.1051139831543, 38.711631774902344, 40.318145751953125, 41.92466354370117, 43.53118133544922, 45.137699127197266, 46.74421691894531, 48.35073471069336, 49.957252502441406, 51.56376647949219, 53.1702880859375, 54.77680206298828, 56.383323669433594, 57.98984146118164, 59.59635925292969, 61.202877044677734, 62.80939483642578, 64.41590881347656, 66.02243041992188, 67.62894439697266, 69.23545837402344, 70.84197235107422, 72.44849395751953, 74.05500793457031, 75.66152954101562, 77.2680435180664, 78.87456512451172, 80.4810791015625, 82.08760070800781]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 3.0, 4.0, 6.0, 8.0, 14.0, 10.0, 15.0, 14.0, 23.0, 30.0, 30.0, 28.0, 23.0, 40.0, 35.0, 45.0, 50.0, 48.0, 56.0, 61.0, 52.0, 47.0, 43.0, 34.0, 33.0, 40.0, 28.0, 38.0, 22.0, 18.0, 24.0, 15.0, 15.0, 13.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-15.148448944091797, -14.728678703308105, -14.308908462524414, -13.889138221740723, -13.469367980957031, -13.049596786499023, -12.629826545715332, -12.21005630493164, -11.79028606414795, -11.370515823364258, -10.950745582580566, -10.530975341796875, -10.111204147338867, -9.691434860229492, -9.271663665771484, -8.851893424987793, -8.432123184204102, -8.01235294342041, -7.592582702636719, -7.172811985015869, -6.753041744232178, -6.333271503448486, -5.913500785827637, -5.493730545043945, -5.073960304260254, -4.6541900634765625, -4.234419822692871, -3.8146491050720215, -3.39487886428833, -2.9751086235046387, -2.555338144302368, -2.1355676651000977, -1.7157974243164062, -1.2960270643234253, -0.8762567043304443, -0.4564863443374634, -0.03671598434448242, 0.383054256439209, 0.8028247356414795, 1.22259521484375, 1.6423654556274414, 2.062135696411133, 2.4819061756134033, 2.901676654815674, 3.3214468955993652, 3.7412171363830566, 4.160987854003906, 4.580758094787598, 5.000528335571289, 5.4202985763549805, 5.840068817138672, 6.2598395347595215, 6.679609775543213, 7.099380016326904, 7.519150733947754, 7.938920974731445, 8.358691215515137, 8.778461456298828, 9.19823169708252, 9.618001937866211, 10.037773132324219, 10.457542419433594, 10.877313613891602, 11.297083854675293, 11.716854095458984]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 7.0, 13.0, 22.0, 22.0, 43.0, 153.0, 453.0, 2756.0, 3999609.0, 188577.0, 2013.0, 374.0, 134.0, 47.0, 29.0, 18.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78515625, -5.50897216796875, -5.2327880859375, -4.95660400390625, -4.680419921875, -4.40423583984375, -4.1280517578125, -3.85186767578125, -3.57568359375, -3.29949951171875, -3.0233154296875, -2.74713134765625, -2.470947265625, -2.19476318359375, -1.9185791015625, -1.64239501953125, -1.3662109375, -1.09002685546875, -0.8138427734375, -0.53765869140625, -0.261474609375, 0.01470947265625, 0.2908935546875, 0.56707763671875, 0.84326171875, 1.11944580078125, 1.3956298828125, 1.67181396484375, 1.947998046875, 2.22418212890625, 2.5003662109375, 2.77655029296875, 3.052734375, 3.32891845703125, 3.6051025390625, 3.88128662109375, 4.157470703125, 4.43365478515625, 4.7098388671875, 4.98602294921875, 5.26220703125, 5.53839111328125, 5.8145751953125, 6.09075927734375, 6.366943359375, 6.64312744140625, 6.9193115234375, 7.19549560546875, 7.4716796875, 7.74786376953125, 8.0240478515625, 8.30023193359375, 8.576416015625, 8.85260009765625, 9.1287841796875, 9.40496826171875, 9.68115234375, 9.95733642578125, 10.2335205078125, 10.50970458984375, 10.785888671875, 11.06207275390625, 11.3382568359375, 11.61444091796875, 11.890625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 12.0, 9.0, 12.0, 10.0, 10.0, 34.0, 25.0, 36.0, 48.0, 55.0, 85.0, 98.0, 81.0, 90.0, 85.0, 68.0, 56.0, 49.0, 32.0, 26.0, 20.0, 10.0, 12.0, 12.0, 5.0, 3.0, 1.0, 2.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.68359375, -0.6663055419921875, -0.649017333984375, -0.6317291259765625, -0.61444091796875, -0.5971527099609375, -0.579864501953125, -0.5625762939453125, -0.5452880859375, -0.5279998779296875, -0.510711669921875, -0.4934234619140625, -0.47613525390625, -0.4588470458984375, -0.441558837890625, -0.4242706298828125, -0.406982421875, -0.3896942138671875, -0.372406005859375, -0.3551177978515625, -0.33782958984375, -0.3205413818359375, -0.303253173828125, -0.2859649658203125, -0.2686767578125, -0.2513885498046875, -0.234100341796875, -0.2168121337890625, -0.19952392578125, -0.1822357177734375, -0.164947509765625, -0.1476593017578125, -0.13037109375, -0.1130828857421875, -0.095794677734375, -0.0785064697265625, -0.06121826171875, -0.0439300537109375, -0.026641845703125, -0.0093536376953125, 0.0079345703125, 0.0252227783203125, 0.042510986328125, 0.0597991943359375, 0.07708740234375, 0.0943756103515625, 0.111663818359375, 0.1289520263671875, 0.146240234375, 0.1635284423828125, 0.180816650390625, 0.1981048583984375, 0.21539306640625, 0.2326812744140625, 0.249969482421875, 0.2672576904296875, 0.2845458984375, 0.3018341064453125, 0.319122314453125, 0.3364105224609375, 0.35369873046875, 0.3709869384765625, 0.388275146484375, 0.4055633544921875, 0.4228515625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 11.0, 9.0, 10.0, 12.0, 31.0, 28.0, 43.0, 68.0, 76.0, 102.0, 151.0, 290.0, 500.0, 1155.0, 3282.0, 13456.0, 119528.0, 3986913.0, 55284.0, 8815.0, 2417.0, 936.0, 432.0, 209.0, 145.0, 101.0, 66.0, 67.0, 38.0, 22.0, 19.0, 20.0, 12.0, 9.0, 9.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.0234375, -2.935455322265625, -2.84747314453125, -2.759490966796875, -2.6715087890625, -2.583526611328125, -2.49554443359375, -2.407562255859375, -2.319580078125, -2.231597900390625, -2.14361572265625, -2.055633544921875, -1.9676513671875, -1.879669189453125, -1.79168701171875, -1.703704833984375, -1.61572265625, -1.527740478515625, -1.43975830078125, -1.351776123046875, -1.2637939453125, -1.175811767578125, -1.08782958984375, -0.999847412109375, -0.911865234375, -0.823883056640625, -0.73590087890625, -0.647918701171875, -0.5599365234375, -0.471954345703125, -0.38397216796875, -0.295989990234375, -0.2080078125, -0.120025634765625, -0.03204345703125, 0.055938720703125, 0.1439208984375, 0.231903076171875, 0.31988525390625, 0.407867431640625, 0.495849609375, 0.583831787109375, 0.67181396484375, 0.759796142578125, 0.8477783203125, 0.935760498046875, 1.02374267578125, 1.111724853515625, 1.19970703125, 1.287689208984375, 1.37567138671875, 1.463653564453125, 1.5516357421875, 1.639617919921875, 1.72760009765625, 1.815582275390625, 1.903564453125, 1.991546630859375, 2.07952880859375, 2.167510986328125, 2.2554931640625, 2.343475341796875, 2.43145751953125, 2.519439697265625, 2.607421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 6.0, 9.0, 16.0, 20.0, 28.0, 67.0, 147.0, 625.0, 2824.0, 177.0, 73.0, 24.0, 23.0, 11.0, 8.0, 5.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.716796875, -0.6989021301269531, -0.6810073852539062, -0.6631126403808594, -0.6452178955078125, -0.6273231506347656, -0.6094284057617188, -0.5915336608886719, -0.573638916015625, -0.5557441711425781, -0.5378494262695312, -0.5199546813964844, -0.5020599365234375, -0.4841651916503906, -0.46627044677734375, -0.4483757019042969, -0.43048095703125, -0.4125862121582031, -0.39469146728515625, -0.3767967224121094, -0.3589019775390625, -0.3410072326660156, -0.32311248779296875, -0.3052177429199219, -0.287322998046875, -0.2694282531738281, -0.25153350830078125, -0.23363876342773438, -0.2157440185546875, -0.19784927368164062, -0.17995452880859375, -0.16205978393554688, -0.1441650390625, -0.12627029418945312, -0.10837554931640625, -0.09048080444335938, -0.0725860595703125, -0.054691314697265625, -0.03679656982421875, -0.018901824951171875, -0.001007080078125, 0.016887664794921875, 0.03478240966796875, 0.052677154541015625, 0.0705718994140625, 0.08846664428710938, 0.10636138916015625, 0.12425613403320312, 0.14215087890625, 0.16004562377929688, 0.17794036865234375, 0.19583511352539062, 0.2137298583984375, 0.23162460327148438, 0.24951934814453125, 0.2674140930175781, 0.285308837890625, 0.3032035827636719, 0.32109832763671875, 0.3389930725097656, 0.3568878173828125, 0.3747825622558594, 0.39267730712890625, 0.4105720520019531, 0.428466796875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 7.0, 10.0, 17.0, 25.0, 34.0, 50.0, 75.0, 106.0, 116.0, 119.0, 123.0, 105.0, 76.0, 54.0, 31.0, 25.0, 16.0, 6.0, 6.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3647809028625488, -1.3026100397109985, -1.2404391765594482, -1.1782681941986084, -1.116097331047058, -1.0539264678955078, -0.9917556047439575, -0.9295847415924072, -0.8674138188362122, -0.8052429556846619, -0.7430720329284668, -0.6809011697769165, -0.6187303066253662, -0.5565593838691711, -0.49438852071762085, -0.43221762776374817, -0.3700467348098755, -0.3078758418560028, -0.24570496380329132, -0.18353408575057983, -0.12136319279670715, -0.05919229984283447, 0.0029785633087158203, 0.0651494562625885, 0.12732034921646118, 0.18949124217033386, 0.25166213512420654, 0.31383299827575684, 0.3760038912296295, 0.4381747841835022, 0.5003456473350525, 0.5625165700912476, 0.6246874332427979, 0.6868582963943481, 0.7490292191505432, 0.8112000823020935, 0.8733710050582886, 0.9355418682098389, 0.9977127313613892, 1.0598835945129395, 1.1220545768737793, 1.1842254400253296, 1.2463963031768799, 1.3085672855377197, 1.37073814868927, 1.4329090118408203, 1.4950798749923706, 1.557250738143921, 1.6194216012954712, 1.6815924644470215, 1.7437633275985718, 1.805934190750122, 1.868105173110962, 1.9302760362625122, 1.9924468994140625, 2.0546178817749023, 2.116788625717163, 2.178959608078003, 2.2411303520202637, 2.3033013343811035, 2.3654720783233643, 2.427643060684204, 2.489813804626465, 2.5519847869873047, 2.6141557693481445]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 3.0, 6.0, 8.0, 7.0, 11.0, 11.0, 11.0, 9.0, 17.0, 20.0, 30.0, 22.0, 21.0, 34.0, 43.0, 61.0, 38.0, 47.0, 42.0, 48.0, 41.0, 50.0, 42.0, 38.0, 40.0, 37.0, 35.0, 28.0, 29.0, 33.0, 29.0, 18.0, 22.0, 18.0, 8.0, 11.0, 7.0, 7.0, 8.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9708364605903625, -0.9387990832328796, -0.9067617058753967, -0.874724268913269, -0.8426868915557861, -0.8106495141983032, -0.7786121368408203, -0.7465747594833374, -0.7145373821258545, -0.6825000047683716, -0.6504626274108887, -0.6184252500534058, -0.5863878130912781, -0.5543504357337952, -0.5223130583763123, -0.49027568101882935, -0.45823824405670166, -0.42620086669921875, -0.39416345953941345, -0.36212608218193054, -0.33008867502212524, -0.29805129766464233, -0.2660139203071594, -0.23397652804851532, -0.20193913578987122, -0.1699017435312271, -0.137864351272583, -0.1058269739151001, -0.073789581656456, -0.04175218939781189, -0.00971481204032898, 0.022322580218315125, 0.054360032081604004, 0.08639742434024811, 0.11843480914831161, 0.15047219395637512, 0.18250958621501923, 0.21454697847366333, 0.24658435583114624, 0.27862173318862915, 0.31065914034843445, 0.34269651770591736, 0.37473392486572266, 0.40677130222320557, 0.4388086795806885, 0.4708460867404938, 0.5028834342956543, 0.534920871257782, 0.5669582486152649, 0.5989956259727478, 0.6310330033302307, 0.6630704402923584, 0.6951078176498413, 0.7271451950073242, 0.7591825723648071, 0.79121994972229, 0.823257327079773, 0.8552947044372559, 0.8873320817947388, 0.9193694591522217, 0.9514068961143494, 0.9834442734718323, 1.01548171043396, 1.0475190877914429, 1.0795564651489258]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 7.0, 4.0, 3.0, 9.0, 24.0, 17.0, 33.0, 46.0, 58.0, 95.0, 172.0, 336.0, 608.0, 1376.0, 3890.0, 14998.0, 97538.0, 652818.0, 237409.0, 29119.0, 6180.0, 2026.0, 817.0, 413.0, 212.0, 112.0, 73.0, 58.0, 34.0, 12.0, 19.0, 8.0, 5.0, 7.0, 5.0, 5.0, 2.0, 1.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.81640625, -1.7640533447265625, -1.711700439453125, -1.6593475341796875, -1.60699462890625, -1.5546417236328125, -1.502288818359375, -1.4499359130859375, -1.3975830078125, -1.3452301025390625, -1.292877197265625, -1.2405242919921875, -1.18817138671875, -1.1358184814453125, -1.083465576171875, -1.0311126708984375, -0.978759765625, -0.9264068603515625, -0.874053955078125, -0.8217010498046875, -0.76934814453125, -0.7169952392578125, -0.664642333984375, -0.6122894287109375, -0.5599365234375, -0.5075836181640625, -0.455230712890625, -0.4028778076171875, -0.35052490234375, -0.2981719970703125, -0.245819091796875, -0.1934661865234375, -0.14111328125, -0.0887603759765625, -0.036407470703125, 0.0159454345703125, 0.06829833984375, 0.1206512451171875, 0.173004150390625, 0.2253570556640625, 0.2777099609375, 0.3300628662109375, 0.382415771484375, 0.4347686767578125, 0.48712158203125, 0.5394744873046875, 0.591827392578125, 0.6441802978515625, 0.696533203125, 0.7488861083984375, 0.801239013671875, 0.8535919189453125, 0.90594482421875, 0.9582977294921875, 1.010650634765625, 1.0630035400390625, 1.1153564453125, 1.1677093505859375, 1.220062255859375, 1.2724151611328125, 1.32476806640625, 1.3771209716796875, 1.429473876953125, 1.4818267822265625, 1.5341796875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 1.0, 5.0, 5.0, 16.0, 13.0, 14.0, 10.0, 27.0, 30.0, 37.0, 42.0, 71.0, 83.0, 85.0, 86.0, 81.0, 82.0, 68.0, 64.0, 46.0, 34.0, 26.0, 27.0, 11.0, 14.0, 10.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66455078125, -0.6459121704101562, -0.6272735595703125, -0.6086349487304688, -0.589996337890625, -0.5713577270507812, -0.5527191162109375, -0.5340805053710938, -0.51544189453125, -0.49680328369140625, -0.4781646728515625, -0.45952606201171875, -0.440887451171875, -0.42224884033203125, -0.4036102294921875, -0.38497161865234375, -0.3663330078125, -0.34769439697265625, -0.3290557861328125, -0.31041717529296875, -0.291778564453125, -0.27313995361328125, -0.2545013427734375, -0.23586273193359375, -0.21722412109375, -0.19858551025390625, -0.1799468994140625, -0.16130828857421875, -0.142669677734375, -0.12403106689453125, -0.1053924560546875, -0.08675384521484375, -0.068115234375, -0.04947662353515625, -0.0308380126953125, -0.01219940185546875, 0.006439208984375, 0.02507781982421875, 0.0437164306640625, 0.06235504150390625, 0.08099365234375, 0.09963226318359375, 0.1182708740234375, 0.13690948486328125, 0.155548095703125, 0.17418670654296875, 0.1928253173828125, 0.21146392822265625, 0.2301025390625, 0.24874114990234375, 0.2673797607421875, 0.28601837158203125, 0.304656982421875, 0.32329559326171875, 0.3419342041015625, 0.36057281494140625, 0.37921142578125, 0.39785003662109375, 0.4164886474609375, 0.43512725830078125, 0.453765869140625, 0.47240447998046875, 0.4910430908203125, 0.5096817016601562, 0.5283203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 14.0, 17.0, 15.0, 22.0, 40.0, 56.0, 113.0, 179.0, 303.0, 607.0, 1521.0, 5922.0, 107157.0, 886234.0, 40057.0, 3891.0, 1208.0, 518.0, 253.0, 142.0, 93.0, 51.0, 46.0, 29.0, 21.0, 11.0, 8.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.033203125, -2.9449462890625, -2.856689453125, -2.7684326171875, -2.68017578125, -2.5919189453125, -2.503662109375, -2.4154052734375, -2.3271484375, -2.2388916015625, -2.150634765625, -2.0623779296875, -1.97412109375, -1.8858642578125, -1.797607421875, -1.7093505859375, -1.62109375, -1.5328369140625, -1.444580078125, -1.3563232421875, -1.26806640625, -1.1798095703125, -1.091552734375, -1.0032958984375, -0.9150390625, -0.8267822265625, -0.738525390625, -0.6502685546875, -0.56201171875, -0.4737548828125, -0.385498046875, -0.2972412109375, -0.208984375, -0.1207275390625, -0.032470703125, 0.0557861328125, 0.14404296875, 0.2322998046875, 0.320556640625, 0.4088134765625, 0.4970703125, 0.5853271484375, 0.673583984375, 0.7618408203125, 0.85009765625, 0.9383544921875, 1.026611328125, 1.1148681640625, 1.203125, 1.2913818359375, 1.379638671875, 1.4678955078125, 1.55615234375, 1.6444091796875, 1.732666015625, 1.8209228515625, 1.9091796875, 1.9974365234375, 2.085693359375, 2.1739501953125, 2.26220703125, 2.3504638671875, 2.438720703125, 2.5269775390625, 2.615234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 15.0, 15.0, 20.0, 19.0, 15.0, 33.0, 49.0, 50.0, 52.0, 56.0, 50.0, 46.0, 63.0, 76.0, 68.0, 50.0, 52.0, 50.0, 49.0, 34.0, 21.0, 34.0, 21.0, 14.0, 13.0, 12.0, 5.0, 7.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.88671875, -2.796661376953125, -2.70660400390625, -2.616546630859375, -2.5264892578125, -2.436431884765625, -2.34637451171875, -2.256317138671875, -2.166259765625, -2.076202392578125, -1.98614501953125, -1.896087646484375, -1.8060302734375, -1.715972900390625, -1.62591552734375, -1.535858154296875, -1.44580078125, -1.355743408203125, -1.26568603515625, -1.175628662109375, -1.0855712890625, -0.995513916015625, -0.90545654296875, -0.815399169921875, -0.725341796875, -0.635284423828125, -0.54522705078125, -0.455169677734375, -0.3651123046875, -0.275054931640625, -0.18499755859375, -0.094940185546875, -0.0048828125, 0.085174560546875, 0.17523193359375, 0.265289306640625, 0.3553466796875, 0.445404052734375, 0.53546142578125, 0.625518798828125, 0.715576171875, 0.805633544921875, 0.89569091796875, 0.985748291015625, 1.0758056640625, 1.165863037109375, 1.25592041015625, 1.345977783203125, 1.43603515625, 1.526092529296875, 1.61614990234375, 1.706207275390625, 1.7962646484375, 1.886322021484375, 1.97637939453125, 2.066436767578125, 2.156494140625, 2.246551513671875, 2.33660888671875, 2.426666259765625, 2.5167236328125, 2.606781005859375, 2.69683837890625, 2.786895751953125, 2.876953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 4.0, 11.0, 19.0, 15.0, 22.0, 37.0, 53.0, 120.0, 190.0, 403.0, 1028.0, 4065.0, 47713.0, 918499.0, 69311.0, 4876.0, 1205.0, 430.0, 234.0, 107.0, 67.0, 37.0, 25.0, 15.0, 13.0, 11.0, 9.0, 7.0, 4.0, 5.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5615234375, -1.5086822509765625, -1.455841064453125, -1.4029998779296875, -1.35015869140625, -1.2973175048828125, -1.244476318359375, -1.1916351318359375, -1.1387939453125, -1.0859527587890625, -1.033111572265625, -0.9802703857421875, -0.92742919921875, -0.8745880126953125, -0.821746826171875, -0.7689056396484375, -0.716064453125, -0.6632232666015625, -0.610382080078125, -0.5575408935546875, -0.50469970703125, -0.4518585205078125, -0.399017333984375, -0.3461761474609375, -0.2933349609375, -0.2404937744140625, -0.187652587890625, -0.1348114013671875, -0.08197021484375, -0.0291290283203125, 0.023712158203125, 0.0765533447265625, 0.12939453125, 0.1822357177734375, 0.235076904296875, 0.2879180908203125, 0.34075927734375, 0.3936004638671875, 0.446441650390625, 0.4992828369140625, 0.5521240234375, 0.6049652099609375, 0.657806396484375, 0.7106475830078125, 0.76348876953125, 0.8163299560546875, 0.869171142578125, 0.9220123291015625, 0.974853515625, 1.0276947021484375, 1.080535888671875, 1.1333770751953125, 1.18621826171875, 1.2390594482421875, 1.291900634765625, 1.3447418212890625, 1.3975830078125, 1.4504241943359375, 1.503265380859375, 1.5561065673828125, 1.60894775390625, 1.6617889404296875, 1.714630126953125, 1.7674713134765625, 1.8203125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 7.0, 4.0, 11.0, 13.0, 21.0, 32.0, 44.0, 49.0, 63.0, 76.0, 106.0, 112.0, 116.0, 83.0, 69.0, 41.0, 40.0, 31.0, 34.0, 9.0, 9.0, 7.0, 6.0, 6.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010001659393310547, -9.610876441001892e-05, -9.220093488693237e-05, -8.829310536384583e-05, -8.438527584075928e-05, -8.047744631767273e-05, -7.656961679458618e-05, -7.266178727149963e-05, -6.875395774841309e-05, -6.484612822532654e-05, -6.093829870223999e-05, -5.703046917915344e-05, -5.3122639656066895e-05, -4.921481013298035e-05, -4.53069806098938e-05, -4.139915108680725e-05, -3.74913215637207e-05, -3.3583492040634155e-05, -2.9675662517547607e-05, -2.576783299446106e-05, -2.1860003471374512e-05, -1.7952173948287964e-05, -1.4044344425201416e-05, -1.0136514902114868e-05, -6.22868537902832e-06, -2.3208558559417725e-06, 1.5869736671447754e-06, 5.494803190231323e-06, 9.402632713317871e-06, 1.3310462236404419e-05, 1.7218291759490967e-05, 2.1126121282577515e-05, 2.5033950805664062e-05, 2.894178032875061e-05, 3.284960985183716e-05, 3.6757439374923706e-05, 4.0665268898010254e-05, 4.45730984210968e-05, 4.848092794418335e-05, 5.23887574672699e-05, 5.6296586990356445e-05, 6.020441651344299e-05, 6.411224603652954e-05, 6.802007555961609e-05, 7.192790508270264e-05, 7.583573460578918e-05, 7.974356412887573e-05, 8.365139365196228e-05, 8.755922317504883e-05, 9.146705269813538e-05, 9.537488222122192e-05, 9.928271174430847e-05, 0.00010319054126739502, 0.00010709837079048157, 0.00011100620031356812, 0.00011491402983665466, 0.00011882185935974121, 0.00012272968888282776, 0.0001266375184059143, 0.00013054534792900085, 0.0001344531774520874, 0.00013836100697517395, 0.0001422688364982605, 0.00014617666602134705, 0.0001500844955444336]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 11.0, 13.0, 20.0, 34.0, 59.0, 89.0, 187.0, 412.0, 1037.0, 3604.0, 25811.0, 827105.0, 178200.0, 8739.0, 1920.0, 683.0, 286.0, 136.0, 73.0, 38.0, 24.0, 13.0, 20.0, 9.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.578125, -1.5232696533203125, -1.468414306640625, -1.4135589599609375, -1.35870361328125, -1.3038482666015625, -1.248992919921875, -1.1941375732421875, -1.1392822265625, -1.0844268798828125, -1.029571533203125, -0.9747161865234375, -0.91986083984375, -0.8650054931640625, -0.810150146484375, -0.7552947998046875, -0.700439453125, -0.6455841064453125, -0.590728759765625, -0.5358734130859375, -0.48101806640625, -0.4261627197265625, -0.371307373046875, -0.3164520263671875, -0.2615966796875, -0.2067413330078125, -0.151885986328125, -0.0970306396484375, -0.04217529296875, 0.0126800537109375, 0.067535400390625, 0.1223907470703125, 0.17724609375, 0.2321014404296875, 0.286956787109375, 0.3418121337890625, 0.39666748046875, 0.4515228271484375, 0.506378173828125, 0.5612335205078125, 0.6160888671875, 0.6709442138671875, 0.725799560546875, 0.7806549072265625, 0.83551025390625, 0.8903656005859375, 0.945220947265625, 1.0000762939453125, 1.054931640625, 1.1097869873046875, 1.164642333984375, 1.2194976806640625, 1.27435302734375, 1.3292083740234375, 1.384063720703125, 1.4389190673828125, 1.4937744140625, 1.5486297607421875, 1.603485107421875, 1.6583404541015625, 1.71319580078125, 1.7680511474609375, 1.822906494140625, 1.8777618408203125, 1.9326171875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 9.0, 15.0, 12.0, 34.0, 48.0, 70.0, 110.0, 137.0, 141.0, 106.0, 93.0, 70.0, 70.0, 33.0, 16.0, 8.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2705078125, -1.225677490234375, -1.18084716796875, -1.136016845703125, -1.0911865234375, -1.046356201171875, -1.00152587890625, -0.956695556640625, -0.911865234375, -0.867034912109375, -0.82220458984375, -0.777374267578125, -0.7325439453125, -0.687713623046875, -0.64288330078125, -0.598052978515625, -0.55322265625, -0.508392333984375, -0.46356201171875, -0.418731689453125, -0.3739013671875, -0.329071044921875, -0.28424072265625, -0.239410400390625, -0.194580078125, -0.149749755859375, -0.10491943359375, -0.060089111328125, -0.0152587890625, 0.029571533203125, 0.07440185546875, 0.119232177734375, 0.1640625, 0.208892822265625, 0.25372314453125, 0.298553466796875, 0.3433837890625, 0.388214111328125, 0.43304443359375, 0.477874755859375, 0.522705078125, 0.567535400390625, 0.61236572265625, 0.657196044921875, 0.7020263671875, 0.746856689453125, 0.79168701171875, 0.836517333984375, 0.88134765625, 0.926177978515625, 0.97100830078125, 1.015838623046875, 1.0606689453125, 1.105499267578125, 1.15032958984375, 1.195159912109375, 1.239990234375, 1.284820556640625, 1.32965087890625, 1.374481201171875, 1.4193115234375, 1.464141845703125, 1.50897216796875, 1.553802490234375, 1.5986328125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [4.0, 3.0, 9.0, 86.0, 364.0, 400.0, 115.0, 21.0, 4.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.907175064086914, -5.5349040031433105, -4.162632942199707, -2.7903618812561035, -1.4180908203125, -0.045819759368896484, 1.326451301574707, 2.6987228393554688, 4.070993423461914, 5.443264484405518, 6.815535545349121, 8.187807083129883, 9.560077667236328, 10.932348251342773, 12.304619789123535, 13.676891326904297, 15.049161911010742, 16.421432495117188, 17.793704986572266, 19.16597557067871, 20.538246154785156, 21.9105167388916, 23.282787322998047, 24.655059814453125, 26.02733039855957, 27.399600982666016, 28.771873474121094, 30.14414405822754, 31.516414642333984, 32.88868713378906, 34.260955810546875, 35.63322830200195, 37.00550079345703, 38.37777328491211, 39.75004196166992, 41.122314453125, 42.49458312988281, 43.86685562133789, 45.23912811279297, 46.61139678955078, 47.98366928100586, 49.35594177246094, 50.72821044921875, 52.10048294067383, 53.472755432128906, 54.84502410888672, 56.2172966003418, 57.589569091796875, 58.96183776855469, 60.334110260009766, 61.70637893676758, 63.078651428222656, 64.45092010498047, 65.82319641113281, 67.19546508789062, 68.56773376464844, 69.94000244140625, 71.31227111816406, 72.6845474243164, 74.05681610107422, 75.42908477783203, 76.80136108398438, 78.17362976074219, 79.5458984375, 80.91817474365234]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 7.0, 8.0, 10.0, 18.0, 19.0, 13.0, 29.0, 28.0, 33.0, 27.0, 39.0, 41.0, 45.0, 41.0, 54.0, 36.0, 53.0, 47.0, 49.0, 51.0, 43.0, 34.0, 31.0, 38.0, 31.0, 35.0, 20.0, 14.0, 18.0, 16.0, 11.0, 12.0, 15.0, 8.0, 4.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.314973831176758, -8.042481422424316, -7.769989967346191, -7.49749755859375, -7.225005626678467, -6.952513694763184, -6.680021286010742, -6.407529354095459, -6.135037422180176, -5.862545490264893, -5.590053558349609, -5.317561149597168, -5.045069217681885, -4.772577285766602, -4.50008487701416, -4.227592945098877, -3.9551010131835938, -3.6826090812683105, -3.4101169109344482, -3.137624740600586, -2.8651328086853027, -2.5926408767700195, -2.3201487064361572, -2.047656536102295, -1.7751646041870117, -1.502672553062439, -1.2301805019378662, -0.9576884508132935, -0.6851963996887207, -0.41270434856414795, -0.1402122974395752, 0.13227975368499756, 0.4047718048095703, 0.6772638559341431, 0.9497559070587158, 1.2222479581832886, 1.4947400093078613, 1.767232060432434, 2.039724111557007, 2.312216281890869, 2.5847082138061523, 2.8572001457214355, 3.129692316055298, 3.40218448638916, 3.6746764183044434, 3.9471683502197266, 4.219660758972168, 4.492152690887451, 4.764644622802734, 5.037136554718018, 5.309628486633301, 5.582120895385742, 5.854612827301025, 6.127104759216309, 6.39959716796875, 6.672089099884033, 6.944581031799316, 7.2170729637146, 7.489564895629883, 7.762057304382324, 8.034549713134766, 8.30704116821289, 8.579533576965332, 8.852025032043457, 9.124517440795898]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 9.0, 5.0, 5.0, 6.0, 16.0, 42.0, 85.0, 149.0, 351.0, 977.0, 4549.0, 77850.0, 4081546.0, 24864.0, 2655.0, 640.0, 252.0, 129.0, 84.0, 25.0, 21.0, 11.0, 5.0, 2.0, 6.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.322265625, -2.213470458984375, -2.10467529296875, -1.995880126953125, -1.8870849609375, -1.778289794921875, -1.66949462890625, -1.560699462890625, -1.451904296875, -1.343109130859375, -1.23431396484375, -1.125518798828125, -1.0167236328125, -0.907928466796875, -0.79913330078125, -0.690338134765625, -0.58154296875, -0.472747802734375, -0.36395263671875, -0.255157470703125, -0.1463623046875, -0.037567138671875, 0.07122802734375, 0.180023193359375, 0.288818359375, 0.397613525390625, 0.50640869140625, 0.615203857421875, 0.7239990234375, 0.832794189453125, 0.94158935546875, 1.050384521484375, 1.1591796875, 1.267974853515625, 1.37677001953125, 1.485565185546875, 1.5943603515625, 1.703155517578125, 1.81195068359375, 1.920745849609375, 2.029541015625, 2.138336181640625, 2.24713134765625, 2.355926513671875, 2.4647216796875, 2.573516845703125, 2.68231201171875, 2.791107177734375, 2.89990234375, 3.008697509765625, 3.11749267578125, 3.226287841796875, 3.3350830078125, 3.443878173828125, 3.55267333984375, 3.661468505859375, 3.770263671875, 3.879058837890625, 3.98785400390625, 4.096649169921875, 4.2054443359375, 4.314239501953125, 4.42303466796875, 4.531829833984375, 4.640625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 9.0, 11.0, 18.0, 10.0, 8.0, 33.0, 55.0, 60.0, 82.0, 123.0, 103.0, 107.0, 97.0, 89.0, 52.0, 44.0, 32.0, 20.0, 14.0, 7.0, 8.0, 4.0, 12.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9404296875, -0.9162673950195312, -0.8921051025390625, -0.8679428100585938, -0.843780517578125, -0.8196182250976562, -0.7954559326171875, -0.7712936401367188, -0.74713134765625, -0.7229690551757812, -0.6988067626953125, -0.6746444702148438, -0.650482177734375, -0.6263198852539062, -0.6021575927734375, -0.5779953002929688, -0.5538330078125, -0.5296707153320312, -0.5055084228515625, -0.48134613037109375, -0.457183837890625, -0.43302154541015625, -0.4088592529296875, -0.38469696044921875, -0.36053466796875, -0.33637237548828125, -0.3122100830078125, -0.28804779052734375, -0.263885498046875, -0.23972320556640625, -0.2155609130859375, -0.19139862060546875, -0.167236328125, -0.14307403564453125, -0.1189117431640625, -0.09474945068359375, -0.070587158203125, -0.04642486572265625, -0.0222625732421875, 0.00189971923828125, 0.02606201171875, 0.05022430419921875, 0.0743865966796875, 0.09854888916015625, 0.122711181640625, 0.14687347412109375, 0.1710357666015625, 0.19519805908203125, 0.2193603515625, 0.24352264404296875, 0.2676849365234375, 0.29184722900390625, 0.316009521484375, 0.34017181396484375, 0.3643341064453125, 0.38849639892578125, 0.41265869140625, 0.43682098388671875, 0.4609832763671875, 0.48514556884765625, 0.509307861328125, 0.5334701538085938, 0.5576324462890625, 0.5817947387695312, 0.60595703125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 5.0, 7.0, 12.0, 19.0, 19.0, 26.0, 51.0, 54.0, 102.0, 139.0, 232.0, 384.0, 670.0, 1123.0, 2284.0, 5189.0, 13064.0, 41481.0, 212586.0, 3572672.0, 270757.0, 47754.0, 14437.0, 5668.0, 2470.0, 1253.0, 666.0, 398.0, 277.0, 154.0, 105.0, 68.0, 44.0, 41.0, 15.0, 14.0, 4.0, 18.0, 3.0, 2.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.98681640625, -0.9555435180664062, -0.9242706298828125, -0.8929977416992188, -0.861724853515625, -0.8304519653320312, -0.7991790771484375, -0.7679061889648438, -0.73663330078125, -0.7053604125976562, -0.6740875244140625, -0.6428146362304688, -0.611541748046875, -0.5802688598632812, -0.5489959716796875, -0.5177230834960938, -0.4864501953125, -0.45517730712890625, -0.4239044189453125, -0.39263153076171875, -0.361358642578125, -0.33008575439453125, -0.2988128662109375, -0.26753997802734375, -0.23626708984375, -0.20499420166015625, -0.1737213134765625, -0.14244842529296875, -0.111175537109375, -0.07990264892578125, -0.0486297607421875, -0.01735687255859375, 0.013916015625, 0.04518890380859375, 0.0764617919921875, 0.10773468017578125, 0.139007568359375, 0.17028045654296875, 0.2015533447265625, 0.23282623291015625, 0.26409912109375, 0.29537200927734375, 0.3266448974609375, 0.35791778564453125, 0.389190673828125, 0.42046356201171875, 0.4517364501953125, 0.48300933837890625, 0.5142822265625, 0.5455551147460938, 0.5768280029296875, 0.6081008911132812, 0.639373779296875, 0.6706466674804688, 0.7019195556640625, 0.7331924438476562, 0.76446533203125, 0.7957382202148438, 0.8270111083984375, 0.8582839965820312, 0.889556884765625, 0.9208297729492188, 0.9521026611328125, 0.9833755493164062, 1.0146484375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 7.0, 5.0, 4.0, 8.0, 10.0, 22.0, 25.0, 44.0, 50.0, 82.0, 138.0, 217.0, 612.0, 2102.0, 291.0, 171.0, 98.0, 58.0, 37.0, 21.0, 20.0, 17.0, 7.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.37060546875, -0.3559112548828125, -0.341217041015625, -0.3265228271484375, -0.31182861328125, -0.2971343994140625, -0.282440185546875, -0.2677459716796875, -0.2530517578125, -0.2383575439453125, -0.223663330078125, -0.2089691162109375, -0.19427490234375, -0.1795806884765625, -0.164886474609375, -0.1501922607421875, -0.135498046875, -0.1208038330078125, -0.106109619140625, -0.0914154052734375, -0.07672119140625, -0.0620269775390625, -0.047332763671875, -0.0326385498046875, -0.0179443359375, -0.0032501220703125, 0.011444091796875, 0.0261383056640625, 0.04083251953125, 0.0555267333984375, 0.070220947265625, 0.0849151611328125, 0.099609375, 0.1143035888671875, 0.128997802734375, 0.1436920166015625, 0.15838623046875, 0.1730804443359375, 0.187774658203125, 0.2024688720703125, 0.2171630859375, 0.2318572998046875, 0.246551513671875, 0.2612457275390625, 0.27593994140625, 0.2906341552734375, 0.305328369140625, 0.3200225830078125, 0.334716796875, 0.3494110107421875, 0.364105224609375, 0.3787994384765625, 0.39349365234375, 0.4081878662109375, 0.422882080078125, 0.4375762939453125, 0.4522705078125, 0.4669647216796875, 0.481658935546875, 0.4963531494140625, 0.51104736328125, 0.5257415771484375, 0.540435791015625, 0.5551300048828125, 0.56982421875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 12.0, 21.0, 22.0, 54.0, 92.0, 128.0, 161.0, 163.0, 156.0, 89.0, 35.0, 21.0, 15.0, 12.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.486344337463379, -4.369661808013916, -4.252979278564453, -4.136297225952148, -4.0196146965026855, -3.9029321670532227, -3.7862496376037598, -3.669567346572876, -3.552884817123413, -3.43620228767395, -3.3195199966430664, -3.2028374671936035, -3.0861551761627197, -2.969472646713257, -2.852790355682373, -2.73610782623291, -2.6194252967834473, -2.5027427673339844, -2.3860604763031006, -2.2693779468536377, -2.152695655822754, -2.036013126373291, -1.9193307161331177, -1.8026483058929443, -1.6859660148620605, -1.5692836046218872, -1.4526011943817139, -1.335918664932251, -1.2192362546920776, -1.1025538444519043, -0.985871434211731, -0.8691889643669128, -0.7525064945220947, -0.6358240842819214, -0.5191416144371033, -0.40245920419692993, -0.2857767641544342, -0.16909432411193848, -0.05241191387176514, 0.06427055597305298, 0.18095296621322632, 0.29763540625572205, 0.4143178462982178, 0.5310002565383911, 0.6476826667785645, 0.7643651366233826, 0.8810475468635559, 0.997730016708374, 1.1144124269485474, 1.2310948371887207, 1.347777247428894, 1.4644596576690674, 1.5811421871185303, 1.6978245973587036, 1.814507007598877, 1.9311895370483398, 2.0478718280792236, 2.1645543575286865, 2.2812366485595703, 2.397919178009033, 2.514601469039917, 2.63128399848938, 2.7479662895202637, 2.8646488189697266, 2.9813313484191895]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 10.0, 5.0, 7.0, 5.0, 11.0, 9.0, 19.0, 14.0, 21.0, 12.0, 40.0, 32.0, 42.0, 32.0, 36.0, 48.0, 51.0, 49.0, 40.0, 43.0, 44.0, 47.0, 46.0, 39.0, 32.0, 34.0, 36.0, 42.0, 30.0, 32.0, 15.0, 14.0, 11.0, 11.0, 9.0, 4.0, 6.0, 9.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.395074486732483, -1.343608021736145, -1.2921415567398071, -1.2406750917434692, -1.189208745956421, -1.137742280960083, -1.0862758159637451, -1.0348093509674072, -0.9833428859710693, -0.9318764209747314, -0.8804099559783936, -0.8289435505867004, -0.7774770855903625, -0.7260106205940247, -0.6745442152023315, -0.6230777502059937, -0.5716112852096558, -0.5201448202133179, -0.46867838501930237, -0.41721194982528687, -0.365745484828949, -0.3142790198326111, -0.2628125846385956, -0.21134614944458008, -0.1598796844482422, -0.10841323435306549, -0.056946784257888794, -0.005480334162712097, 0.0459861159324646, 0.09745258092880249, 0.148919016122818, 0.2003854513168335, 0.25185203552246094, 0.30331850051879883, 0.35478493571281433, 0.40625137090682983, 0.4577178359031677, 0.5091843008995056, 0.5606507062911987, 0.6121171712875366, 0.6635836362838745, 0.7150501012802124, 0.7665165662765503, 0.8179829716682434, 0.8694494366645813, 0.9209159016609192, 0.9723823070526123, 1.0238487720489502, 1.075315237045288, 1.126781702041626, 1.1782481670379639, 1.2297146320343018, 1.2811810970306396, 1.3326475620269775, 1.3841139078140259, 1.4355803728103638, 1.4870468378067017, 1.5385133028030396, 1.5899797677993774, 1.6414462327957153, 1.6929125785827637, 1.7443790435791016, 1.7958455085754395, 1.8473119735717773, 1.8987784385681152]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 4.0, 12.0, 9.0, 10.0, 22.0, 19.0, 40.0, 81.0, 130.0, 244.0, 450.0, 1121.0, 2885.0, 9750.0, 43321.0, 246839.0, 578945.0, 130105.0, 24620.0, 6227.0, 2072.0, 803.0, 363.0, 210.0, 95.0, 70.0, 38.0, 25.0, 14.0, 12.0, 7.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.80859375, -1.7613983154296875, -1.714202880859375, -1.6670074462890625, -1.61981201171875, -1.5726165771484375, -1.525421142578125, -1.4782257080078125, -1.4310302734375, -1.3838348388671875, -1.336639404296875, -1.2894439697265625, -1.24224853515625, -1.1950531005859375, -1.147857666015625, -1.1006622314453125, -1.053466796875, -1.0062713623046875, -0.959075927734375, -0.9118804931640625, -0.86468505859375, -0.8174896240234375, -0.770294189453125, -0.7230987548828125, -0.6759033203125, -0.6287078857421875, -0.581512451171875, -0.5343170166015625, -0.48712158203125, -0.4399261474609375, -0.392730712890625, -0.3455352783203125, -0.29833984375, -0.2511444091796875, -0.203948974609375, -0.1567535400390625, -0.10955810546875, -0.0623626708984375, -0.015167236328125, 0.0320281982421875, 0.0792236328125, 0.1264190673828125, 0.173614501953125, 0.2208099365234375, 0.26800537109375, 0.3152008056640625, 0.362396240234375, 0.4095916748046875, 0.456787109375, 0.5039825439453125, 0.551177978515625, 0.5983734130859375, 0.64556884765625, 0.6927642822265625, 0.739959716796875, 0.7871551513671875, 0.8343505859375, 0.8815460205078125, 0.928741455078125, 0.9759368896484375, 1.02313232421875, 1.0703277587890625, 1.117523193359375, 1.1647186279296875, 1.2119140625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 10.0, 3.0, 2.0, 8.0, 13.0, 15.0, 20.0, 25.0, 45.0, 49.0, 63.0, 73.0, 79.0, 91.0, 96.0, 83.0, 89.0, 69.0, 43.0, 32.0, 19.0, 24.0, 16.0, 13.0, 9.0, 10.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.84228515625, -0.82122802734375, -0.8001708984375, -0.77911376953125, -0.758056640625, -0.73699951171875, -0.7159423828125, -0.69488525390625, -0.673828125, -0.65277099609375, -0.6317138671875, -0.61065673828125, -0.589599609375, -0.56854248046875, -0.5474853515625, -0.52642822265625, -0.50537109375, -0.48431396484375, -0.4632568359375, -0.44219970703125, -0.421142578125, -0.40008544921875, -0.3790283203125, -0.35797119140625, -0.3369140625, -0.31585693359375, -0.2947998046875, -0.27374267578125, -0.252685546875, -0.23162841796875, -0.2105712890625, -0.18951416015625, -0.16845703125, -0.14739990234375, -0.1263427734375, -0.10528564453125, -0.084228515625, -0.06317138671875, -0.0421142578125, -0.02105712890625, 0.0, 0.02105712890625, 0.0421142578125, 0.06317138671875, 0.084228515625, 0.10528564453125, 0.1263427734375, 0.14739990234375, 0.16845703125, 0.18951416015625, 0.2105712890625, 0.23162841796875, 0.252685546875, 0.27374267578125, 0.2947998046875, 0.31585693359375, 0.3369140625, 0.35797119140625, 0.3790283203125, 0.40008544921875, 0.421142578125, 0.44219970703125, 0.4632568359375, 0.48431396484375, 0.50537109375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 8.0, 3.0, 6.0, 7.0, 10.0, 11.0, 27.0, 23.0, 33.0, 55.0, 86.0, 117.0, 183.0, 246.0, 402.0, 850.0, 2090.0, 7330.0, 60843.0, 777041.0, 179297.0, 14177.0, 3034.0, 1152.0, 590.0, 344.0, 167.0, 133.0, 93.0, 65.0, 20.0, 28.0, 22.0, 19.0, 8.0, 8.0, 5.0, 5.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.244140625, -2.17547607421875, -2.1068115234375, -2.03814697265625, -1.969482421875, -1.90081787109375, -1.8321533203125, -1.76348876953125, -1.69482421875, -1.62615966796875, -1.5574951171875, -1.48883056640625, -1.420166015625, -1.35150146484375, -1.2828369140625, -1.21417236328125, -1.1455078125, -1.07684326171875, -1.0081787109375, -0.93951416015625, -0.870849609375, -0.80218505859375, -0.7335205078125, -0.66485595703125, -0.59619140625, -0.52752685546875, -0.4588623046875, -0.39019775390625, -0.321533203125, -0.25286865234375, -0.1842041015625, -0.11553955078125, -0.046875, 0.02178955078125, 0.0904541015625, 0.15911865234375, 0.227783203125, 0.29644775390625, 0.3651123046875, 0.43377685546875, 0.50244140625, 0.57110595703125, 0.6397705078125, 0.70843505859375, 0.777099609375, 0.84576416015625, 0.9144287109375, 0.98309326171875, 1.0517578125, 1.12042236328125, 1.1890869140625, 1.25775146484375, 1.326416015625, 1.39508056640625, 1.4637451171875, 1.53240966796875, 1.60107421875, 1.66973876953125, 1.7384033203125, 1.80706787109375, 1.875732421875, 1.94439697265625, 2.0130615234375, 2.08172607421875, 2.150390625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 4.0, 6.0, 10.0, 12.0, 11.0, 11.0, 16.0, 22.0, 16.0, 28.0, 26.0, 35.0, 38.0, 36.0, 42.0, 48.0, 48.0, 57.0, 38.0, 57.0, 65.0, 39.0, 48.0, 45.0, 46.0, 35.0, 26.0, 23.0, 13.0, 19.0, 14.0, 12.0, 8.0, 11.0, 5.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.89453125, -1.8339080810546875, -1.773284912109375, -1.7126617431640625, -1.65203857421875, -1.5914154052734375, -1.530792236328125, -1.4701690673828125, -1.4095458984375, -1.3489227294921875, -1.288299560546875, -1.2276763916015625, -1.16705322265625, -1.1064300537109375, -1.045806884765625, -0.9851837158203125, -0.924560546875, -0.8639373779296875, -0.803314208984375, -0.7426910400390625, -0.68206787109375, -0.6214447021484375, -0.560821533203125, -0.5001983642578125, -0.4395751953125, -0.3789520263671875, -0.318328857421875, -0.2577056884765625, -0.19708251953125, -0.1364593505859375, -0.075836181640625, -0.0152130126953125, 0.04541015625, 0.1060333251953125, 0.166656494140625, 0.2272796630859375, 0.28790283203125, 0.3485260009765625, 0.409149169921875, 0.4697723388671875, 0.5303955078125, 0.5910186767578125, 0.651641845703125, 0.7122650146484375, 0.77288818359375, 0.8335113525390625, 0.894134521484375, 0.9547576904296875, 1.015380859375, 1.0760040283203125, 1.136627197265625, 1.1972503662109375, 1.25787353515625, 1.3184967041015625, 1.379119873046875, 1.4397430419921875, 1.5003662109375, 1.5609893798828125, 1.621612548828125, 1.6822357177734375, 1.74285888671875, 1.8034820556640625, 1.864105224609375, 1.9247283935546875, 1.9853515625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 8.0, 7.0, 17.0, 15.0, 27.0, 56.0, 129.0, 277.0, 753.0, 3022.0, 26744.0, 809715.0, 196744.0, 8667.0, 1529.0, 478.0, 168.0, 89.0, 54.0, 23.0, 14.0, 7.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1103515625, -1.07647705078125, -1.0426025390625, -1.00872802734375, -0.974853515625, -0.94097900390625, -0.9071044921875, -0.87322998046875, -0.83935546875, -0.80548095703125, -0.7716064453125, -0.73773193359375, -0.703857421875, -0.66998291015625, -0.6361083984375, -0.60223388671875, -0.568359375, -0.53448486328125, -0.5006103515625, -0.46673583984375, -0.432861328125, -0.39898681640625, -0.3651123046875, -0.33123779296875, -0.29736328125, -0.26348876953125, -0.2296142578125, -0.19573974609375, -0.161865234375, -0.12799072265625, -0.0941162109375, -0.06024169921875, -0.0263671875, 0.00750732421875, 0.0413818359375, 0.07525634765625, 0.109130859375, 0.14300537109375, 0.1768798828125, 0.21075439453125, 0.24462890625, 0.27850341796875, 0.3123779296875, 0.34625244140625, 0.380126953125, 0.41400146484375, 0.4478759765625, 0.48175048828125, 0.515625, 0.54949951171875, 0.5833740234375, 0.61724853515625, 0.651123046875, 0.68499755859375, 0.7188720703125, 0.75274658203125, 0.78662109375, 0.82049560546875, 0.8543701171875, 0.88824462890625, 0.922119140625, 0.95599365234375, 0.9898681640625, 1.02374267578125, 1.0576171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 0.0, 3.0, 8.0, 6.0, 6.0, 11.0, 12.0, 15.0, 14.0, 18.0, 24.0, 24.0, 22.0, 23.0, 47.0, 32.0, 43.0, 72.0, 96.0, 84.0, 89.0, 60.0, 45.0, 36.0, 32.0, 38.0, 23.0, 21.0, 18.0, 20.0, 15.0, 11.0, 11.0, 5.0, 1.0, 7.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.988380432128906e-05, -8.699577301740646e-05, -8.410774171352386e-05, -8.121971040964127e-05, -7.833167910575867e-05, -7.544364780187607e-05, -7.255561649799347e-05, -6.966758519411087e-05, -6.677955389022827e-05, -6.389152258634567e-05, -6.1003491282463074e-05, -5.8115459978580475e-05, -5.5227428674697876e-05, -5.233939737081528e-05, -4.945136606693268e-05, -4.656333476305008e-05, -4.367530345916748e-05, -4.078727215528488e-05, -3.789924085140228e-05, -3.5011209547519684e-05, -3.2123178243637085e-05, -2.9235146939754486e-05, -2.6347115635871887e-05, -2.345908433198929e-05, -2.057105302810669e-05, -1.768302172422409e-05, -1.4794990420341492e-05, -1.1906959116458893e-05, -9.018927812576294e-06, -6.130896508693695e-06, -3.242865204811096e-06, -3.548339009284973e-07, 2.5331974029541016e-06, 5.4212287068367004e-06, 8.3092600107193e-06, 1.1197291314601898e-05, 1.4085322618484497e-05, 1.6973353922367096e-05, 1.9861385226249695e-05, 2.2749416530132294e-05, 2.5637447834014893e-05, 2.852547913789749e-05, 3.141351044178009e-05, 3.430154174566269e-05, 3.718957304954529e-05, 4.007760435342789e-05, 4.2965635657310486e-05, 4.5853666961193085e-05, 4.8741698265075684e-05, 5.162972956895828e-05, 5.451776087284088e-05, 5.740579217672348e-05, 6.029382348060608e-05, 6.318185478448868e-05, 6.606988608837128e-05, 6.895791739225388e-05, 7.184594869613647e-05, 7.473398000001907e-05, 7.762201130390167e-05, 8.051004260778427e-05, 8.339807391166687e-05, 8.628610521554947e-05, 8.917413651943207e-05, 9.206216782331467e-05, 9.495019912719727e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 14.0, 15.0, 29.0, 47.0, 63.0, 110.0, 195.0, 436.0, 1005.0, 3326.0, 25459.0, 751939.0, 251046.0, 11279.0, 2137.0, 709.0, 333.0, 170.0, 99.0, 60.0, 30.0, 19.0, 14.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0771484375, -1.044342041015625, -1.01153564453125, -0.978729248046875, -0.9459228515625, -0.913116455078125, -0.88031005859375, -0.847503662109375, -0.814697265625, -0.781890869140625, -0.74908447265625, -0.716278076171875, -0.6834716796875, -0.650665283203125, -0.61785888671875, -0.585052490234375, -0.55224609375, -0.519439697265625, -0.48663330078125, -0.453826904296875, -0.4210205078125, -0.388214111328125, -0.35540771484375, -0.322601318359375, -0.289794921875, -0.256988525390625, -0.22418212890625, -0.191375732421875, -0.1585693359375, -0.125762939453125, -0.09295654296875, -0.060150146484375, -0.02734375, 0.005462646484375, 0.03826904296875, 0.071075439453125, 0.1038818359375, 0.136688232421875, 0.16949462890625, 0.202301025390625, 0.235107421875, 0.267913818359375, 0.30072021484375, 0.333526611328125, 0.3663330078125, 0.399139404296875, 0.43194580078125, 0.464752197265625, 0.49755859375, 0.530364990234375, 0.56317138671875, 0.595977783203125, 0.6287841796875, 0.661590576171875, 0.69439697265625, 0.727203369140625, 0.760009765625, 0.792816162109375, 0.82562255859375, 0.858428955078125, 0.8912353515625, 0.924041748046875, 0.95684814453125, 0.989654541015625, 1.0224609375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 6.0, 7.0, 7.0, 14.0, 23.0, 25.0, 30.0, 40.0, 73.0, 94.0, 110.0, 129.0, 116.0, 92.0, 82.0, 51.0, 25.0, 31.0, 14.0, 8.0, 11.0, 6.0, 4.0, 4.0, 4.0, 0.0, 3.0], "bins": [-1.158203125, -1.1342811584472656, -1.1103591918945312, -1.0864372253417969, -1.0625152587890625, -1.0385932922363281, -1.0146713256835938, -0.9907493591308594, -0.966827392578125, -0.9429054260253906, -0.9189834594726562, -0.8950614929199219, -0.8711395263671875, -0.8472175598144531, -0.8232955932617188, -0.7993736267089844, -0.77545166015625, -0.7515296936035156, -0.7276077270507812, -0.7036857604980469, -0.6797637939453125, -0.6558418273925781, -0.6319198608398438, -0.6079978942871094, -0.584075927734375, -0.5601539611816406, -0.5362319946289062, -0.5123100280761719, -0.4883880615234375, -0.4644660949707031, -0.44054412841796875, -0.4166221618652344, -0.3927001953125, -0.3687782287597656, -0.34485626220703125, -0.3209342956542969, -0.2970123291015625, -0.2730903625488281, -0.24916839599609375, -0.22524642944335938, -0.201324462890625, -0.17740249633789062, -0.15348052978515625, -0.12955856323242188, -0.1056365966796875, -0.08171463012695312, -0.05779266357421875, -0.033870697021484375, -0.00994873046875, 0.013973236083984375, 0.03789520263671875, 0.061817169189453125, 0.0857391357421875, 0.10966110229492188, 0.13358306884765625, 0.15750503540039062, 0.181427001953125, 0.20534896850585938, 0.22927093505859375, 0.2531929016113281, 0.2771148681640625, 0.3010368347167969, 0.32495880126953125, 0.3488807678222656, 0.372802734375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 23.0, 79.0, 227.0, 345.0, 215.0, 80.0, 20.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.49342918395996, -17.704021453857422, -16.914615631103516, -16.125207901000977, -15.335800170898438, -14.546393394470215, -13.756986618041992, -12.967578887939453, -12.17817211151123, -11.388765335083008, -10.599357604980469, -9.809950828552246, -9.020544052124023, -8.231136322021484, -7.441729545593262, -6.652322292327881, -5.8629150390625, -5.073507785797119, -4.284100532531738, -3.4946937561035156, -2.7052865028381348, -1.915879249572754, -1.1264724731445312, -0.3370652198791504, 0.45234203338623047, 1.2417491674423218, 2.031156301498413, 2.820563316345215, 3.6099705696105957, 4.399377822875977, 5.188784599304199, 5.97819185256958, 6.767601013183594, 7.557008266448975, 8.346415519714355, 9.135822296142578, 9.925230026245117, 10.71463680267334, 11.504043579101562, 12.293451309204102, 13.082858085632324, 13.872264862060547, 14.661672592163086, 15.451079368591309, 16.24048614501953, 17.02989387512207, 17.81930160522461, 18.608707427978516, 19.398115158081055, 20.187522888183594, 20.9769287109375, 21.76633644104004, 22.555744171142578, 23.345149993896484, 24.134557723999023, 24.923965454101562, 25.71337127685547, 26.502779006958008, 27.292184829711914, 28.081592559814453, 28.871000289916992, 29.66040802001953, 30.449813842773438, 31.239221572875977, 32.028629302978516]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 8.0, 7.0, 10.0, 5.0, 10.0, 12.0, 17.0, 22.0, 17.0, 27.0, 28.0, 34.0, 47.0, 49.0, 62.0, 45.0, 40.0, 56.0, 53.0, 60.0, 66.0, 51.0, 51.0, 32.0, 38.0, 34.0, 22.0, 12.0, 15.0, 14.0, 12.0, 15.0, 6.0, 7.0, 4.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.913366317749023, -9.619521141052246, -9.325675964355469, -9.031831741333008, -8.73798656463623, -8.444141387939453, -8.150296211242676, -7.856451511383057, -7.5626068115234375, -7.26876163482666, -6.974916934967041, -6.681071758270264, -6.3872270584106445, -6.093381881713867, -5.79953670501709, -5.505692005157471, -5.211846828460693, -4.918001651763916, -4.624156951904297, -4.3303117752075195, -4.0364670753479, -3.742621898651123, -3.448776960372925, -3.1549320220947266, -2.8610870838165283, -2.56724214553833, -2.273397207260132, -1.979552149772644, -1.6857072114944458, -1.3918622732162476, -1.0980172157287598, -0.8041722774505615, -0.5103273391723633, -0.21648237109184265, 0.07736259698867798, 0.371207594871521, 0.6650525331497192, 0.9588974714279175, 1.2527425289154053, 1.5465874671936035, 1.8404324054718018, 2.13427734375, 2.4281222820281982, 2.7219672203063965, 3.015812397003174, 3.309657096862793, 3.6035022735595703, 3.8973472118377686, 4.191192150115967, 4.485037326812744, 4.778882026672363, 5.072727203369141, 5.36657190322876, 5.660417079925537, 5.954261779785156, 6.248106956481934, 6.541952133178711, 6.835797309875488, 7.129642009735107, 7.423487186431885, 7.717331886291504, 8.011177062988281, 8.305022239685059, 8.598867416381836, 8.892711639404297]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 6.0, 9.0, 14.0, 17.0, 21.0, 36.0, 64.0, 102.0, 143.0, 223.0, 444.0, 880.0, 1813.0, 4411.0, 12963.0, 49672.0, 366633.0, 3251899.0, 428027.0, 55123.0, 13511.0, 4577.0, 1896.0, 781.0, 398.0, 244.0, 120.0, 73.0, 54.0, 27.0, 16.0, 18.0, 11.0, 12.0, 8.0, 5.0, 7.0, 6.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68359375, -0.6587600708007812, -0.6339263916015625, -0.6090927124023438, -0.584259033203125, -0.5594253540039062, -0.5345916748046875, -0.5097579956054688, -0.48492431640625, -0.46009063720703125, -0.4352569580078125, -0.41042327880859375, -0.385589599609375, -0.36075592041015625, -0.3359222412109375, -0.31108856201171875, -0.2862548828125, -0.26142120361328125, -0.2365875244140625, -0.21175384521484375, -0.186920166015625, -0.16208648681640625, -0.1372528076171875, -0.11241912841796875, -0.08758544921875, -0.06275177001953125, -0.0379180908203125, -0.01308441162109375, 0.011749267578125, 0.03658294677734375, 0.0614166259765625, 0.08625030517578125, 0.111083984375, 0.13591766357421875, 0.1607513427734375, 0.18558502197265625, 0.210418701171875, 0.23525238037109375, 0.2600860595703125, 0.28491973876953125, 0.30975341796875, 0.33458709716796875, 0.3594207763671875, 0.38425445556640625, 0.409088134765625, 0.43392181396484375, 0.4587554931640625, 0.48358917236328125, 0.5084228515625, 0.5332565307617188, 0.5580902099609375, 0.5829238891601562, 0.607757568359375, 0.6325912475585938, 0.6574249267578125, 0.6822586059570312, 0.70709228515625, 0.7319259643554688, 0.7567596435546875, 0.7815933227539062, 0.806427001953125, 0.8312606811523438, 0.8560943603515625, 0.8809280395507812, 0.90576171875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 4.0, 10.0, 9.0, 14.0, 16.0, 32.0, 29.0, 51.0, 68.0, 71.0, 76.0, 77.0, 127.0, 88.0, 68.0, 80.0, 47.0, 41.0, 27.0, 19.0, 22.0, 7.0, 8.0, 8.0, 0.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75830078125, -0.7393875122070312, -0.7204742431640625, -0.7015609741210938, -0.682647705078125, -0.6637344360351562, -0.6448211669921875, -0.6259078979492188, -0.60699462890625, -0.5880813598632812, -0.5691680908203125, -0.5502548217773438, -0.531341552734375, -0.5124282836914062, -0.4935150146484375, -0.47460174560546875, -0.4556884765625, -0.43677520751953125, -0.4178619384765625, -0.39894866943359375, -0.380035400390625, -0.36112213134765625, -0.3422088623046875, -0.32329559326171875, -0.30438232421875, -0.28546905517578125, -0.2665557861328125, -0.24764251708984375, -0.228729248046875, -0.20981597900390625, -0.1909027099609375, -0.17198944091796875, -0.153076171875, -0.13416290283203125, -0.1152496337890625, -0.09633636474609375, -0.077423095703125, -0.05850982666015625, -0.0395965576171875, -0.02068328857421875, -0.00177001953125, 0.01714324951171875, 0.0360565185546875, 0.05496978759765625, 0.073883056640625, 0.09279632568359375, 0.1117095947265625, 0.13062286376953125, 0.1495361328125, 0.16844940185546875, 0.1873626708984375, 0.20627593994140625, 0.225189208984375, 0.24410247802734375, 0.2630157470703125, 0.28192901611328125, 0.30084228515625, 0.31975555419921875, 0.3386688232421875, 0.35758209228515625, 0.376495361328125, 0.39540863037109375, 0.4143218994140625, 0.43323516845703125, 0.4521484375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 6.0, 12.0, 10.0, 15.0, 27.0, 25.0, 48.0, 57.0, 101.0, 148.0, 271.0, 464.0, 963.0, 1970.0, 4260.0, 10504.0, 30689.0, 135564.0, 1444999.0, 2310902.0, 191926.0, 39172.0, 12640.0, 4830.0, 2207.0, 1073.0, 577.0, 310.0, 185.0, 103.0, 80.0, 40.0, 31.0, 23.0, 12.0, 11.0, 6.0, 3.0, 5.0, 5.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.76220703125, -0.7410888671875, -0.719970703125, -0.6988525390625, -0.677734375, -0.6566162109375, -0.635498046875, -0.6143798828125, -0.59326171875, -0.5721435546875, -0.551025390625, -0.5299072265625, -0.5087890625, -0.4876708984375, -0.466552734375, -0.4454345703125, -0.42431640625, -0.4031982421875, -0.382080078125, -0.3609619140625, -0.33984375, -0.3187255859375, -0.297607421875, -0.2764892578125, -0.25537109375, -0.2342529296875, -0.213134765625, -0.1920166015625, -0.1708984375, -0.1497802734375, -0.128662109375, -0.1075439453125, -0.08642578125, -0.0653076171875, -0.044189453125, -0.0230712890625, -0.001953125, 0.0191650390625, 0.040283203125, 0.0614013671875, 0.08251953125, 0.1036376953125, 0.124755859375, 0.1458740234375, 0.1669921875, 0.1881103515625, 0.209228515625, 0.2303466796875, 0.25146484375, 0.2725830078125, 0.293701171875, 0.3148193359375, 0.3359375, 0.3570556640625, 0.378173828125, 0.3992919921875, 0.42041015625, 0.4415283203125, 0.462646484375, 0.4837646484375, 0.5048828125, 0.5260009765625, 0.547119140625, 0.5682373046875, 0.58935546875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 4.0, 2.0, 6.0, 9.0, 11.0, 18.0, 27.0, 32.0, 56.0, 126.0, 192.0, 367.0, 675.0, 967.0, 697.0, 349.0, 227.0, 118.0, 69.0, 27.0, 26.0, 15.0, 11.0, 9.0, 7.0, 9.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.037109375, -1.0042266845703125, -0.971343994140625, -0.9384613037109375, -0.90557861328125, -0.8726959228515625, -0.839813232421875, -0.8069305419921875, -0.7740478515625, -0.7411651611328125, -0.708282470703125, -0.6753997802734375, -0.64251708984375, -0.6096343994140625, -0.576751708984375, -0.5438690185546875, -0.510986328125, -0.4781036376953125, -0.445220947265625, -0.4123382568359375, -0.37945556640625, -0.3465728759765625, -0.313690185546875, -0.2808074951171875, -0.2479248046875, -0.2150421142578125, -0.182159423828125, -0.1492767333984375, -0.11639404296875, -0.0835113525390625, -0.050628662109375, -0.0177459716796875, 0.01513671875, 0.0480194091796875, 0.080902099609375, 0.1137847900390625, 0.14666748046875, 0.1795501708984375, 0.212432861328125, 0.2453155517578125, 0.2781982421875, 0.3110809326171875, 0.343963623046875, 0.3768463134765625, 0.40972900390625, 0.4426116943359375, 0.475494384765625, 0.5083770751953125, 0.541259765625, 0.5741424560546875, 0.607025146484375, 0.6399078369140625, 0.67279052734375, 0.7056732177734375, 0.738555908203125, 0.7714385986328125, 0.8043212890625, 0.8372039794921875, 0.870086669921875, 0.9029693603515625, 0.93585205078125, 0.9687347412109375, 1.001617431640625, 1.0345001220703125, 1.0673828125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 11.0, 3.0, 12.0, 25.0, 44.0, 92.0, 149.0, 208.0, 162.0, 129.0, 89.0, 36.0, 21.0, 9.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.519721984863281, -11.229414939880371, -10.939107894897461, -10.64880084991455, -10.35849380493164, -10.06818675994873, -9.77787971496582, -9.48757266998291, -9.197265625, -8.90695858001709, -8.61665153503418, -8.32634449005127, -8.03603744506836, -7.745730400085449, -7.455423355102539, -7.165116310119629, -6.874809741973877, -6.584502696990967, -6.294195652008057, -6.0038886070251465, -5.713581562042236, -5.423274517059326, -5.132967948913574, -4.842660903930664, -4.552353858947754, -4.262046813964844, -3.9717397689819336, -3.6814327239990234, -3.3911256790161133, -3.100818634033203, -2.810511827468872, -2.520204782485962, -2.2298970222473145, -1.9395899772644043, -1.6492829322814941, -1.3589760065078735, -1.0686689615249634, -0.7783619165420532, -0.4880549907684326, -0.19774794578552246, 0.0925590991973877, 0.38286611437797546, 0.6731731295585632, 0.9634801149368286, 1.2537871599197388, 1.544094204902649, 1.8344011306762695, 2.1247081756591797, 2.41501522064209, 2.705322265625, 2.99562931060791, 3.2859363555908203, 3.5762434005737305, 3.8665504455566406, 4.156857490539551, 4.447164535522461, 4.737471580505371, 5.027778625488281, 5.318085670471191, 5.608392715454102, 5.898699760437012, 6.189006805419922, 6.479313850402832, 6.769620895385742, 7.059927463531494]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 3.0, 5.0, 10.0, 14.0, 6.0, 11.0, 16.0, 19.0, 27.0, 25.0, 18.0, 26.0, 38.0, 38.0, 45.0, 43.0, 54.0, 48.0, 50.0, 53.0, 47.0, 47.0, 38.0, 39.0, 38.0, 35.0, 32.0, 31.0, 18.0, 20.0, 18.0, 16.0, 16.0, 9.0, 11.0, 14.0, 7.0, 3.0, 3.0, 2.0, 7.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-4.58216667175293, -4.451664924621582, -4.321163654327393, -4.190661907196045, -4.060160160064697, -3.9296586513519287, -3.79915714263916, -3.6686553955078125, -3.538153886795044, -3.4076523780822754, -3.2771506309509277, -3.146649122238159, -3.0161476135253906, -2.885645866394043, -2.7551443576812744, -2.624642848968506, -2.494141101837158, -2.3636395931243896, -2.233137845993042, -2.1026363372802734, -1.9721347093582153, -1.8416330814361572, -1.7111315727233887, -1.5806299448013306, -1.4501283168792725, -1.3196266889572144, -1.1891250610351562, -1.0586235523223877, -0.9281219244003296, -0.7976202964782715, -0.6671187281608582, -0.5366171598434448, -0.4061152935028076, -0.2756136953830719, -0.14511209726333618, -0.014610499143600464, 0.11589109897613525, 0.24639272689819336, 0.3768942952156067, 0.50739586353302, 0.6378974914550781, 0.7683991193771362, 0.8989006876945496, 1.029402256011963, 1.159903883934021, 1.290405511856079, 1.4209070205688477, 1.5514086484909058, 1.6819102764129639, 1.812411904335022, 1.94291353225708, 2.0734150409698486, 2.203916549682617, 2.334418296813965, 2.4649198055267334, 2.595421314239502, 2.7259230613708496, 2.856424570083618, 2.986926317214966, 3.1174278259277344, 3.247929573059082, 3.3784310817718506, 3.508932590484619, 3.639434337615967, 3.7699358463287354]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 0.0, 5.0, 4.0, 6.0, 10.0, 8.0, 15.0, 25.0, 48.0, 77.0, 114.0, 193.0, 364.0, 645.0, 1268.0, 2477.0, 5353.0, 13145.0, 39068.0, 145327.0, 481797.0, 259412.0, 64611.0, 20312.0, 7586.0, 3294.0, 1517.0, 804.0, 430.0, 240.0, 137.0, 88.0, 54.0, 42.0, 19.0, 17.0, 12.0, 12.0, 6.0, 6.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.861328125, -0.8323287963867188, -0.8033294677734375, -0.7743301391601562, -0.745330810546875, -0.7163314819335938, -0.6873321533203125, -0.6583328247070312, -0.62933349609375, -0.6003341674804688, -0.5713348388671875, -0.5423355102539062, -0.513336181640625, -0.48433685302734375, -0.4553375244140625, -0.42633819580078125, -0.3973388671875, -0.36833953857421875, -0.3393402099609375, -0.31034088134765625, -0.281341552734375, -0.25234222412109375, -0.2233428955078125, -0.19434356689453125, -0.16534423828125, -0.13634490966796875, -0.1073455810546875, -0.07834625244140625, -0.049346923828125, -0.02034759521484375, 0.0086517333984375, 0.03765106201171875, 0.066650390625, 0.09564971923828125, 0.1246490478515625, 0.15364837646484375, 0.182647705078125, 0.21164703369140625, 0.2406463623046875, 0.26964569091796875, 0.29864501953125, 0.32764434814453125, 0.3566436767578125, 0.38564300537109375, 0.414642333984375, 0.44364166259765625, 0.4726409912109375, 0.5016403198242188, 0.5306396484375, 0.5596389770507812, 0.5886383056640625, 0.6176376342773438, 0.646636962890625, 0.6756362915039062, 0.7046356201171875, 0.7336349487304688, 0.76263427734375, 0.7916336059570312, 0.8206329345703125, 0.8496322631835938, 0.878631591796875, 0.9076309204101562, 0.9366302490234375, 0.9656295776367188, 0.99462890625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 3.0, 11.0, 7.0, 12.0, 21.0, 25.0, 34.0, 36.0, 31.0, 55.0, 50.0, 56.0, 74.0, 69.0, 70.0, 67.0, 58.0, 58.0, 46.0, 46.0, 35.0, 28.0, 21.0, 19.0, 21.0, 9.0, 8.0, 7.0, 6.0, 6.0, 0.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.56103515625, -0.5479621887207031, -0.5348892211914062, -0.5218162536621094, -0.5087432861328125, -0.4956703186035156, -0.48259735107421875, -0.4695243835449219, -0.456451416015625, -0.4433784484863281, -0.43030548095703125, -0.4172325134277344, -0.4041595458984375, -0.3910865783691406, -0.37801361083984375, -0.3649406433105469, -0.35186767578125, -0.3387947082519531, -0.32572174072265625, -0.3126487731933594, -0.2995758056640625, -0.2865028381347656, -0.27342987060546875, -0.2603569030761719, -0.247283935546875, -0.23421096801757812, -0.22113800048828125, -0.20806503295898438, -0.1949920654296875, -0.18191909790039062, -0.16884613037109375, -0.15577316284179688, -0.1427001953125, -0.12962722778320312, -0.11655426025390625, -0.10348129272460938, -0.0904083251953125, -0.07733535766601562, -0.06426239013671875, -0.051189422607421875, -0.038116455078125, -0.025043487548828125, -0.01197052001953125, 0.001102447509765625, 0.0141754150390625, 0.027248382568359375, 0.04032135009765625, 0.053394317626953125, 0.06646728515625, 0.07954025268554688, 0.09261322021484375, 0.10568618774414062, 0.1187591552734375, 0.13183212280273438, 0.14490509033203125, 0.15797805786132812, 0.171051025390625, 0.18412399291992188, 0.19719696044921875, 0.21026992797851562, 0.2233428955078125, 0.23641586303710938, 0.24948883056640625, 0.2625617980957031, 0.275634765625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 4.0, 20.0, 9.0, 30.0, 43.0, 57.0, 94.0, 173.0, 321.0, 564.0, 1390.0, 4474.0, 37987.0, 882308.0, 109981.0, 7568.0, 1861.0, 710.0, 365.0, 182.0, 136.0, 75.0, 56.0, 40.0, 27.0, 13.0, 15.0, 9.0, 11.0, 6.0, 1.0, 5.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.666015625, -2.59124755859375, -2.5164794921875, -2.44171142578125, -2.366943359375, -2.29217529296875, -2.2174072265625, -2.14263916015625, -2.06787109375, -1.99310302734375, -1.9183349609375, -1.84356689453125, -1.768798828125, -1.69403076171875, -1.6192626953125, -1.54449462890625, -1.4697265625, -1.39495849609375, -1.3201904296875, -1.24542236328125, -1.170654296875, -1.09588623046875, -1.0211181640625, -0.94635009765625, -0.87158203125, -0.79681396484375, -0.7220458984375, -0.64727783203125, -0.572509765625, -0.49774169921875, -0.4229736328125, -0.34820556640625, -0.2734375, -0.19866943359375, -0.1239013671875, -0.04913330078125, 0.025634765625, 0.10040283203125, 0.1751708984375, 0.24993896484375, 0.32470703125, 0.39947509765625, 0.4742431640625, 0.54901123046875, 0.623779296875, 0.69854736328125, 0.7733154296875, 0.84808349609375, 0.9228515625, 0.99761962890625, 1.0723876953125, 1.14715576171875, 1.221923828125, 1.29669189453125, 1.3714599609375, 1.44622802734375, 1.52099609375, 1.59576416015625, 1.6705322265625, 1.74530029296875, 1.820068359375, 1.89483642578125, 1.9696044921875, 2.04437255859375, 2.119140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 1.0, 2.0, 7.0, 6.0, 11.0, 8.0, 3.0, 11.0, 13.0, 15.0, 26.0, 29.0, 36.0, 33.0, 47.0, 44.0, 53.0, 44.0, 55.0, 62.0, 42.0, 51.0, 51.0, 40.0, 48.0, 38.0, 39.0, 26.0, 34.0, 21.0, 15.0, 12.0, 12.0, 8.0, 14.0, 4.0, 9.0, 1.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-1.49609375, -1.4463043212890625, -1.396514892578125, -1.3467254638671875, -1.29693603515625, -1.2471466064453125, -1.197357177734375, -1.1475677490234375, -1.0977783203125, -1.0479888916015625, -0.998199462890625, -0.9484100341796875, -0.89862060546875, -0.8488311767578125, -0.799041748046875, -0.7492523193359375, -0.699462890625, -0.6496734619140625, -0.599884033203125, -0.5500946044921875, -0.50030517578125, -0.4505157470703125, -0.400726318359375, -0.3509368896484375, -0.3011474609375, -0.2513580322265625, -0.201568603515625, -0.1517791748046875, -0.10198974609375, -0.0522003173828125, -0.002410888671875, 0.0473785400390625, 0.09716796875, 0.1469573974609375, 0.196746826171875, 0.2465362548828125, 0.29632568359375, 0.3461151123046875, 0.395904541015625, 0.4456939697265625, 0.4954833984375, 0.5452728271484375, 0.595062255859375, 0.6448516845703125, 0.69464111328125, 0.7444305419921875, 0.794219970703125, 0.8440093994140625, 0.893798828125, 0.9435882568359375, 0.993377685546875, 1.0431671142578125, 1.09295654296875, 1.1427459716796875, 1.192535400390625, 1.2423248291015625, 1.2921142578125, 1.3419036865234375, 1.391693115234375, 1.4414825439453125, 1.49127197265625, 1.5410614013671875, 1.590850830078125, 1.6406402587890625, 1.6904296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 11.0, 12.0, 28.0, 33.0, 72.0, 135.0, 288.0, 735.0, 3718.0, 77909.0, 943017.0, 19599.0, 2050.0, 535.0, 204.0, 76.0, 45.0, 29.0, 15.0, 13.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.79296875, -1.748504638671875, -1.70404052734375, -1.659576416015625, -1.6151123046875, -1.570648193359375, -1.52618408203125, -1.481719970703125, -1.437255859375, -1.392791748046875, -1.34832763671875, -1.303863525390625, -1.2593994140625, -1.214935302734375, -1.17047119140625, -1.126007080078125, -1.08154296875, -1.037078857421875, -0.99261474609375, -0.948150634765625, -0.9036865234375, -0.859222412109375, -0.81475830078125, -0.770294189453125, -0.725830078125, -0.681365966796875, -0.63690185546875, -0.592437744140625, -0.5479736328125, -0.503509521484375, -0.45904541015625, -0.414581298828125, -0.3701171875, -0.325653076171875, -0.28118896484375, -0.236724853515625, -0.1922607421875, -0.147796630859375, -0.10333251953125, -0.058868408203125, -0.014404296875, 0.030059814453125, 0.07452392578125, 0.118988037109375, 0.1634521484375, 0.207916259765625, 0.25238037109375, 0.296844482421875, 0.34130859375, 0.385772705078125, 0.43023681640625, 0.474700927734375, 0.5191650390625, 0.563629150390625, 0.60809326171875, 0.652557373046875, 0.697021484375, 0.741485595703125, 0.78594970703125, 0.830413818359375, 0.8748779296875, 0.919342041015625, 0.96380615234375, 1.008270263671875, 1.052734375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 10.0, 12.0, 6.0, 3.0, 12.0, 12.0, 18.0, 21.0, 17.0, 31.0, 34.0, 48.0, 75.0, 72.0, 92.0, 106.0, 80.0, 72.0, 52.0, 44.0, 32.0, 20.0, 17.0, 16.0, 6.0, 10.0, 10.0, 3.0, 10.0, 7.0, 8.0, 7.0, 4.0, 1.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-9.673833847045898e-05, -9.375158697366714e-05, -9.07648354768753e-05, -8.777808398008347e-05, -8.479133248329163e-05, -8.180458098649979e-05, -7.881782948970795e-05, -7.583107799291611e-05, -7.284432649612427e-05, -6.985757499933243e-05, -6.687082350254059e-05, -6.388407200574875e-05, -6.089732050895691e-05, -5.791056901216507e-05, -5.492381751537323e-05, -5.193706601858139e-05, -4.895031452178955e-05, -4.596356302499771e-05, -4.297681152820587e-05, -3.999006003141403e-05, -3.700330853462219e-05, -3.401655703783035e-05, -3.102980554103851e-05, -2.8043054044246674e-05, -2.5056302547454834e-05, -2.2069551050662994e-05, -1.9082799553871155e-05, -1.6096048057079315e-05, -1.3109296560287476e-05, -1.0122545063495636e-05, -7.135793566703796e-06, -4.149042069911957e-06, -1.1622905731201172e-06, 1.8244609236717224e-06, 4.811212420463562e-06, 7.797963917255402e-06, 1.0784715414047241e-05, 1.377146691083908e-05, 1.675821840763092e-05, 1.974496990442276e-05, 2.27317214012146e-05, 2.571847289800644e-05, 2.870522439479828e-05, 3.169197589159012e-05, 3.467872738838196e-05, 3.76654788851738e-05, 4.065223038196564e-05, 4.363898187875748e-05, 4.6625733375549316e-05, 4.9612484872341156e-05, 5.2599236369132996e-05, 5.5585987865924835e-05, 5.8572739362716675e-05, 6.155949085950851e-05, 6.454624235630035e-05, 6.75329938530922e-05, 7.051974534988403e-05, 7.350649684667587e-05, 7.649324834346771e-05, 7.947999984025955e-05, 8.246675133705139e-05, 8.545350283384323e-05, 8.844025433063507e-05, 9.142700582742691e-05, 9.441375732421875e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 7.0, 8.0, 9.0, 13.0, 24.0, 56.0, 82.0, 191.0, 482.0, 1331.0, 7966.0, 669384.0, 360678.0, 6426.0, 1166.0, 353.0, 182.0, 83.0, 52.0, 30.0, 12.0, 7.0, 9.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2685546875, -1.2196807861328125, -1.170806884765625, -1.1219329833984375, -1.07305908203125, -1.0241851806640625, -0.975311279296875, -0.9264373779296875, -0.8775634765625, -0.8286895751953125, -0.779815673828125, -0.7309417724609375, -0.68206787109375, -0.6331939697265625, -0.584320068359375, -0.5354461669921875, -0.486572265625, -0.4376983642578125, -0.388824462890625, -0.3399505615234375, -0.29107666015625, -0.2422027587890625, -0.193328857421875, -0.1444549560546875, -0.0955810546875, -0.0467071533203125, 0.002166748046875, 0.0510406494140625, 0.09991455078125, 0.1487884521484375, 0.197662353515625, 0.2465362548828125, 0.29541015625, 0.3442840576171875, 0.393157958984375, 0.4420318603515625, 0.49090576171875, 0.5397796630859375, 0.588653564453125, 0.6375274658203125, 0.6864013671875, 0.7352752685546875, 0.784149169921875, 0.8330230712890625, 0.88189697265625, 0.9307708740234375, 0.979644775390625, 1.0285186767578125, 1.077392578125, 1.1262664794921875, 1.175140380859375, 1.2240142822265625, 1.27288818359375, 1.3217620849609375, 1.370635986328125, 1.4195098876953125, 1.4683837890625, 1.5172576904296875, 1.566131591796875, 1.6150054931640625, 1.66387939453125, 1.7127532958984375, 1.761627197265625, 1.8105010986328125, 1.859375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 7.0, 13.0, 18.0, 16.0, 27.0, 51.0, 62.0, 106.0, 145.0, 165.0, 142.0, 81.0, 42.0, 36.0, 15.0, 23.0, 14.0, 11.0, 5.0, 4.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.483642578125, -0.4555778503417969, -0.42751312255859375, -0.3994483947753906, -0.3713836669921875, -0.3433189392089844, -0.31525421142578125, -0.2871894836425781, -0.259124755859375, -0.23106002807617188, -0.20299530029296875, -0.17493057250976562, -0.1468658447265625, -0.11880111694335938, -0.09073638916015625, -0.06267166137695312, -0.03460693359375, -0.006542205810546875, 0.02152252197265625, 0.049587249755859375, 0.0776519775390625, 0.10571670532226562, 0.13378143310546875, 0.16184616088867188, 0.189910888671875, 0.21797561645507812, 0.24604034423828125, 0.2741050720214844, 0.3021697998046875, 0.3302345275878906, 0.35829925537109375, 0.3863639831542969, 0.4144287109375, 0.4424934387207031, 0.47055816650390625, 0.4986228942871094, 0.5266876220703125, 0.5547523498535156, 0.5828170776367188, 0.6108818054199219, 0.638946533203125, 0.6670112609863281, 0.6950759887695312, 0.7231407165527344, 0.7512054443359375, 0.7792701721191406, 0.8073348999023438, 0.8353996276855469, 0.86346435546875, 0.8915290832519531, 0.9195938110351562, 0.9476585388183594, 0.9757232666015625, 1.0037879943847656, 1.0318527221679688, 1.0599174499511719, 1.087982177734375, 1.1160469055175781, 1.1441116333007812, 1.1721763610839844, 1.2002410888671875, 1.2283058166503906, 1.2563705444335938, 1.2844352722167969, 1.3125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 14.0, 19.0, 54.0, 122.0, 220.0, 261.0, 172.0, 83.0, 24.0, 15.0, 5.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.999593734741211, -8.596375465393066, -8.193158149719238, -7.789939880371094, -7.386722087860107, -6.983504295349121, -6.580286502838135, -6.177068710327148, -5.773850440979004, -5.370632648468018, -4.967414855957031, -4.564196586608887, -4.1609787940979, -3.757761001586914, -3.3545432090759277, -2.9513251781463623, -2.548107624053955, -2.1448898315429688, -1.7416718006134033, -1.338454008102417, -0.9352360963821411, -0.5320181846618652, -0.1288003921508789, 0.2744176387786865, 0.6776354312896729, 1.0808533430099487, 1.4840712547302246, 1.887289047241211, 2.2905068397521973, 2.6937248706817627, 3.096942663192749, 3.5001606941223145, 3.903378486633301, 4.306596279144287, 4.709814071655273, 5.113032341003418, 5.516250133514404, 5.919467926025391, 6.322685718536377, 6.725903511047363, 7.129121780395508, 7.532339572906494, 7.9355573654174805, 8.338775634765625, 8.741992950439453, 9.145211219787598, 9.548429489135742, 9.95164680480957, 10.354864120483398, 10.758082389831543, 11.161299705505371, 11.564517974853516, 11.967735290527344, 12.370953559875488, 12.774171829223633, 13.177389144897461, 13.580607414245605, 13.98382568359375, 14.387042999267578, 14.790261268615723, 15.19347858428955, 15.596696853637695, 15.999914169311523, 16.403133392333984, 16.806350708007812]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 8.0, 5.0, 7.0, 10.0, 14.0, 18.0, 21.0, 23.0, 28.0, 26.0, 33.0, 48.0, 61.0, 61.0, 48.0, 75.0, 55.0, 46.0, 51.0, 61.0, 51.0, 45.0, 39.0, 22.0, 29.0, 24.0, 18.0, 18.0, 11.0, 12.0, 15.0, 4.0, 5.0, 4.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.69635009765625, -8.46436882019043, -8.23238754272461, -8.000406265258789, -7.768424987792969, -7.536443710327148, -7.304462432861328, -7.072481632232666, -6.840500354766846, -6.608519077301025, -6.376537799835205, -6.144556522369385, -5.9125752449035645, -5.680594444274902, -5.448613166809082, -5.216631889343262, -4.984650611877441, -4.752669334411621, -4.520688056945801, -4.2887067794799805, -4.05672550201416, -3.824744462966919, -3.5927631855010986, -3.3607821464538574, -3.128800392150879, -2.8968191146850586, -2.6648378372192383, -2.432856559753418, -2.2008755207061768, -1.9688942432403564, -1.7369129657745361, -1.5049318075180054, -1.2729506492614746, -1.0409693717956543, -0.8089882135391235, -0.5770069360733032, -0.3450257182121277, -0.11304450035095215, 0.11893677711486816, 0.3509179353713989, 0.5828992128372192, 0.8148804306983948, 1.0468616485595703, 1.2788429260253906, 1.510824203491211, 1.7428053617477417, 1.974786639213562, 2.2067677974700928, 2.438749074935913, 2.6707303524017334, 2.9027116298675537, 3.134692668914795, 3.3666739463806152, 3.5986552238464355, 3.830636501312256, 4.062617778778076, 4.2945990562438965, 4.526580333709717, 4.758561611175537, 4.990542888641357, 5.222524166107178, 5.45450496673584, 5.68648624420166, 5.9184675216674805, 6.150448799133301]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 6.0, 15.0, 5.0, 11.0, 13.0, 12.0, 21.0, 32.0, 33.0, 48.0, 64.0, 84.0, 103.0, 152.0, 270.0, 1464.0, 899557.0, 3289645.0, 1746.0, 318.0, 171.0, 137.0, 93.0, 70.0, 49.0, 46.0, 28.0, 19.0, 17.0, 10.0, 11.0, 6.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.20703125, -4.08343505859375, -3.9598388671875, -3.83624267578125, -3.712646484375, -3.58905029296875, -3.4654541015625, -3.34185791015625, -3.21826171875, -3.09466552734375, -2.9710693359375, -2.84747314453125, -2.723876953125, -2.60028076171875, -2.4766845703125, -2.35308837890625, -2.2294921875, -2.10589599609375, -1.9822998046875, -1.85870361328125, -1.735107421875, -1.61151123046875, -1.4879150390625, -1.36431884765625, -1.24072265625, -1.11712646484375, -0.9935302734375, -0.86993408203125, -0.746337890625, -0.62274169921875, -0.4991455078125, -0.37554931640625, -0.251953125, -0.12835693359375, -0.0047607421875, 0.11883544921875, 0.242431640625, 0.36602783203125, 0.4896240234375, 0.61322021484375, 0.73681640625, 0.86041259765625, 0.9840087890625, 1.10760498046875, 1.231201171875, 1.35479736328125, 1.4783935546875, 1.60198974609375, 1.7255859375, 1.84918212890625, 1.9727783203125, 2.09637451171875, 2.219970703125, 2.34356689453125, 2.4671630859375, 2.59075927734375, 2.71435546875, 2.83795166015625, 2.9615478515625, 3.08514404296875, 3.208740234375, 3.33233642578125, 3.4559326171875, 3.57952880859375, 3.703125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 9.0, 4.0, 12.0, 14.0, 21.0, 28.0, 34.0, 40.0, 45.0, 37.0, 52.0, 67.0, 68.0, 85.0, 58.0, 56.0, 73.0, 53.0, 50.0, 32.0, 35.0, 32.0, 26.0, 18.0, 15.0, 15.0, 8.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0], "bins": [-0.54638671875, -0.5341529846191406, -0.5219192504882812, -0.5096855163574219, -0.4974517822265625, -0.4852180480957031, -0.47298431396484375, -0.4607505798339844, -0.448516845703125, -0.4362831115722656, -0.42404937744140625, -0.4118156433105469, -0.3995819091796875, -0.3873481750488281, -0.37511444091796875, -0.3628807067871094, -0.35064697265625, -0.3384132385253906, -0.32617950439453125, -0.3139457702636719, -0.3017120361328125, -0.2894783020019531, -0.27724456787109375, -0.2650108337402344, -0.252777099609375, -0.24054336547851562, -0.22830963134765625, -0.21607589721679688, -0.2038421630859375, -0.19160842895507812, -0.17937469482421875, -0.16714096069335938, -0.1549072265625, -0.14267349243164062, -0.13043975830078125, -0.11820602416992188, -0.1059722900390625, -0.09373855590820312, -0.08150482177734375, -0.06927108764648438, -0.057037353515625, -0.044803619384765625, -0.03256988525390625, -0.020336151123046875, -0.0081024169921875, 0.004131317138671875, 0.01636505126953125, 0.028598785400390625, 0.04083251953125, 0.053066253662109375, 0.06529998779296875, 0.07753372192382812, 0.0897674560546875, 0.10200119018554688, 0.11423492431640625, 0.12646865844726562, 0.138702392578125, 0.15093612670898438, 0.16316986083984375, 0.17540359497070312, 0.1876373291015625, 0.19987106323242188, 0.21210479736328125, 0.22433853149414062, 0.236572265625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 6.0, 17.0, 21.0, 51.0, 83.0, 100.0, 241.0, 505.0, 1055.0, 2759.0, 7846.0, 28633.0, 158720.0, 2469389.0, 1387056.0, 105769.0, 21235.0, 6467.0, 2452.0, 979.0, 428.0, 229.0, 105.0, 54.0, 32.0, 21.0, 11.0, 8.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58251953125, -0.5623626708984375, -0.542205810546875, -0.5220489501953125, -0.50189208984375, -0.4817352294921875, -0.461578369140625, -0.4414215087890625, -0.4212646484375, -0.4011077880859375, -0.380950927734375, -0.3607940673828125, -0.34063720703125, -0.3204803466796875, -0.300323486328125, -0.2801666259765625, -0.260009765625, -0.2398529052734375, -0.219696044921875, -0.1995391845703125, -0.17938232421875, -0.1592254638671875, -0.139068603515625, -0.1189117431640625, -0.0987548828125, -0.0785980224609375, -0.058441162109375, -0.0382843017578125, -0.01812744140625, 0.0020294189453125, 0.022186279296875, 0.0423431396484375, 0.0625, 0.0826568603515625, 0.102813720703125, 0.1229705810546875, 0.14312744140625, 0.1632843017578125, 0.183441162109375, 0.2035980224609375, 0.2237548828125, 0.2439117431640625, 0.264068603515625, 0.2842254638671875, 0.30438232421875, 0.3245391845703125, 0.344696044921875, 0.3648529052734375, 0.385009765625, 0.4051666259765625, 0.425323486328125, 0.4454803466796875, 0.46563720703125, 0.4857940673828125, 0.505950927734375, 0.5261077880859375, 0.5462646484375, 0.5664215087890625, 0.586578369140625, 0.6067352294921875, 0.62689208984375, 0.6470489501953125, 0.667205810546875, 0.6873626708984375, 0.70751953125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 4.0, 13.0, 11.0, 21.0, 25.0, 54.0, 78.0, 102.0, 189.0, 349.0, 663.0, 960.0, 683.0, 377.0, 187.0, 128.0, 70.0, 50.0, 30.0, 16.0, 15.0, 15.0, 9.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.90673828125, -0.8832168579101562, -0.8596954345703125, -0.8361740112304688, -0.812652587890625, -0.7891311645507812, -0.7656097412109375, -0.7420883178710938, -0.71856689453125, -0.6950454711914062, -0.6715240478515625, -0.6480026245117188, -0.624481201171875, -0.6009597778320312, -0.5774383544921875, -0.5539169311523438, -0.5303955078125, -0.5068740844726562, -0.4833526611328125, -0.45983123779296875, -0.436309814453125, -0.41278839111328125, -0.3892669677734375, -0.36574554443359375, -0.34222412109375, -0.31870269775390625, -0.2951812744140625, -0.27165985107421875, -0.248138427734375, -0.22461700439453125, -0.2010955810546875, -0.17757415771484375, -0.154052734375, -0.13053131103515625, -0.1070098876953125, -0.08348846435546875, -0.059967041015625, -0.03644561767578125, -0.0129241943359375, 0.01059722900390625, 0.03411865234375, 0.05764007568359375, 0.0811614990234375, 0.10468292236328125, 0.128204345703125, 0.15172576904296875, 0.1752471923828125, 0.19876861572265625, 0.2222900390625, 0.24581146240234375, 0.2693328857421875, 0.29285430908203125, 0.316375732421875, 0.33989715576171875, 0.3634185791015625, 0.38694000244140625, 0.41046142578125, 0.43398284912109375, 0.4575042724609375, 0.48102569580078125, 0.504547119140625, 0.5280685424804688, 0.5515899658203125, 0.5751113891601562, 0.5986328125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 12.0, 44.0, 143.0, 346.0, 281.0, 109.0, 29.0, 15.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.231163024902344, -8.857980728149414, -8.4847993850708, -8.111618041992188, -7.738435745239258, -7.365253925323486, -6.992072105407715, -6.618890285491943, -6.245708465576172, -5.8725266456604, -5.499344825744629, -5.126163005828857, -4.752981185913086, -4.3797993659973145, -4.006617546081543, -3.6334357261657715, -3.26025390625, -2.8870720863342285, -2.513890266418457, -2.1407084465026855, -1.767526626586914, -1.3943448066711426, -1.021162986755371, -0.6479811668395996, -0.2747993469238281, 0.09838247299194336, 0.47156429290771484, 0.8447461128234863, 1.2179279327392578, 1.5911097526550293, 1.9642915725708008, 2.3374733924865723, 2.71065616607666, 3.0838379859924316, 3.457019805908203, 3.8302016258239746, 4.203383445739746, 4.576565265655518, 4.949747085571289, 5.3229289054870605, 5.696110725402832, 6.0692925453186035, 6.442474365234375, 6.8156561851501465, 7.188838005065918, 7.5620198249816895, 7.935201644897461, 8.30838394165039, 8.681565284729004, 9.054746627807617, 9.427928924560547, 9.801111221313477, 10.17429256439209, 10.547473907470703, 10.920656204223633, 11.293838500976562, 11.667019844055176, 12.040201187133789, 12.413383483886719, 12.786565780639648, 13.159747123718262, 13.532928466796875, 13.906110763549805, 14.279293060302734, 14.652474403381348]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 1.0, 5.0, 7.0, 11.0, 17.0, 11.0, 14.0, 20.0, 26.0, 22.0, 32.0, 34.0, 42.0, 52.0, 46.0, 46.0, 57.0, 64.0, 69.0, 53.0, 47.0, 43.0, 43.0, 38.0, 35.0, 24.0, 25.0, 20.0, 22.0, 14.0, 15.0, 17.0, 7.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2577648162841797, -3.151721239089966, -3.045677423477173, -2.939633846282959, -2.833590030670166, -2.727546453475952, -2.6215028762817383, -2.5154590606689453, -2.4094154834747314, -2.3033719062805176, -2.1973280906677246, -2.0912845134735107, -1.9852408170700073, -1.879197120666504, -1.7731534242630005, -1.667109727859497, -1.5610660314559937, -1.4550223350524902, -1.3489786386489868, -1.2429349422454834, -1.1368913650512695, -1.0308476686477661, -0.9248039722442627, -0.818760335445404, -0.7127166390419006, -0.6066729426383972, -0.5006293058395386, -0.39458560943603516, -0.2885419428348541, -0.1824982762336731, -0.07645457983016968, 0.029589056968688965, 0.13563275337219238, 0.2416764199733734, 0.34772008657455444, 0.45376378297805786, 0.5598074197769165, 0.6658511161804199, 0.7718948125839233, 0.877938449382782, 0.9839821457862854, 1.090025782585144, 1.1960694789886475, 1.3021131753921509, 1.4081568717956543, 1.5142004489898682, 1.6202442646026611, 1.726287841796875, 1.8323315382003784, 1.9383752346038818, 2.0444188117980957, 2.1504626274108887, 2.2565062046051025, 2.3625497817993164, 2.4685935974121094, 2.5746371746063232, 2.680680990219116, 2.78672456741333, 2.892768383026123, 2.998811960220337, 3.10485577583313, 3.2108993530273438, 3.3169431686401367, 3.4229867458343506, 3.5290303230285645]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 10.0, 14.0, 14.0, 22.0, 29.0, 48.0, 91.0, 124.0, 176.0, 318.0, 539.0, 985.0, 1675.0, 3467.0, 7235.0, 17817.0, 50057.0, 174481.0, 449983.0, 235683.0, 66171.0, 22211.0, 8842.0, 3980.0, 2004.0, 1030.0, 601.0, 338.0, 208.0, 136.0, 90.0, 59.0, 35.0, 25.0, 12.0, 9.0, 9.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68310546875, -0.6614990234375, -0.639892578125, -0.6182861328125, -0.5966796875, -0.5750732421875, -0.553466796875, -0.5318603515625, -0.51025390625, -0.4886474609375, -0.467041015625, -0.4454345703125, -0.423828125, -0.4022216796875, -0.380615234375, -0.3590087890625, -0.33740234375, -0.3157958984375, -0.294189453125, -0.2725830078125, -0.2509765625, -0.2293701171875, -0.207763671875, -0.1861572265625, -0.16455078125, -0.1429443359375, -0.121337890625, -0.0997314453125, -0.078125, -0.0565185546875, -0.034912109375, -0.0133056640625, 0.00830078125, 0.0299072265625, 0.051513671875, 0.0731201171875, 0.0947265625, 0.1163330078125, 0.137939453125, 0.1595458984375, 0.18115234375, 0.2027587890625, 0.224365234375, 0.2459716796875, 0.267578125, 0.2891845703125, 0.310791015625, 0.3323974609375, 0.35400390625, 0.3756103515625, 0.397216796875, 0.4188232421875, 0.4404296875, 0.4620361328125, 0.483642578125, 0.5052490234375, 0.52685546875, 0.5484619140625, 0.570068359375, 0.5916748046875, 0.61328125, 0.6348876953125, 0.656494140625, 0.6781005859375, 0.69970703125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 3.0, 5.0, 8.0, 11.0, 25.0, 25.0, 31.0, 29.0, 46.0, 56.0, 50.0, 77.0, 60.0, 87.0, 66.0, 78.0, 65.0, 54.0, 53.0, 36.0, 43.0, 29.0, 22.0, 13.0, 13.0, 11.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6044921875, -0.590972900390625, -0.57745361328125, -0.563934326171875, -0.5504150390625, -0.536895751953125, -0.52337646484375, -0.509857177734375, -0.496337890625, -0.482818603515625, -0.46929931640625, -0.455780029296875, -0.4422607421875, -0.428741455078125, -0.41522216796875, -0.401702880859375, -0.38818359375, -0.374664306640625, -0.36114501953125, -0.347625732421875, -0.3341064453125, -0.320587158203125, -0.30706787109375, -0.293548583984375, -0.280029296875, -0.266510009765625, -0.25299072265625, -0.239471435546875, -0.2259521484375, -0.212432861328125, -0.19891357421875, -0.185394287109375, -0.171875, -0.158355712890625, -0.14483642578125, -0.131317138671875, -0.1177978515625, -0.104278564453125, -0.09075927734375, -0.077239990234375, -0.063720703125, -0.050201416015625, -0.03668212890625, -0.023162841796875, -0.0096435546875, 0.003875732421875, 0.01739501953125, 0.030914306640625, 0.04443359375, 0.057952880859375, 0.07147216796875, 0.084991455078125, 0.0985107421875, 0.112030029296875, 0.12554931640625, 0.139068603515625, 0.152587890625, 0.166107177734375, 0.17962646484375, 0.193145751953125, 0.2066650390625, 0.220184326171875, 0.23370361328125, 0.247222900390625, 0.2607421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 6.0, 11.0, 13.0, 17.0, 17.0, 24.0, 24.0, 65.0, 97.0, 132.0, 212.0, 317.0, 654.0, 1341.0, 3719.0, 13464.0, 80277.0, 687980.0, 221563.0, 28241.0, 6286.0, 2074.0, 858.0, 450.0, 250.0, 139.0, 102.0, 54.0, 48.0, 34.0, 23.0, 9.0, 14.0, 4.0, 12.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.07421875, -1.0368194580078125, -0.999420166015625, -0.9620208740234375, -0.92462158203125, -0.8872222900390625, -0.849822998046875, -0.8124237060546875, -0.7750244140625, -0.7376251220703125, -0.700225830078125, -0.6628265380859375, -0.62542724609375, -0.5880279541015625, -0.550628662109375, -0.5132293701171875, -0.475830078125, -0.4384307861328125, -0.401031494140625, -0.3636322021484375, -0.32623291015625, -0.2888336181640625, -0.251434326171875, -0.2140350341796875, -0.1766357421875, -0.1392364501953125, -0.101837158203125, -0.0644378662109375, -0.02703857421875, 0.0103607177734375, 0.047760009765625, 0.0851593017578125, 0.12255859375, 0.1599578857421875, 0.197357177734375, 0.2347564697265625, 0.27215576171875, 0.3095550537109375, 0.346954345703125, 0.3843536376953125, 0.4217529296875, 0.4591522216796875, 0.496551513671875, 0.5339508056640625, 0.57135009765625, 0.6087493896484375, 0.646148681640625, 0.6835479736328125, 0.720947265625, 0.7583465576171875, 0.795745849609375, 0.8331451416015625, 0.87054443359375, 0.9079437255859375, 0.945343017578125, 0.9827423095703125, 1.0201416015625, 1.0575408935546875, 1.094940185546875, 1.1323394775390625, 1.16973876953125, 1.2071380615234375, 1.244537353515625, 1.2819366455078125, 1.3193359375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 4.0, 3.0, 8.0, 4.0, 3.0, 8.0, 7.0, 4.0, 6.0, 10.0, 15.0, 18.0, 23.0, 27.0, 38.0, 28.0, 35.0, 54.0, 37.0, 55.0, 44.0, 60.0, 51.0, 49.0, 53.0, 53.0, 53.0, 47.0, 25.0, 36.0, 31.0, 19.0, 26.0, 15.0, 14.0, 16.0, 5.0, 2.0, 6.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.037109375, -0.995513916015625, -0.95391845703125, -0.912322998046875, -0.8707275390625, -0.829132080078125, -0.78753662109375, -0.745941162109375, -0.704345703125, -0.662750244140625, -0.62115478515625, -0.579559326171875, -0.5379638671875, -0.496368408203125, -0.45477294921875, -0.413177490234375, -0.37158203125, -0.329986572265625, -0.28839111328125, -0.246795654296875, -0.2052001953125, -0.163604736328125, -0.12200927734375, -0.080413818359375, -0.038818359375, 0.002777099609375, 0.04437255859375, 0.085968017578125, 0.1275634765625, 0.169158935546875, 0.21075439453125, 0.252349853515625, 0.2939453125, 0.335540771484375, 0.37713623046875, 0.418731689453125, 0.4603271484375, 0.501922607421875, 0.54351806640625, 0.585113525390625, 0.626708984375, 0.668304443359375, 0.70989990234375, 0.751495361328125, 0.7930908203125, 0.834686279296875, 0.87628173828125, 0.917877197265625, 0.95947265625, 1.001068115234375, 1.04266357421875, 1.084259033203125, 1.1258544921875, 1.167449951171875, 1.20904541015625, 1.250640869140625, 1.292236328125, 1.333831787109375, 1.37542724609375, 1.417022705078125, 1.4586181640625, 1.500213623046875, 1.54180908203125, 1.583404541015625, 1.625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 8.0, 12.0, 24.0, 34.0, 37.0, 89.0, 143.0, 352.0, 982.0, 4323.0, 675608.0, 361373.0, 3915.0, 906.0, 354.0, 157.0, 86.0, 43.0, 33.0, 25.0, 12.0, 9.0, 4.0, 6.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.515625, -2.43695068359375, -2.3582763671875, -2.27960205078125, -2.200927734375, -2.12225341796875, -2.0435791015625, -1.96490478515625, -1.88623046875, -1.80755615234375, -1.7288818359375, -1.65020751953125, -1.571533203125, -1.49285888671875, -1.4141845703125, -1.33551025390625, -1.2568359375, -1.17816162109375, -1.0994873046875, -1.02081298828125, -0.942138671875, -0.86346435546875, -0.7847900390625, -0.70611572265625, -0.62744140625, -0.54876708984375, -0.4700927734375, -0.39141845703125, -0.312744140625, -0.23406982421875, -0.1553955078125, -0.07672119140625, 0.001953125, 0.08062744140625, 0.1593017578125, 0.23797607421875, 0.316650390625, 0.39532470703125, 0.4739990234375, 0.55267333984375, 0.63134765625, 0.71002197265625, 0.7886962890625, 0.86737060546875, 0.946044921875, 1.02471923828125, 1.1033935546875, 1.18206787109375, 1.2607421875, 1.33941650390625, 1.4180908203125, 1.49676513671875, 1.575439453125, 1.65411376953125, 1.7327880859375, 1.81146240234375, 1.89013671875, 1.96881103515625, 2.0474853515625, 2.12615966796875, 2.204833984375, 2.28350830078125, 2.3621826171875, 2.44085693359375, 2.51953125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 1.0, 4.0, 4.0, 4.0, 5.0, 4.0, 1.0, 7.0, 5.0, 8.0, 13.0, 14.0, 13.0, 20.0, 23.0, 26.0, 35.0, 52.0, 93.0, 119.0, 140.0, 127.0, 71.0, 60.0, 30.0, 23.0, 17.0, 17.0, 8.0, 7.0, 12.0, 10.0, 8.0, 3.0, 2.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011861324310302734, -0.0001153433695435524, -0.00011207349598407745, -0.00010880362242460251, -0.00010553374886512756, -0.00010226387530565262, -9.899400174617767e-05, -9.572412818670273e-05, -9.245425462722778e-05, -8.918438106775284e-05, -8.591450750827789e-05, -8.264463394880295e-05, -7.9374760389328e-05, -7.610488682985306e-05, -7.283501327037811e-05, -6.956513971090317e-05, -6.629526615142822e-05, -6.302539259195328e-05, -5.975551903247833e-05, -5.648564547300339e-05, -5.321577191352844e-05, -4.99458983540535e-05, -4.667602479457855e-05, -4.340615123510361e-05, -4.013627767562866e-05, -3.686640411615372e-05, -3.359653055667877e-05, -3.0326656997203827e-05, -2.7056783437728882e-05, -2.3786909878253937e-05, -2.0517036318778992e-05, -1.7247162759304047e-05, -1.3977289199829102e-05, -1.0707415640354156e-05, -7.4375420808792114e-06, -4.167668521404266e-06, -8.977949619293213e-07, 2.3720785975456238e-06, 5.641952157020569e-06, 8.911825716495514e-06, 1.2181699275970459e-05, 1.5451572835445404e-05, 1.872144639492035e-05, 2.1991319954395294e-05, 2.526119351387024e-05, 2.8531067073345184e-05, 3.180094063282013e-05, 3.5070814192295074e-05, 3.834068775177002e-05, 4.1610561311244965e-05, 4.488043487071991e-05, 4.8150308430194855e-05, 5.14201819896698e-05, 5.4690055549144745e-05, 5.795992910861969e-05, 6.122980266809464e-05, 6.449967622756958e-05, 6.776954978704453e-05, 7.103942334651947e-05, 7.430929690599442e-05, 7.757917046546936e-05, 8.08490440249443e-05, 8.411891758441925e-05, 8.73887911438942e-05, 9.065866470336914e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 5.0, 9.0, 13.0, 22.0, 18.0, 43.0, 62.0, 101.0, 199.0, 377.0, 872.0, 2059.0, 9093.0, 660692.0, 363582.0, 7864.0, 1948.0, 758.0, 353.0, 186.0, 105.0, 60.0, 29.0, 30.0, 15.0, 12.0, 7.0, 10.0, 6.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.59765625, -1.5506134033203125, -1.503570556640625, -1.4565277099609375, -1.40948486328125, -1.3624420166015625, -1.315399169921875, -1.2683563232421875, -1.2213134765625, -1.1742706298828125, -1.127227783203125, -1.0801849365234375, -1.03314208984375, -0.9860992431640625, -0.939056396484375, -0.8920135498046875, -0.844970703125, -0.7979278564453125, -0.750885009765625, -0.7038421630859375, -0.65679931640625, -0.6097564697265625, -0.562713623046875, -0.5156707763671875, -0.4686279296875, -0.4215850830078125, -0.374542236328125, -0.3274993896484375, -0.28045654296875, -0.2334136962890625, -0.186370849609375, -0.1393280029296875, -0.09228515625, -0.0452423095703125, 0.001800537109375, 0.0488433837890625, 0.09588623046875, 0.1429290771484375, 0.189971923828125, 0.2370147705078125, 0.2840576171875, 0.3311004638671875, 0.378143310546875, 0.4251861572265625, 0.47222900390625, 0.5192718505859375, 0.566314697265625, 0.6133575439453125, 0.660400390625, 0.7074432373046875, 0.754486083984375, 0.8015289306640625, 0.84857177734375, 0.8956146240234375, 0.942657470703125, 0.9897003173828125, 1.0367431640625, 1.0837860107421875, 1.130828857421875, 1.1778717041015625, 1.22491455078125, 1.2719573974609375, 1.319000244140625, 1.3660430908203125, 1.4130859375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 3.0, 1.0, 5.0, 1.0, 6.0, 9.0, 12.0, 20.0, 47.0, 74.0, 103.0, 159.0, 173.0, 148.0, 96.0, 57.0, 29.0, 19.0, 13.0, 7.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.017578125, -0.9878311157226562, -0.9580841064453125, -0.9283370971679688, -0.898590087890625, -0.8688430786132812, -0.8390960693359375, -0.8093490600585938, -0.77960205078125, -0.7498550415039062, -0.7201080322265625, -0.6903610229492188, -0.660614013671875, -0.6308670043945312, -0.6011199951171875, -0.5713729858398438, -0.5416259765625, -0.5118789672851562, -0.4821319580078125, -0.45238494873046875, -0.422637939453125, -0.39289093017578125, -0.3631439208984375, -0.33339691162109375, -0.30364990234375, -0.27390289306640625, -0.2441558837890625, -0.21440887451171875, -0.184661865234375, -0.15491485595703125, -0.1251678466796875, -0.09542083740234375, -0.065673828125, -0.03592681884765625, -0.0061798095703125, 0.02356719970703125, 0.053314208984375, 0.08306121826171875, 0.1128082275390625, 0.14255523681640625, 0.17230224609375, 0.20204925537109375, 0.2317962646484375, 0.26154327392578125, 0.291290283203125, 0.32103729248046875, 0.3507843017578125, 0.38053131103515625, 0.4102783203125, 0.44002532958984375, 0.4697723388671875, 0.49951934814453125, 0.529266357421875, 0.5590133666992188, 0.5887603759765625, 0.6185073852539062, 0.64825439453125, 0.6780014038085938, 0.7077484130859375, 0.7374954223632812, 0.767242431640625, 0.7969894409179688, 0.8267364501953125, 0.8564834594726562, 0.88623046875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 12.0, 13.0, 42.0, 223.0, 439.0, 204.0, 48.0, 10.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.52410125732422, -29.8038387298584, -29.083574295043945, -28.363311767578125, -27.643049240112305, -26.922786712646484, -26.20252227783203, -25.48225975036621, -24.76199722290039, -24.04173469543457, -23.321470260620117, -22.601207733154297, -21.880945205688477, -21.160682678222656, -20.440418243408203, -19.720155715942383, -18.99989128112793, -18.27962875366211, -17.559364318847656, -16.839101791381836, -16.118839263916016, -15.398575782775879, -14.678312301635742, -13.958049774169922, -13.237786293029785, -12.517522811889648, -11.797260284423828, -11.076996803283691, -10.356733322143555, -9.636470794677734, -8.916207313537598, -8.195943832397461, -7.475681304931641, -6.755418300628662, -6.035155296325684, -5.314891815185547, -4.594628810882568, -3.87436580657959, -3.154102325439453, -2.4338393211364746, -1.713576316833496, -0.993313193321228, -0.27305006980895996, 0.44721317291259766, 1.1674761772155762, 1.8877391815185547, 2.6080026626586914, 3.32826566696167, 4.048528671264648, 4.768791675567627, 5.4890546798706055, 6.209318161010742, 6.929581165313721, 7.649844169616699, 8.370107650756836, 9.090370178222656, 9.810633659362793, 10.53089714050293, 11.25115966796875, 11.971423149108887, 12.691686630249023, 13.411949157714844, 14.13221263885498, 14.852476119995117, 15.572738647460938]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 10.0, 14.0, 18.0, 24.0, 28.0, 44.0, 53.0, 63.0, 59.0, 83.0, 90.0, 104.0, 99.0, 59.0, 56.0, 44.0, 36.0, 33.0, 24.0, 22.0, 13.0, 3.0, 9.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.369007110595703, -5.085866928100586, -4.8027262687683105, -4.519586086273193, -4.236445426940918, -3.953305244445801, -3.6701650619506836, -3.3870246410369873, -3.103884220123291, -2.8207437992095947, -2.5376033782958984, -2.2544631958007812, -1.971322774887085, -1.6881823539733887, -1.405042052268982, -1.1219017505645752, -0.8387613296508789, -0.5556209683418274, -0.2724806070327759, 0.010659754276275635, 0.29380011558532715, 0.5769405364990234, 0.8600808382034302, 1.143221139907837, 1.4263615608215332, 1.7095019817352295, 1.9926422834396362, 2.275782585144043, 2.5589230060577393, 2.8420634269714355, 3.1252036094665527, 3.408344030380249, 3.6914844512939453, 3.9746248722076416, 4.257765293121338, 4.540905475616455, 4.8240461349487305, 5.107186317443848, 5.390326499938965, 5.673466682434082, 5.956607341766357, 6.239747524261475, 6.52288818359375, 6.806028366088867, 7.089168548583984, 7.37230920791626, 7.655449390411377, 7.938590049743652, 8.22173023223877, 8.504870414733887, 8.788010597229004, 9.071151733398438, 9.354291915893555, 9.637432098388672, 9.920572280883789, 10.203712463378906, 10.486852645874023, 10.76999282836914, 11.053133010864258, 11.336274147033691, 11.619414329528809, 11.902554512023926, 12.185694694519043, 12.46883487701416, 12.751976013183594]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 7.0, 15.0, 13.0, 12.0, 19.0, 24.0, 38.0, 80.0, 107.0, 262.0, 641.0, 2039.0, 11023.0, 147101.0, 3599539.0, 408195.0, 20104.0, 3304.0, 920.0, 367.0, 174.0, 100.0, 62.0, 35.0, 26.0, 21.0, 14.0, 11.0, 3.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8056640625, -0.7729644775390625, -0.740264892578125, -0.7075653076171875, -0.67486572265625, -0.6421661376953125, -0.609466552734375, -0.5767669677734375, -0.5440673828125, -0.5113677978515625, -0.478668212890625, -0.4459686279296875, -0.41326904296875, -0.3805694580078125, -0.347869873046875, -0.3151702880859375, -0.282470703125, -0.2497711181640625, -0.217071533203125, -0.1843719482421875, -0.15167236328125, -0.1189727783203125, -0.086273193359375, -0.0535736083984375, -0.0208740234375, 0.0118255615234375, 0.044525146484375, 0.0772247314453125, 0.10992431640625, 0.1426239013671875, 0.175323486328125, 0.2080230712890625, 0.24072265625, 0.2734222412109375, 0.306121826171875, 0.3388214111328125, 0.37152099609375, 0.4042205810546875, 0.436920166015625, 0.4696197509765625, 0.5023193359375, 0.5350189208984375, 0.567718505859375, 0.6004180908203125, 0.63311767578125, 0.6658172607421875, 0.698516845703125, 0.7312164306640625, 0.763916015625, 0.7966156005859375, 0.829315185546875, 0.8620147705078125, 0.89471435546875, 0.9274139404296875, 0.960113525390625, 0.9928131103515625, 1.0255126953125, 1.0582122802734375, 1.090911865234375, 1.1236114501953125, 1.15631103515625, 1.1890106201171875, 1.221710205078125, 1.2544097900390625, 1.287109375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 3.0, 6.0, 10.0, 13.0, 19.0, 25.0, 45.0, 48.0, 61.0, 65.0, 93.0, 78.0, 95.0, 92.0, 78.0, 75.0, 56.0, 40.0, 33.0, 23.0, 21.0, 9.0, 4.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.309814453125, -0.2952003479003906, -0.28058624267578125, -0.2659721374511719, -0.2513580322265625, -0.23674392700195312, -0.22212982177734375, -0.20751571655273438, -0.192901611328125, -0.17828750610351562, -0.16367340087890625, -0.14905929565429688, -0.1344451904296875, -0.11983108520507812, -0.10521697998046875, -0.09060287475585938, -0.07598876953125, -0.061374664306640625, -0.04676055908203125, -0.032146453857421875, -0.0175323486328125, -0.002918243408203125, 0.01169586181640625, 0.026309967041015625, 0.040924072265625, 0.055538177490234375, 0.07015228271484375, 0.08476638793945312, 0.0993804931640625, 0.11399459838867188, 0.12860870361328125, 0.14322280883789062, 0.1578369140625, 0.17245101928710938, 0.18706512451171875, 0.20167922973632812, 0.2162933349609375, 0.23090744018554688, 0.24552154541015625, 0.2601356506347656, 0.274749755859375, 0.2893638610839844, 0.30397796630859375, 0.3185920715332031, 0.3332061767578125, 0.3478202819824219, 0.36243438720703125, 0.3770484924316406, 0.39166259765625, 0.4062767028808594, 0.42089080810546875, 0.4355049133300781, 0.4501190185546875, 0.4647331237792969, 0.47934722900390625, 0.4939613342285156, 0.508575439453125, 0.5231895446777344, 0.5378036499023438, 0.5524177551269531, 0.5670318603515625, 0.5816459655761719, 0.5962600708007812, 0.6108741760253906, 0.62548828125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 10.0, 21.0, 27.0, 44.0, 61.0, 74.0, 164.0, 252.0, 513.0, 1252.0, 4329.0, 27729.0, 492662.0, 3497188.0, 155050.0, 11823.0, 2050.0, 551.0, 218.0, 118.0, 71.0, 28.0, 22.0, 10.0, 13.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.375, -1.3432769775390625, -1.311553955078125, -1.2798309326171875, -1.24810791015625, -1.2163848876953125, -1.184661865234375, -1.1529388427734375, -1.1212158203125, -1.0894927978515625, -1.057769775390625, -1.0260467529296875, -0.99432373046875, -0.9626007080078125, -0.930877685546875, -0.8991546630859375, -0.867431640625, -0.8357086181640625, -0.803985595703125, -0.7722625732421875, -0.74053955078125, -0.7088165283203125, -0.677093505859375, -0.6453704833984375, -0.6136474609375, -0.5819244384765625, -0.550201416015625, -0.5184783935546875, -0.48675537109375, -0.4550323486328125, -0.423309326171875, -0.3915863037109375, -0.35986328125, -0.3281402587890625, -0.296417236328125, -0.2646942138671875, -0.23297119140625, -0.2012481689453125, -0.169525146484375, -0.1378021240234375, -0.1060791015625, -0.0743560791015625, -0.042633056640625, -0.0109100341796875, 0.02081298828125, 0.0525360107421875, 0.084259033203125, 0.1159820556640625, 0.147705078125, 0.1794281005859375, 0.211151123046875, 0.2428741455078125, 0.27459716796875, 0.3063201904296875, 0.338043212890625, 0.3697662353515625, 0.4014892578125, 0.4332122802734375, 0.464935302734375, 0.4966583251953125, 0.52838134765625, 0.5601043701171875, 0.591827392578125, 0.6235504150390625, 0.6552734375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 11.0, 10.0, 20.0, 24.0, 33.0, 59.0, 107.0, 154.0, 238.0, 440.0, 789.0, 857.0, 560.0, 336.0, 165.0, 105.0, 66.0, 37.0, 29.0, 8.0, 7.0, 10.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.4951171875, -1.4635009765625, -1.431884765625, -1.4002685546875, -1.36865234375, -1.3370361328125, -1.305419921875, -1.2738037109375, -1.2421875, -1.2105712890625, -1.178955078125, -1.1473388671875, -1.11572265625, -1.0841064453125, -1.052490234375, -1.0208740234375, -0.9892578125, -0.9576416015625, -0.926025390625, -0.8944091796875, -0.86279296875, -0.8311767578125, -0.799560546875, -0.7679443359375, -0.736328125, -0.7047119140625, -0.673095703125, -0.6414794921875, -0.60986328125, -0.5782470703125, -0.546630859375, -0.5150146484375, -0.4833984375, -0.4517822265625, -0.420166015625, -0.3885498046875, -0.35693359375, -0.3253173828125, -0.293701171875, -0.2620849609375, -0.23046875, -0.1988525390625, -0.167236328125, -0.1356201171875, -0.10400390625, -0.0723876953125, -0.040771484375, -0.0091552734375, 0.0224609375, 0.0540771484375, 0.085693359375, 0.1173095703125, 0.14892578125, 0.1805419921875, 0.212158203125, 0.2437744140625, 0.275390625, 0.3070068359375, 0.338623046875, 0.3702392578125, 0.40185546875, 0.4334716796875, 0.465087890625, 0.4967041015625, 0.5283203125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 5.0, 9.0, 8.0, 10.0, 34.0, 48.0, 107.0, 182.0, 211.0, 188.0, 95.0, 49.0, 15.0, 16.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.270851135253906, -7.964827537536621, -7.658803939819336, -7.352780342102051, -7.046756744384766, -6.7407331466674805, -6.4347100257873535, -6.128686428070068, -5.822662830352783, -5.516639232635498, -5.210615634918213, -4.904592037200928, -4.598568916320801, -4.292545318603516, -3.9865217208862305, -3.6804981231689453, -3.37447452545166, -3.068450927734375, -2.76242733001709, -2.456403970718384, -2.1503803730010986, -1.8443567752838135, -1.5383332967758179, -1.2323098182678223, -0.9262862205505371, -0.6202626824378967, -0.31423914432525635, -0.008215606212615967, 0.2978079319000244, 0.6038315296173096, 0.9098550081253052, 1.2158784866333008, 1.5219030380249023, 1.8279266357421875, 2.1339502334594727, 2.4399735927581787, 2.745997190475464, 3.052020788192749, 3.358044147491455, 3.6640677452087402, 3.9700913429260254, 4.2761149406433105, 4.582138538360596, 4.888162136077881, 5.194185256958008, 5.500208854675293, 5.806232452392578, 6.112256050109863, 6.418279647827148, 6.724303245544434, 7.030326843261719, 7.336350440979004, 7.642374038696289, 7.948397636413574, 8.25442123413086, 8.560443878173828, 8.86646842956543, 9.172492027282715, 9.478515625, 9.784539222717285, 10.09056282043457, 10.396586418151855, 10.70261001586914, 11.00863265991211, 11.314656257629395]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 7.0, 4.0, 13.0, 5.0, 13.0, 20.0, 21.0, 20.0, 29.0, 37.0, 44.0, 49.0, 48.0, 60.0, 51.0, 49.0, 57.0, 69.0, 62.0, 59.0, 52.0, 54.0, 42.0, 23.0, 23.0, 22.0, 21.0, 18.0, 9.0, 4.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3762922286987305, -6.173606872558594, -5.970921039581299, -5.768235683441162, -5.565550327301025, -5.3628644943237305, -5.160179138183594, -4.957493782043457, -4.75480842590332, -4.552123069763184, -4.349437236785889, -4.146751880645752, -3.9440665245056152, -3.7413809299468994, -3.5386953353881836, -3.336009979248047, -3.133324146270752, -2.930638551712036, -2.7279531955718994, -2.5252676010131836, -2.322582244873047, -2.119896650314331, -1.9172110557556152, -1.714525580406189, -1.5118401050567627, -1.3091546297073364, -1.1064691543579102, -0.9037835597991943, -0.7010980844497681, -0.4984126091003418, -0.295727014541626, -0.09304153919219971, 0.10964393615722656, 0.3123294413089752, 0.5150149464607239, 0.7177004814147949, 0.9203859567642212, 1.1230714321136475, 1.3257570266723633, 1.5284425020217896, 1.7311279773712158, 1.933813452720642, 2.1364989280700684, 2.339184522628784, 2.5418701171875, 2.7445554733276367, 2.9472410678863525, 3.1499266624450684, 3.352612018585205, 3.555297613143921, 3.7579829692840576, 3.9606685638427734, 4.16335391998291, 4.366039276123047, 4.568725109100342, 4.7714104652404785, 4.974096298217773, 5.17678165435791, 5.379467487335205, 5.582152843475342, 5.7848381996154785, 5.987524032592773, 6.19020938873291, 6.392894744873047, 6.595580101013184]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 10.0, 12.0, 9.0, 39.0, 58.0, 105.0, 237.0, 510.0, 1350.0, 4362.0, 17132.0, 89414.0, 464819.0, 381403.0, 69617.0, 13862.0, 3530.0, 1144.0, 481.0, 202.0, 108.0, 70.0, 29.0, 15.0, 9.0, 15.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70556640625, -0.6701583862304688, -0.6347503662109375, -0.5993423461914062, -0.563934326171875, -0.5285263061523438, -0.4931182861328125, -0.45771026611328125, -0.42230224609375, -0.38689422607421875, -0.3514862060546875, -0.31607818603515625, -0.280670166015625, -0.24526214599609375, -0.2098541259765625, -0.17444610595703125, -0.1390380859375, -0.10363006591796875, -0.0682220458984375, -0.03281402587890625, 0.002593994140625, 0.03800201416015625, 0.0734100341796875, 0.10881805419921875, 0.14422607421875, 0.17963409423828125, 0.2150421142578125, 0.25045013427734375, 0.285858154296875, 0.32126617431640625, 0.3566741943359375, 0.39208221435546875, 0.427490234375, 0.46289825439453125, 0.4983062744140625, 0.5337142944335938, 0.569122314453125, 0.6045303344726562, 0.6399383544921875, 0.6753463745117188, 0.71075439453125, 0.7461624145507812, 0.7815704345703125, 0.8169784545898438, 0.852386474609375, 0.8877944946289062, 0.9232025146484375, 0.9586105346679688, 0.9940185546875, 1.0294265747070312, 1.0648345947265625, 1.1002426147460938, 1.135650634765625, 1.1710586547851562, 1.2064666748046875, 1.2418746948242188, 1.27728271484375, 1.3126907348632812, 1.3480987548828125, 1.3835067749023438, 1.418914794921875, 1.4543228149414062, 1.4897308349609375, 1.5251388549804688, 1.560546875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 7.0, 6.0, 11.0, 11.0, 11.0, 22.0, 25.0, 23.0, 19.0, 42.0, 29.0, 45.0, 41.0, 37.0, 42.0, 47.0, 45.0, 64.0, 46.0, 52.0, 51.0, 46.0, 40.0, 36.0, 41.0, 29.0, 19.0, 18.0, 22.0, 16.0, 6.0, 11.0, 8.0, 4.0, 6.0, 2.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3330078125, -0.3242053985595703, -0.3154029846191406, -0.30660057067871094, -0.29779815673828125, -0.28899574279785156, -0.2801933288574219, -0.2713909149169922, -0.2625885009765625, -0.2537860870361328, -0.24498367309570312, -0.23618125915527344, -0.22737884521484375, -0.21857643127441406, -0.20977401733398438, -0.2009716033935547, -0.192169189453125, -0.1833667755126953, -0.17456436157226562, -0.16576194763183594, -0.15695953369140625, -0.14815711975097656, -0.13935470581054688, -0.1305522918701172, -0.1217498779296875, -0.11294746398925781, -0.10414505004882812, -0.09534263610839844, -0.08654022216796875, -0.07773780822753906, -0.06893539428710938, -0.06013298034667969, -0.05133056640625, -0.04252815246582031, -0.033725738525390625, -0.024923324584960938, -0.01612091064453125, -0.0073184967041015625, 0.001483917236328125, 0.010286331176757812, 0.0190887451171875, 0.027891159057617188, 0.036693572998046875, 0.04549598693847656, 0.05429840087890625, 0.06310081481933594, 0.07190322875976562, 0.08070564270019531, 0.089508056640625, 0.09831047058105469, 0.10711288452148438, 0.11591529846191406, 0.12471771240234375, 0.13352012634277344, 0.14232254028320312, 0.1511249542236328, 0.1599273681640625, 0.1687297821044922, 0.17753219604492188, 0.18633460998535156, 0.19513702392578125, 0.20393943786621094, 0.21274185180664062, 0.2215442657470703, 0.2303466796875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 5.0, 8.0, 7.0, 18.0, 17.0, 30.0, 56.0, 57.0, 94.0, 156.0, 261.0, 472.0, 889.0, 2066.0, 6603.0, 51060.0, 837141.0, 133541.0, 10775.0, 2746.0, 1126.0, 605.0, 278.0, 198.0, 116.0, 66.0, 48.0, 35.0, 27.0, 21.0, 6.0, 8.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0234375, -1.9614715576171875, -1.899505615234375, -1.8375396728515625, -1.77557373046875, -1.7136077880859375, -1.651641845703125, -1.5896759033203125, -1.5277099609375, -1.4657440185546875, -1.403778076171875, -1.3418121337890625, -1.27984619140625, -1.2178802490234375, -1.155914306640625, -1.0939483642578125, -1.031982421875, -0.9700164794921875, -0.908050537109375, -0.8460845947265625, -0.78411865234375, -0.7221527099609375, -0.660186767578125, -0.5982208251953125, -0.5362548828125, -0.4742889404296875, -0.412322998046875, -0.3503570556640625, -0.28839111328125, -0.2264251708984375, -0.164459228515625, -0.1024932861328125, -0.04052734375, 0.0214385986328125, 0.083404541015625, 0.1453704833984375, 0.20733642578125, 0.2693023681640625, 0.331268310546875, 0.3932342529296875, 0.4552001953125, 0.5171661376953125, 0.579132080078125, 0.6410980224609375, 0.70306396484375, 0.7650299072265625, 0.826995849609375, 0.8889617919921875, 0.950927734375, 1.0128936767578125, 1.074859619140625, 1.1368255615234375, 1.19879150390625, 1.2607574462890625, 1.322723388671875, 1.3846893310546875, 1.4466552734375, 1.5086212158203125, 1.570587158203125, 1.6325531005859375, 1.69451904296875, 1.7564849853515625, 1.818450927734375, 1.8804168701171875, 1.9423828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 8.0, 12.0, 7.0, 16.0, 22.0, 21.0, 20.0, 22.0, 36.0, 40.0, 41.0, 50.0, 52.0, 39.0, 45.0, 63.0, 51.0, 54.0, 54.0, 48.0, 44.0, 44.0, 46.0, 28.0, 30.0, 21.0, 20.0, 10.0, 8.0, 11.0, 8.0, 3.0, 5.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6904296875, -1.640380859375, -1.59033203125, -1.540283203125, -1.490234375, -1.440185546875, -1.39013671875, -1.340087890625, -1.2900390625, -1.239990234375, -1.18994140625, -1.139892578125, -1.08984375, -1.039794921875, -0.98974609375, -0.939697265625, -0.8896484375, -0.839599609375, -0.78955078125, -0.739501953125, -0.689453125, -0.639404296875, -0.58935546875, -0.539306640625, -0.4892578125, -0.439208984375, -0.38916015625, -0.339111328125, -0.2890625, -0.239013671875, -0.18896484375, -0.138916015625, -0.0888671875, -0.038818359375, 0.01123046875, 0.061279296875, 0.111328125, 0.161376953125, 0.21142578125, 0.261474609375, 0.3115234375, 0.361572265625, 0.41162109375, 0.461669921875, 0.51171875, 0.561767578125, 0.61181640625, 0.661865234375, 0.7119140625, 0.761962890625, 0.81201171875, 0.862060546875, 0.912109375, 0.962158203125, 1.01220703125, 1.062255859375, 1.1123046875, 1.162353515625, 1.21240234375, 1.262451171875, 1.3125, 1.362548828125, 1.41259765625, 1.462646484375, 1.5126953125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 6.0, 5.0, 5.0, 5.0, 8.0, 14.0, 32.0, 31.0, 62.0, 86.0, 164.0, 298.0, 847.0, 2742.0, 14499.0, 233415.0, 761224.0, 28790.0, 4145.0, 1165.0, 484.0, 230.0, 109.0, 68.0, 33.0, 34.0, 9.0, 8.0, 8.0, 8.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.97119140625, -0.9443283081054688, -0.9174652099609375, -0.8906021118164062, -0.863739013671875, -0.8368759155273438, -0.8100128173828125, -0.7831497192382812, -0.75628662109375, -0.7294235229492188, -0.7025604248046875, -0.6756973266601562, -0.648834228515625, -0.6219711303710938, -0.5951080322265625, -0.5682449340820312, -0.5413818359375, -0.5145187377929688, -0.4876556396484375, -0.46079254150390625, -0.433929443359375, -0.40706634521484375, -0.3802032470703125, -0.35334014892578125, -0.32647705078125, -0.29961395263671875, -0.2727508544921875, -0.24588775634765625, -0.219024658203125, -0.19216156005859375, -0.1652984619140625, -0.13843536376953125, -0.111572265625, -0.08470916748046875, -0.0578460693359375, -0.03098297119140625, -0.004119873046875, 0.02274322509765625, 0.0496063232421875, 0.07646942138671875, 0.10333251953125, 0.13019561767578125, 0.1570587158203125, 0.18392181396484375, 0.210784912109375, 0.23764801025390625, 0.2645111083984375, 0.29137420654296875, 0.3182373046875, 0.34510040283203125, 0.3719635009765625, 0.39882659912109375, 0.425689697265625, 0.45255279541015625, 0.4794158935546875, 0.5062789916992188, 0.53314208984375, 0.5600051879882812, 0.5868682861328125, 0.6137313842773438, 0.640594482421875, 0.6674575805664062, 0.6943206787109375, 0.7211837768554688, 0.748046875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 0.0, 3.0, 4.0, 12.0, 13.0, 7.0, 10.0, 9.0, 31.0, 31.0, 26.0, 29.0, 44.0, 58.0, 75.0, 148.0, 142.0, 87.0, 60.0, 48.0, 41.0, 28.0, 23.0, 21.0, 14.0, 9.0, 11.0, 9.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001354217529296875, -0.0001307651400566101, -0.00012610852718353271, -0.00012145191431045532, -0.00011679530143737793, -0.00011213868856430054, -0.00010748207569122314, -0.00010282546281814575, -9.816884994506836e-05, -9.351223707199097e-05, -8.885562419891357e-05, -8.419901132583618e-05, -7.954239845275879e-05, -7.48857855796814e-05, -7.0229172706604e-05, -6.557255983352661e-05, -6.091594696044922e-05, -5.6259334087371826e-05, -5.1602721214294434e-05, -4.694610834121704e-05, -4.228949546813965e-05, -3.7632882595062256e-05, -3.297626972198486e-05, -2.831965684890747e-05, -2.3663043975830078e-05, -1.9006431102752686e-05, -1.4349818229675293e-05, -9.6932053565979e-06, -5.036592483520508e-06, -3.7997961044311523e-07, 4.276633262634277e-06, 8.93324613571167e-06, 1.3589859008789062e-05, 1.8246471881866455e-05, 2.2903084754943848e-05, 2.755969762802124e-05, 3.221631050109863e-05, 3.6872923374176025e-05, 4.152953624725342e-05, 4.618614912033081e-05, 5.08427619934082e-05, 5.5499374866485596e-05, 6.015598773956299e-05, 6.481260061264038e-05, 6.946921348571777e-05, 7.412582635879517e-05, 7.878243923187256e-05, 8.343905210494995e-05, 8.809566497802734e-05, 9.275227785110474e-05, 9.740889072418213e-05, 0.00010206550359725952, 0.00010672211647033691, 0.0001113787293434143, 0.0001160353422164917, 0.00012069195508956909, 0.00012534856796264648, 0.00013000518083572388, 0.00013466179370880127, 0.00013931840658187866, 0.00014397501945495605, 0.00014863163232803345, 0.00015328824520111084, 0.00015794485807418823, 0.00016260147094726562]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 7.0, 5.0, 10.0, 10.0, 20.0, 23.0, 33.0, 43.0, 35.0, 58.0, 107.0, 165.0, 238.0, 441.0, 847.0, 1721.0, 4450.0, 14745.0, 85763.0, 811543.0, 103182.0, 16225.0, 4827.0, 1839.0, 893.0, 460.0, 278.0, 178.0, 110.0, 76.0, 63.0, 39.0, 31.0, 18.0, 9.0, 14.0, 11.0, 10.0, 9.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.65478515625, -0.6358261108398438, -0.6168670654296875, -0.5979080200195312, -0.578948974609375, -0.5599899291992188, -0.5410308837890625, -0.5220718383789062, -0.50311279296875, -0.48415374755859375, -0.4651947021484375, -0.44623565673828125, -0.427276611328125, -0.40831756591796875, -0.3893585205078125, -0.37039947509765625, -0.3514404296875, -0.33248138427734375, -0.3135223388671875, -0.29456329345703125, -0.275604248046875, -0.25664520263671875, -0.2376861572265625, -0.21872711181640625, -0.19976806640625, -0.18080902099609375, -0.1618499755859375, -0.14289093017578125, -0.123931884765625, -0.10497283935546875, -0.0860137939453125, -0.06705474853515625, -0.048095703125, -0.02913665771484375, -0.0101776123046875, 0.00878143310546875, 0.027740478515625, 0.04669952392578125, 0.0656585693359375, 0.08461761474609375, 0.10357666015625, 0.12253570556640625, 0.1414947509765625, 0.16045379638671875, 0.179412841796875, 0.19837188720703125, 0.2173309326171875, 0.23628997802734375, 0.2552490234375, 0.27420806884765625, 0.2931671142578125, 0.31212615966796875, 0.331085205078125, 0.35004425048828125, 0.3690032958984375, 0.38796234130859375, 0.40692138671875, 0.42588043212890625, 0.4448394775390625, 0.46379852294921875, 0.482757568359375, 0.5017166137695312, 0.5206756591796875, 0.5396347045898438, 0.55859375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 7.0, 4.0, 3.0, 5.0, 7.0, 11.0, 13.0, 25.0, 32.0, 40.0, 61.0, 80.0, 93.0, 138.0, 113.0, 73.0, 69.0, 52.0, 40.0, 39.0, 24.0, 17.0, 10.0, 13.0, 6.0, 1.0, 7.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51806640625, -0.49810791015625, -0.4781494140625, -0.45819091796875, -0.438232421875, -0.41827392578125, -0.3983154296875, -0.37835693359375, -0.3583984375, -0.33843994140625, -0.3184814453125, -0.29852294921875, -0.278564453125, -0.25860595703125, -0.2386474609375, -0.21868896484375, -0.19873046875, -0.17877197265625, -0.1588134765625, -0.13885498046875, -0.118896484375, -0.09893798828125, -0.0789794921875, -0.05902099609375, -0.0390625, -0.01910400390625, 0.0008544921875, 0.02081298828125, 0.040771484375, 0.06072998046875, 0.0806884765625, 0.10064697265625, 0.12060546875, 0.14056396484375, 0.1605224609375, 0.18048095703125, 0.200439453125, 0.22039794921875, 0.2403564453125, 0.26031494140625, 0.2802734375, 0.30023193359375, 0.3201904296875, 0.34014892578125, 0.360107421875, 0.38006591796875, 0.4000244140625, 0.41998291015625, 0.43994140625, 0.45989990234375, 0.4798583984375, 0.49981689453125, 0.519775390625, 0.53973388671875, 0.5596923828125, 0.57965087890625, 0.599609375, 0.61956787109375, 0.6395263671875, 0.65948486328125, 0.679443359375, 0.69940185546875, 0.7193603515625, 0.73931884765625, 0.75927734375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 7.0, 14.0, 15.0, 35.0, 73.0, 126.0, 197.0, 203.0, 145.0, 83.0, 40.0, 19.0, 9.0, 8.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-10.508768081665039, -10.209827423095703, -9.910886764526367, -9.611946105957031, -9.313005447387695, -9.01406478881836, -8.715124130249023, -8.416183471679688, -8.117242813110352, -7.818302154541016, -7.51936149597168, -7.220420837402344, -6.921480178833008, -6.622539520263672, -6.323598384857178, -6.024657726287842, -5.725716590881348, -5.426775932312012, -5.127835273742676, -4.82889461517334, -4.529953956604004, -4.231013298034668, -3.932072162628174, -3.633131504058838, -3.334190845489502, -3.035250186920166, -2.73630952835083, -2.437368631362915, -2.138427972793579, -1.8394873142242432, -1.5405465364456177, -1.2416057586669922, -0.9426660537719727, -0.6437253355979919, -0.34478461742401123, -0.04584389925003052, 0.2530968189239502, 0.5520374774932861, 0.8509782552719116, 1.149919033050537, 1.448859691619873, 1.747800350189209, 2.046741008758545, 2.34568190574646, 2.644622564315796, 2.943563222885132, 3.242504119873047, 3.541444778442383, 3.8403854370117188, 4.139326095581055, 4.438266754150391, 4.737207412719727, 5.0361480712890625, 5.335088729858398, 5.634029865264893, 5.9329705238342285, 6.2319111824035645, 6.5308518409729, 6.829792499542236, 7.128733158111572, 7.427674293518066, 7.726614952087402, 8.025555610656738, 8.324496269226074, 8.62343692779541]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 13.0, 8.0, 5.0, 21.0, 11.0, 9.0, 8.0, 27.0, 18.0, 23.0, 24.0, 20.0, 31.0, 38.0, 36.0, 44.0, 49.0, 66.0, 43.0, 57.0, 51.0, 48.0, 38.0, 31.0, 31.0, 34.0, 24.0, 29.0, 20.0, 17.0, 12.0, 26.0, 18.0, 15.0, 8.0, 10.0, 5.0, 5.0, 5.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0], "bins": [-6.334390640258789, -6.159178256988525, -5.983965873718262, -5.808753967285156, -5.633541584014893, -5.458329200744629, -5.283117294311523, -5.10790491104126, -4.932692527770996, -4.757480144500732, -4.582267761230469, -4.407055854797363, -4.2318434715271, -4.056631088256836, -3.8814189434051514, -3.706206798553467, -3.530994415283203, -3.3557820320129395, -3.180569887161255, -3.0053577423095703, -2.8301453590393066, -2.654932975769043, -2.4797208309173584, -2.304508686065674, -2.12929630279541, -1.954084038734436, -1.778871774673462, -1.6036595106124878, -1.4284472465515137, -1.2532349824905396, -1.0780227184295654, -0.9028104543685913, -0.7275986671447754, -0.5523864030838013, -0.37717413902282715, -0.20196187496185303, -0.026749610900878906, 0.14846265316009521, 0.32367491722106934, 0.49888718128204346, 0.6740994453430176, 0.8493117094039917, 1.0245239734649658, 1.19973623752594, 1.374948501586914, 1.5501607656478882, 1.7253730297088623, 1.9005852937698364, 2.0757975578308105, 2.251009941101074, 2.426222085952759, 2.6014342308044434, 2.776646614074707, 2.9518589973449707, 3.1270711421966553, 3.30228328704834, 3.4774956703186035, 3.652708053588867, 3.8279201984405518, 4.003132343292236, 4.1783447265625, 4.353557109832764, 4.528769493103027, 4.703981399536133, 4.8791937828063965]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 7.0, 11.0, 12.0, 16.0, 32.0, 45.0, 52.0, 74.0, 148.0, 287.0, 506.0, 1036.0, 2584.0, 8136.0, 37478.0, 417761.0, 3380144.0, 302943.0, 31592.0, 7212.0, 2264.0, 934.0, 469.0, 213.0, 112.0, 83.0, 49.0, 27.0, 20.0, 7.0, 10.0, 2.0, 7.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.75244140625, -0.7317962646484375, -0.711151123046875, -0.6905059814453125, -0.66986083984375, -0.6492156982421875, -0.628570556640625, -0.6079254150390625, -0.5872802734375, -0.5666351318359375, -0.545989990234375, -0.5253448486328125, -0.50469970703125, -0.4840545654296875, -0.463409423828125, -0.4427642822265625, -0.422119140625, -0.4014739990234375, -0.380828857421875, -0.3601837158203125, -0.33953857421875, -0.3188934326171875, -0.298248291015625, -0.2776031494140625, -0.2569580078125, -0.2363128662109375, -0.215667724609375, -0.1950225830078125, -0.17437744140625, -0.1537322998046875, -0.133087158203125, -0.1124420166015625, -0.091796875, -0.0711517333984375, -0.050506591796875, -0.0298614501953125, -0.00921630859375, 0.0114288330078125, 0.032073974609375, 0.0527191162109375, 0.0733642578125, 0.0940093994140625, 0.114654541015625, 0.1352996826171875, 0.15594482421875, 0.1765899658203125, 0.197235107421875, 0.2178802490234375, 0.238525390625, 0.2591705322265625, 0.279815673828125, 0.3004608154296875, 0.32110595703125, 0.3417510986328125, 0.362396240234375, 0.3830413818359375, 0.4036865234375, 0.4243316650390625, 0.444976806640625, 0.4656219482421875, 0.48626708984375, 0.5069122314453125, 0.527557373046875, 0.5482025146484375, 0.56884765625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 8.0, 6.0, 6.0, 11.0, 11.0, 14.0, 16.0, 17.0, 26.0, 43.0, 35.0, 36.0, 52.0, 58.0, 38.0, 56.0, 67.0, 49.0, 57.0, 60.0, 46.0, 46.0, 49.0, 41.0, 33.0, 32.0, 23.0, 14.0, 13.0, 14.0, 7.0, 7.0, 5.0, 3.0, 8.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.404296875, -0.39418983459472656, -0.3840827941894531, -0.3739757537841797, -0.36386871337890625, -0.3537616729736328, -0.3436546325683594, -0.33354759216308594, -0.3234405517578125, -0.31333351135253906, -0.3032264709472656, -0.2931194305419922, -0.28301239013671875, -0.2729053497314453, -0.2627983093261719, -0.25269126892089844, -0.242584228515625, -0.23247718811035156, -0.22237014770507812, -0.2122631072998047, -0.20215606689453125, -0.1920490264892578, -0.18194198608398438, -0.17183494567871094, -0.1617279052734375, -0.15162086486816406, -0.14151382446289062, -0.1314067840576172, -0.12129974365234375, -0.11119270324707031, -0.10108566284179688, -0.09097862243652344, -0.08087158203125, -0.07076454162597656, -0.060657501220703125, -0.05055046081542969, -0.04044342041015625, -0.030336380004882812, -0.020229339599609375, -0.010122299194335938, -1.52587890625e-05, 0.010091781616210938, 0.020198822021484375, 0.030305862426757812, 0.04041290283203125, 0.05051994323730469, 0.060626983642578125, 0.07073402404785156, 0.080841064453125, 0.09094810485839844, 0.10105514526367188, 0.11116218566894531, 0.12126922607421875, 0.1313762664794922, 0.14148330688476562, 0.15159034729003906, 0.1616973876953125, 0.17180442810058594, 0.18191146850585938, 0.1920185089111328, 0.20212554931640625, 0.2122325897216797, 0.22233963012695312, 0.23244667053222656, 0.2425537109375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 11.0, 24.0, 37.0, 33.0, 75.0, 95.0, 111.0, 180.0, 209.0, 328.0, 1026.0, 10824.0, 4038097.0, 140462.0, 2040.0, 349.0, 151.0, 75.0, 53.0, 55.0, 24.0, 11.0, 8.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.3125, -3.2331390380859375, -3.153778076171875, -3.0744171142578125, -2.99505615234375, -2.9156951904296875, -2.836334228515625, -2.7569732666015625, -2.6776123046875, -2.5982513427734375, -2.518890380859375, -2.4395294189453125, -2.36016845703125, -2.2808074951171875, -2.201446533203125, -2.1220855712890625, -2.042724609375, -1.9633636474609375, -1.884002685546875, -1.8046417236328125, -1.72528076171875, -1.6459197998046875, -1.566558837890625, -1.4871978759765625, -1.4078369140625, -1.3284759521484375, -1.249114990234375, -1.1697540283203125, -1.09039306640625, -1.0110321044921875, -0.931671142578125, -0.8523101806640625, -0.77294921875, -0.6935882568359375, -0.614227294921875, -0.5348663330078125, -0.45550537109375, -0.3761444091796875, -0.296783447265625, -0.2174224853515625, -0.1380615234375, -0.0587005615234375, 0.020660400390625, 0.1000213623046875, 0.17938232421875, 0.2587432861328125, 0.338104248046875, 0.4174652099609375, 0.496826171875, 0.5761871337890625, 0.655548095703125, 0.7349090576171875, 0.81427001953125, 0.8936309814453125, 0.972991943359375, 1.0523529052734375, 1.1317138671875, 1.2110748291015625, 1.290435791015625, 1.3697967529296875, 1.44915771484375, 1.5285186767578125, 1.607879638671875, 1.6872406005859375, 1.7666015625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 9.0, 14.0, 29.0, 116.0, 274.0, 1130.0, 1798.0, 498.0, 141.0, 47.0, 14.0, 8.0, 4.0, 1.0, 2.0, 1.0], "bins": [-3.560546875, -3.4948577880859375, -3.429168701171875, -3.3634796142578125, -3.29779052734375, -3.2321014404296875, -3.166412353515625, -3.1007232666015625, -3.0350341796875, -2.9693450927734375, -2.903656005859375, -2.8379669189453125, -2.77227783203125, -2.7065887451171875, -2.640899658203125, -2.5752105712890625, -2.509521484375, -2.4438323974609375, -2.378143310546875, -2.3124542236328125, -2.24676513671875, -2.1810760498046875, -2.115386962890625, -2.0496978759765625, -1.9840087890625, -1.9183197021484375, -1.852630615234375, -1.7869415283203125, -1.72125244140625, -1.6555633544921875, -1.589874267578125, -1.5241851806640625, -1.45849609375, -1.3928070068359375, -1.327117919921875, -1.2614288330078125, -1.19573974609375, -1.1300506591796875, -1.064361572265625, -0.9986724853515625, -0.9329833984375, -0.8672943115234375, -0.801605224609375, -0.7359161376953125, -0.67022705078125, -0.6045379638671875, -0.538848876953125, -0.4731597900390625, -0.407470703125, -0.3417816162109375, -0.276092529296875, -0.2104034423828125, -0.14471435546875, -0.0790252685546875, -0.013336181640625, 0.0523529052734375, 0.1180419921875, 0.1837310791015625, 0.249420166015625, 0.3151092529296875, 0.38079833984375, 0.4464874267578125, 0.512176513671875, 0.5778656005859375, 0.6435546875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 14.0, 24.0, 49.0, 87.0, 171.0, 316.0, 196.0, 78.0, 23.0, 17.0, 6.0, 1.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.600770950317383, -13.183714866638184, -12.7666597366333, -12.349603652954102, -11.932547569274902, -11.515491485595703, -11.09843635559082, -10.681380271911621, -10.264324188232422, -9.847268104553223, -9.43021297454834, -9.01315689086914, -8.596100807189941, -8.179044723510742, -7.761989593505859, -7.34493350982666, -6.927878379821777, -6.510822772979736, -6.093766689300537, -5.676711082458496, -5.259654998779297, -4.842599391937256, -4.425543785095215, -4.008487701416016, -3.5914320945739746, -3.1743762493133545, -2.7573204040527344, -2.3402647972106934, -1.9232089519500732, -1.5061531066894531, -1.089097499847412, -0.672041654586792, -0.2549858093261719, 0.16206997632980347, 0.5791257619857788, 0.9961814880371094, 1.4132373332977295, 1.8302931785583496, 2.2473487854003906, 2.6644046306610107, 3.081460475921631, 3.498516321182251, 3.915572166442871, 4.332627773284912, 4.749683380126953, 5.166739463806152, 5.583795070648193, 6.000850677490234, 6.417906761169434, 6.834962368011475, 7.252018451690674, 7.669074058532715, 8.086130142211914, 8.503185272216797, 8.920241355895996, 9.337297439575195, 9.754352569580078, 10.171408653259277, 10.58846378326416, 11.00551986694336, 11.422575950622559, 11.839632034301758, 12.25668716430664, 12.67374324798584, 13.090799331665039]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 2.0, 4.0, 8.0, 6.0, 10.0, 7.0, 17.0, 19.0, 18.0, 22.0, 31.0, 34.0, 36.0, 44.0, 57.0, 54.0, 69.0, 71.0, 58.0, 51.0, 43.0, 46.0, 46.0, 44.0, 28.0, 27.0, 42.0, 20.0, 13.0, 18.0, 14.0, 8.0, 9.0, 6.0, 5.0, 4.0, 1.0, 4.0, 4.0, 0.0, 0.0, 2.0, 2.0], "bins": [-7.489697456359863, -7.2925801277160645, -7.095462799072266, -6.898344993591309, -6.70122766494751, -6.504110336303711, -6.306993007659912, -6.109875679016113, -5.912757873535156, -5.715640544891357, -5.518523216247559, -5.321405410766602, -5.124288082122803, -4.927170753479004, -4.730053424835205, -4.532936096191406, -4.335818767547607, -4.138701438903809, -3.9415838718414307, -3.744466543197632, -3.547348976135254, -3.350231647491455, -3.1531143188476562, -2.9559969902038574, -2.7588794231414795, -2.5617620944976807, -2.3646445274353027, -2.167527198791504, -1.9704097509384155, -1.7732923030853271, -1.5761749744415283, -1.37905752658844, -1.1819405555725098, -0.9848231077194214, -0.7877057194709778, -0.5905883312225342, -0.3934708833694458, -0.19635343551635742, 0.0007638931274414062, 0.19788134098052979, 0.39499878883361816, 0.5921162366867065, 0.7892336249351501, 0.9863510131835938, 1.1834684610366821, 1.3805859088897705, 1.5777032375335693, 1.7748206853866577, 1.971938133239746, 2.169055461883545, 2.366173028945923, 2.5632903575897217, 2.7604079246520996, 2.9575252532958984, 3.1546425819396973, 3.351759910583496, 3.548877477645874, 3.745994806289673, 3.943112373352051, 4.14022970199585, 4.337347030639648, 4.5344648361206055, 4.731581687927246, 4.928699493408203, 5.125816822052002]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 6.0, 7.0, 12.0, 19.0, 23.0, 29.0, 43.0, 61.0, 142.0, 246.0, 380.0, 788.0, 1743.0, 4388.0, 12962.0, 51212.0, 272822.0, 544561.0, 119873.0, 26431.0, 7518.0, 2755.0, 1251.0, 557.0, 275.0, 171.0, 97.0, 57.0, 39.0, 23.0, 15.0, 14.0, 10.0, 8.0, 7.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79443359375, -0.7616958618164062, -0.7289581298828125, -0.6962203979492188, -0.663482666015625, -0.6307449340820312, -0.5980072021484375, -0.5652694702148438, -0.53253173828125, -0.49979400634765625, -0.4670562744140625, -0.43431854248046875, -0.401580810546875, -0.36884307861328125, -0.3361053466796875, -0.30336761474609375, -0.2706298828125, -0.23789215087890625, -0.2051544189453125, -0.17241668701171875, -0.139678955078125, -0.10694122314453125, -0.0742034912109375, -0.04146575927734375, -0.00872802734375, 0.02400970458984375, 0.0567474365234375, 0.08948516845703125, 0.122222900390625, 0.15496063232421875, 0.1876983642578125, 0.22043609619140625, 0.253173828125, 0.28591156005859375, 0.3186492919921875, 0.35138702392578125, 0.384124755859375, 0.41686248779296875, 0.4496002197265625, 0.48233795166015625, 0.51507568359375, 0.5478134155273438, 0.5805511474609375, 0.6132888793945312, 0.646026611328125, 0.6787643432617188, 0.7115020751953125, 0.7442398071289062, 0.7769775390625, 0.8097152709960938, 0.8424530029296875, 0.8751907348632812, 0.907928466796875, 0.9406661987304688, 0.9734039306640625, 1.0061416625976562, 1.03887939453125, 1.0716171264648438, 1.1043548583984375, 1.1370925903320312, 1.169830322265625, 1.2025680541992188, 1.2353057861328125, 1.2680435180664062, 1.30078125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 8.0, 9.0, 2.0, 10.0, 15.0, 7.0, 20.0, 34.0, 37.0, 38.0, 52.0, 63.0, 68.0, 65.0, 58.0, 56.0, 77.0, 45.0, 58.0, 48.0, 47.0, 46.0, 29.0, 23.0, 25.0, 17.0, 17.0, 5.0, 10.0, 4.0, 3.0, 0.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.51416015625, -0.5016937255859375, -0.489227294921875, -0.4767608642578125, -0.46429443359375, -0.4518280029296875, -0.439361572265625, -0.4268951416015625, -0.4144287109375, -0.4019622802734375, -0.389495849609375, -0.3770294189453125, -0.36456298828125, -0.3520965576171875, -0.339630126953125, -0.3271636962890625, -0.314697265625, -0.3022308349609375, -0.289764404296875, -0.2772979736328125, -0.26483154296875, -0.2523651123046875, -0.239898681640625, -0.2274322509765625, -0.2149658203125, -0.2024993896484375, -0.190032958984375, -0.1775665283203125, -0.16510009765625, -0.1526336669921875, -0.140167236328125, -0.1277008056640625, -0.115234375, -0.1027679443359375, -0.090301513671875, -0.0778350830078125, -0.06536865234375, -0.0529022216796875, -0.040435791015625, -0.0279693603515625, -0.0155029296875, -0.0030364990234375, 0.009429931640625, 0.0218963623046875, 0.03436279296875, 0.0468292236328125, 0.059295654296875, 0.0717620849609375, 0.084228515625, 0.0966949462890625, 0.109161376953125, 0.1216278076171875, 0.13409423828125, 0.1465606689453125, 0.159027099609375, 0.1714935302734375, 0.1839599609375, 0.1964263916015625, 0.208892822265625, 0.2213592529296875, 0.23382568359375, 0.2462921142578125, 0.258758544921875, 0.2712249755859375, 0.28369140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 6.0, 6.0, 12.0, 12.0, 19.0, 27.0, 44.0, 60.0, 98.0, 176.0, 366.0, 793.0, 2147.0, 11123.0, 288690.0, 722398.0, 17685.0, 2941.0, 946.0, 428.0, 226.0, 131.0, 67.0, 50.0, 29.0, 24.0, 16.0, 9.0, 6.0, 5.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.845703125, -2.762237548828125, -2.67877197265625, -2.595306396484375, -2.5118408203125, -2.428375244140625, -2.34490966796875, -2.261444091796875, -2.177978515625, -2.094512939453125, -2.01104736328125, -1.927581787109375, -1.8441162109375, -1.760650634765625, -1.67718505859375, -1.593719482421875, -1.51025390625, -1.426788330078125, -1.34332275390625, -1.259857177734375, -1.1763916015625, -1.092926025390625, -1.00946044921875, -0.925994873046875, -0.842529296875, -0.759063720703125, -0.67559814453125, -0.592132568359375, -0.5086669921875, -0.425201416015625, -0.34173583984375, -0.258270263671875, -0.1748046875, -0.091339111328125, -0.00787353515625, 0.075592041015625, 0.1590576171875, 0.242523193359375, 0.32598876953125, 0.409454345703125, 0.492919921875, 0.576385498046875, 0.65985107421875, 0.743316650390625, 0.8267822265625, 0.910247802734375, 0.99371337890625, 1.077178955078125, 1.16064453125, 1.244110107421875, 1.32757568359375, 1.411041259765625, 1.4945068359375, 1.577972412109375, 1.66143798828125, 1.744903564453125, 1.828369140625, 1.911834716796875, 1.99530029296875, 2.078765869140625, 2.1622314453125, 2.245697021484375, 2.32916259765625, 2.412628173828125, 2.49609375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 9.0, 7.0, 5.0, 6.0, 19.0, 18.0, 34.0, 35.0, 38.0, 44.0, 48.0, 57.0, 68.0, 54.0, 53.0, 81.0, 63.0, 62.0, 53.0, 53.0, 36.0, 44.0, 27.0, 24.0, 13.0, 15.0, 12.0, 5.0, 4.0, 6.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1484375, -2.0902252197265625, -2.032012939453125, -1.9738006591796875, -1.91558837890625, -1.8573760986328125, -1.799163818359375, -1.7409515380859375, -1.6827392578125, -1.6245269775390625, -1.566314697265625, -1.5081024169921875, -1.44989013671875, -1.3916778564453125, -1.333465576171875, -1.2752532958984375, -1.217041015625, -1.1588287353515625, -1.100616455078125, -1.0424041748046875, -0.98419189453125, -0.9259796142578125, -0.867767333984375, -0.8095550537109375, -0.7513427734375, -0.6931304931640625, -0.634918212890625, -0.5767059326171875, -0.51849365234375, -0.4602813720703125, -0.402069091796875, -0.3438568115234375, -0.28564453125, -0.2274322509765625, -0.169219970703125, -0.1110076904296875, -0.05279541015625, 0.0054168701171875, 0.063629150390625, 0.1218414306640625, 0.1800537109375, 0.2382659912109375, 0.296478271484375, 0.3546905517578125, 0.41290283203125, 0.4711151123046875, 0.529327392578125, 0.5875396728515625, 0.645751953125, 0.7039642333984375, 0.762176513671875, 0.8203887939453125, 0.87860107421875, 0.9368133544921875, 0.995025634765625, 1.0532379150390625, 1.1114501953125, 1.1696624755859375, 1.227874755859375, 1.2860870361328125, 1.34429931640625, 1.4025115966796875, 1.460723876953125, 1.5189361572265625, 1.5771484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 7.0, 2.0, 5.0, 11.0, 10.0, 18.0, 34.0, 72.0, 141.0, 377.0, 1180.0, 7855.0, 267899.0, 756966.0, 11686.0, 1535.0, 403.0, 156.0, 83.0, 43.0, 29.0, 17.0, 6.0, 4.0, 9.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3427734375, -1.2995758056640625, -1.256378173828125, -1.2131805419921875, -1.16998291015625, -1.1267852783203125, -1.083587646484375, -1.0403900146484375, -0.9971923828125, -0.9539947509765625, -0.910797119140625, -0.8675994873046875, -0.82440185546875, -0.7812042236328125, -0.738006591796875, -0.6948089599609375, -0.651611328125, -0.6084136962890625, -0.565216064453125, -0.5220184326171875, -0.47882080078125, -0.4356231689453125, -0.392425537109375, -0.3492279052734375, -0.3060302734375, -0.2628326416015625, -0.219635009765625, -0.1764373779296875, -0.13323974609375, -0.0900421142578125, -0.046844482421875, -0.0036468505859375, 0.03955078125, 0.0827484130859375, 0.125946044921875, 0.1691436767578125, 0.21234130859375, 0.2555389404296875, 0.298736572265625, 0.3419342041015625, 0.3851318359375, 0.4283294677734375, 0.471527099609375, 0.5147247314453125, 0.55792236328125, 0.6011199951171875, 0.644317626953125, 0.6875152587890625, 0.730712890625, 0.7739105224609375, 0.817108154296875, 0.8603057861328125, 0.90350341796875, 0.9467010498046875, 0.989898681640625, 1.0330963134765625, 1.0762939453125, 1.1194915771484375, 1.162689208984375, 1.2058868408203125, 1.24908447265625, 1.2922821044921875, 1.335479736328125, 1.3786773681640625, 1.421875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 5.0, 7.0, 19.0, 12.0, 19.0, 28.0, 25.0, 40.0, 55.0, 87.0, 143.0, 159.0, 124.0, 58.0, 51.0, 40.0, 21.0, 20.0, 10.0, 9.0, 11.0, 8.0, 10.0, 5.0, 4.0, 3.0, 7.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.00019502639770507812, -0.0001905187964439392, -0.0001860111951828003, -0.00018150359392166138, -0.00017699599266052246, -0.00017248839139938354, -0.00016798079013824463, -0.0001634731888771057, -0.0001589655876159668, -0.00015445798635482788, -0.00014995038509368896, -0.00014544278383255005, -0.00014093518257141113, -0.00013642758131027222, -0.0001319199800491333, -0.00012741237878799438, -0.00012290477752685547, -0.00011839717626571655, -0.00011388957500457764, -0.00010938197374343872, -0.0001048743724822998, -0.00010036677122116089, -9.585916996002197e-05, -9.135156869888306e-05, -8.684396743774414e-05, -8.233636617660522e-05, -7.782876491546631e-05, -7.332116365432739e-05, -6.881356239318848e-05, -6.430596113204956e-05, -5.9798359870910645e-05, -5.529075860977173e-05, -5.078315734863281e-05, -4.6275556087493896e-05, -4.176795482635498e-05, -3.7260353565216064e-05, -3.275275230407715e-05, -2.8245151042938232e-05, -2.3737549781799316e-05, -1.92299485206604e-05, -1.4722347259521484e-05, -1.0214745998382568e-05, -5.707144737243652e-06, -1.1995434761047363e-06, 3.3080577850341797e-06, 7.815659046173096e-06, 1.2323260307312012e-05, 1.6830861568450928e-05, 2.1338462829589844e-05, 2.584606409072876e-05, 3.0353665351867676e-05, 3.486126661300659e-05, 3.936886787414551e-05, 4.3876469135284424e-05, 4.838407039642334e-05, 5.2891671657562256e-05, 5.739927291870117e-05, 6.190687417984009e-05, 6.6414475440979e-05, 7.092207670211792e-05, 7.542967796325684e-05, 7.993727922439575e-05, 8.444488048553467e-05, 8.895248174667358e-05, 9.34600830078125e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 7.0, 14.0, 20.0, 26.0, 39.0, 57.0, 85.0, 128.0, 252.0, 435.0, 1062.0, 2783.0, 9675.0, 64024.0, 865281.0, 88155.0, 11074.0, 3157.0, 1197.0, 464.0, 243.0, 137.0, 74.0, 57.0, 34.0, 22.0, 15.0, 9.0, 6.0, 2.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7109375, -0.6868820190429688, -0.6628265380859375, -0.6387710571289062, -0.614715576171875, -0.5906600952148438, -0.5666046142578125, -0.5425491333007812, -0.51849365234375, -0.49443817138671875, -0.4703826904296875, -0.44632720947265625, -0.422271728515625, -0.39821624755859375, -0.3741607666015625, -0.35010528564453125, -0.3260498046875, -0.30199432373046875, -0.2779388427734375, -0.25388336181640625, -0.229827880859375, -0.20577239990234375, -0.1817169189453125, -0.15766143798828125, -0.13360595703125, -0.10955047607421875, -0.0854949951171875, -0.06143951416015625, -0.037384033203125, -0.01332855224609375, 0.0107269287109375, 0.03478240966796875, 0.058837890625, 0.08289337158203125, 0.1069488525390625, 0.13100433349609375, 0.155059814453125, 0.17911529541015625, 0.2031707763671875, 0.22722625732421875, 0.25128173828125, 0.27533721923828125, 0.2993927001953125, 0.32344818115234375, 0.347503662109375, 0.37155914306640625, 0.3956146240234375, 0.41967010498046875, 0.4437255859375, 0.46778106689453125, 0.4918365478515625, 0.5158920288085938, 0.539947509765625, 0.5640029907226562, 0.5880584716796875, 0.6121139526367188, 0.63616943359375, 0.6602249145507812, 0.6842803955078125, 0.7083358764648438, 0.732391357421875, 0.7564468383789062, 0.7805023193359375, 0.8045578002929688, 0.82861328125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 3.0, 6.0, 3.0, 6.0, 5.0, 13.0, 21.0, 28.0, 41.0, 46.0, 101.0, 130.0, 137.0, 155.0, 92.0, 63.0, 45.0, 23.0, 25.0, 17.0, 6.0, 4.0, 7.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7392578125, -0.7179718017578125, -0.696685791015625, -0.6753997802734375, -0.65411376953125, -0.6328277587890625, -0.611541748046875, -0.5902557373046875, -0.5689697265625, -0.5476837158203125, -0.526397705078125, -0.5051116943359375, -0.48382568359375, -0.4625396728515625, -0.441253662109375, -0.4199676513671875, -0.398681640625, -0.3773956298828125, -0.356109619140625, -0.3348236083984375, -0.31353759765625, -0.2922515869140625, -0.270965576171875, -0.2496795654296875, -0.2283935546875, -0.2071075439453125, -0.185821533203125, -0.1645355224609375, -0.14324951171875, -0.1219635009765625, -0.100677490234375, -0.0793914794921875, -0.05810546875, -0.0368194580078125, -0.015533447265625, 0.0057525634765625, 0.02703857421875, 0.0483245849609375, 0.069610595703125, 0.0908966064453125, 0.1121826171875, 0.1334686279296875, 0.154754638671875, 0.1760406494140625, 0.19732666015625, 0.2186126708984375, 0.239898681640625, 0.2611846923828125, 0.282470703125, 0.3037567138671875, 0.325042724609375, 0.3463287353515625, 0.36761474609375, 0.3889007568359375, 0.410186767578125, 0.4314727783203125, 0.4527587890625, 0.4740447998046875, 0.495330810546875, 0.5166168212890625, 0.53790283203125, 0.5591888427734375, 0.580474853515625, 0.6017608642578125, 0.623046875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 9.0, 16.0, 17.0, 64.0, 136.0, 275.0, 251.0, 138.0, 42.0, 22.0, 11.0, 6.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.772589683532715, -13.339581489562988, -12.906572341918945, -12.473564147949219, -12.040555953979492, -11.60754680633545, -11.174538612365723, -10.74152946472168, -10.308521270751953, -9.875513076782227, -9.442503929138184, -9.009495735168457, -8.57648754119873, -8.143478393554688, -7.710470199584961, -7.277461528778076, -6.84445333480835, -6.411444664001465, -5.978436470031738, -5.5454277992248535, -5.112419128417969, -4.679410934448242, -4.246402263641357, -3.8133935928344727, -3.380385160446167, -2.9473767280578613, -2.5143680572509766, -2.081359624862671, -1.6483510732650757, -1.2153425216674805, -0.7823340892791748, -0.34932541847229004, 0.08368301391601562, 0.5166915655136108, 0.9497000575065613, 1.3827085494995117, 1.815717101097107, 2.248725652694702, 2.681734085083008, 3.1147427558898926, 3.5477511882781982, 3.980759620666504, 4.413768291473389, 4.846776962280273, 5.27978515625, 5.712793827056885, 6.1458024978637695, 6.578810691833496, 7.011819362640381, 7.444828033447266, 7.877836227416992, 8.310844421386719, 8.743853569030762, 9.176861763000488, 9.609870910644531, 10.042879104614258, 10.475887298583984, 10.908895492553711, 11.341904640197754, 11.77491283416748, 12.207921028137207, 12.64093017578125, 13.073938369750977, 13.506946563720703, 13.939955711364746]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 9.0, 5.0, 6.0, 8.0, 9.0, 13.0, 14.0, 18.0, 21.0, 26.0, 24.0, 24.0, 35.0, 35.0, 43.0, 51.0, 61.0, 57.0, 67.0, 60.0, 63.0, 56.0, 34.0, 31.0, 39.0, 25.0, 20.0, 17.0, 24.0, 27.0, 21.0, 14.0, 11.0, 7.0, 8.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.163899898529053, -6.953677654266357, -6.743455410003662, -6.533233165740967, -6.323010444641113, -6.112788200378418, -5.902565956115723, -5.692343711853027, -5.482121467590332, -5.271899223327637, -5.061676979064941, -4.851454734802246, -4.641232490539551, -4.4310102462768555, -4.220787525177002, -4.010565280914307, -3.8003430366516113, -3.590120792388916, -3.3798985481262207, -3.1696760654449463, -2.959453821182251, -2.7492315769195557, -2.5390090942382812, -2.328786849975586, -2.1185646057128906, -1.9083423614501953, -1.6981199979782104, -1.4878976345062256, -1.2776753902435303, -1.067453145980835, -0.8572307825088501, -0.6470084190368652, -0.4367856979370117, -0.22656339406967163, -0.016341090202331543, 0.19388121366500854, 0.40410351753234863, 0.614325761795044, 0.8245481252670288, 1.0347704887390137, 1.244992733001709, 1.4552149772644043, 1.6654373407363892, 1.875659704208374, 2.0858819484710693, 2.2961041927337646, 2.506326675415039, 2.7165489196777344, 2.9267711639404297, 3.136993408203125, 3.3472156524658203, 3.5574381351470947, 3.76766037940979, 3.9778826236724854, 4.18810510635376, 4.398327350616455, 4.60854959487915, 4.818771839141846, 5.028994083404541, 5.239216327667236, 5.44943904876709, 5.659661293029785, 5.8698835372924805, 6.080105781555176, 6.290328025817871]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 6.0, 8.0, 10.0, 16.0, 27.0, 36.0, 55.0, 78.0, 121.0, 206.0, 384.0, 680.0, 1525.0, 4489.0, 21623.0, 415345.0, 3628384.0, 104875.0, 11297.0, 2796.0, 982.0, 503.0, 282.0, 160.0, 110.0, 65.0, 46.0, 45.0, 29.0, 16.0, 16.0, 11.0, 8.0, 7.0, 7.0, 7.0, 2.0, 7.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0], "bins": [-0.85986328125, -0.8340530395507812, -0.8082427978515625, -0.7824325561523438, -0.756622314453125, -0.7308120727539062, -0.7050018310546875, -0.6791915893554688, -0.65338134765625, -0.6275711059570312, -0.6017608642578125, -0.5759506225585938, -0.550140380859375, -0.5243301391601562, -0.4985198974609375, -0.47270965576171875, -0.4468994140625, -0.42108917236328125, -0.3952789306640625, -0.36946868896484375, -0.343658447265625, -0.31784820556640625, -0.2920379638671875, -0.26622772216796875, -0.24041748046875, -0.21460723876953125, -0.1887969970703125, -0.16298675537109375, -0.137176513671875, -0.11136627197265625, -0.0855560302734375, -0.05974578857421875, -0.033935546875, -0.00812530517578125, 0.0176849365234375, 0.04349517822265625, 0.069305419921875, 0.09511566162109375, 0.1209259033203125, 0.14673614501953125, 0.17254638671875, 0.19835662841796875, 0.2241668701171875, 0.24997711181640625, 0.275787353515625, 0.30159759521484375, 0.3274078369140625, 0.35321807861328125, 0.3790283203125, 0.40483856201171875, 0.4306488037109375, 0.45645904541015625, 0.482269287109375, 0.5080795288085938, 0.5338897705078125, 0.5597000122070312, 0.58551025390625, 0.6113204956054688, 0.6371307373046875, 0.6629409790039062, 0.688751220703125, 0.7145614624023438, 0.7403717041015625, 0.7661819458007812, 0.7919921875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 3.0, 8.0, 7.0, 16.0, 24.0, 20.0, 44.0, 35.0, 52.0, 54.0, 68.0, 70.0, 75.0, 59.0, 67.0, 68.0, 76.0, 55.0, 59.0, 25.0, 30.0, 22.0, 22.0, 21.0, 11.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.373291015625, -0.3600883483886719, -0.34688568115234375, -0.3336830139160156, -0.3204803466796875, -0.3072776794433594, -0.29407501220703125, -0.2808723449707031, -0.267669677734375, -0.2544670104980469, -0.24126434326171875, -0.22806167602539062, -0.2148590087890625, -0.20165634155273438, -0.18845367431640625, -0.17525100708007812, -0.16204833984375, -0.14884567260742188, -0.13564300537109375, -0.12244033813476562, -0.1092376708984375, -0.09603500366210938, -0.08283233642578125, -0.06962966918945312, -0.056427001953125, -0.043224334716796875, -0.03002166748046875, -0.016819000244140625, -0.0036163330078125, 0.009586334228515625, 0.02278900146484375, 0.035991668701171875, 0.0491943359375, 0.062397003173828125, 0.07559967041015625, 0.08880233764648438, 0.1020050048828125, 0.11520767211914062, 0.12841033935546875, 0.14161300659179688, 0.154815673828125, 0.16801834106445312, 0.18122100830078125, 0.19442367553710938, 0.2076263427734375, 0.22082901000976562, 0.23403167724609375, 0.24723434448242188, 0.26043701171875, 0.2736396789550781, 0.28684234619140625, 0.3000450134277344, 0.3132476806640625, 0.3264503479003906, 0.33965301513671875, 0.3528556823730469, 0.366058349609375, 0.3792610168457031, 0.39246368408203125, 0.4056663513183594, 0.4188690185546875, 0.4320716857910156, 0.44527435302734375, 0.4584770202636719, 0.4716796875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 13.0, 26.0, 40.0, 51.0, 73.0, 92.0, 145.0, 298.0, 1036.0, 65808.0, 4123696.0, 2439.0, 307.0, 100.0, 51.0, 26.0, 33.0, 22.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75390625, -4.606201171875, -4.45849609375, -4.310791015625, -4.1630859375, -4.015380859375, -3.86767578125, -3.719970703125, -3.572265625, -3.424560546875, -3.27685546875, -3.129150390625, -2.9814453125, -2.833740234375, -2.68603515625, -2.538330078125, -2.390625, -2.242919921875, -2.09521484375, -1.947509765625, -1.7998046875, -1.652099609375, -1.50439453125, -1.356689453125, -1.208984375, -1.061279296875, -0.91357421875, -0.765869140625, -0.6181640625, -0.470458984375, -0.32275390625, -0.175048828125, -0.02734375, 0.120361328125, 0.26806640625, 0.415771484375, 0.5634765625, 0.711181640625, 0.85888671875, 1.006591796875, 1.154296875, 1.302001953125, 1.44970703125, 1.597412109375, 1.7451171875, 1.892822265625, 2.04052734375, 2.188232421875, 2.3359375, 2.483642578125, 2.63134765625, 2.779052734375, 2.9267578125, 3.074462890625, 3.22216796875, 3.369873046875, 3.517578125, 3.665283203125, 3.81298828125, 3.960693359375, 4.1083984375, 4.256103515625, 4.40380859375, 4.551513671875, 4.69921875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 13.0, 32.0, 223.0, 2623.0, 1068.0, 106.0, 14.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-5.93359375, -5.825370788574219, -5.7171478271484375, -5.608924865722656, -5.500701904296875, -5.392478942871094, -5.2842559814453125, -5.176033020019531, -5.06781005859375, -4.959587097167969, -4.8513641357421875, -4.743141174316406, -4.634918212890625, -4.526695251464844, -4.4184722900390625, -4.310249328613281, -4.2020263671875, -4.093803405761719, -3.9855804443359375, -3.8773574829101562, -3.769134521484375, -3.6609115600585938, -3.5526885986328125, -3.4444656372070312, -3.33624267578125, -3.2280197143554688, -3.1197967529296875, -3.0115737915039062, -2.903350830078125, -2.7951278686523438, -2.6869049072265625, -2.5786819458007812, -2.470458984375, -2.3622360229492188, -2.2540130615234375, -2.1457901000976562, -2.037567138671875, -1.9293441772460938, -1.8211212158203125, -1.7128982543945312, -1.60467529296875, -1.4964523315429688, -1.3882293701171875, -1.2800064086914062, -1.171783447265625, -1.0635604858398438, -0.9553375244140625, -0.8471145629882812, -0.7388916015625, -0.6306686401367188, -0.5224456787109375, -0.41422271728515625, -0.305999755859375, -0.19777679443359375, -0.0895538330078125, 0.01866912841796875, 0.12689208984375, 0.23511505126953125, 0.3433380126953125, 0.45156097412109375, 0.559783935546875, 0.6680068969726562, 0.7762298583984375, 0.8844528198242188, 0.99267578125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 12.0, 19.0, 39.0, 136.0, 490.0, 242.0, 39.0, 11.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.63571548461914, -22.935924530029297, -22.236133575439453, -21.536344528198242, -20.8365535736084, -20.136762619018555, -19.436973571777344, -18.7371826171875, -18.037391662597656, -17.337600708007812, -16.63780975341797, -15.938020706176758, -15.238229751586914, -14.53843879699707, -13.838648796081543, -13.138858795166016, -12.439067840576172, -11.739276885986328, -11.0394868850708, -10.339696884155273, -9.63990592956543, -8.940114974975586, -8.240324974060059, -7.540534496307373, -6.8407440185546875, -6.140953540802002, -5.441163063049316, -4.741372585296631, -4.041582107543945, -3.3417916297912598, -2.642001152038574, -1.9422106742858887, -1.2424201965332031, -0.5426297187805176, 0.15716075897216797, 0.8569512367248535, 1.556741714477539, 2.2565321922302246, 2.95632266998291, 3.6561131477355957, 4.355903625488281, 5.055694103240967, 5.755484580993652, 6.455275058746338, 7.155065536499023, 7.854856014251709, 8.554646492004395, 9.254436492919922, 9.954227447509766, 10.65401840209961, 11.353808403015137, 12.053598403930664, 12.753389358520508, 13.453180313110352, 14.152970314025879, 14.852760314941406, 15.55255126953125, 16.252342224121094, 16.952133178710938, 17.65192222595215, 18.351713180541992, 19.051504135131836, 19.751293182373047, 20.45108413696289, 21.150875091552734]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 9.0, 10.0, 20.0, 22.0, 26.0, 31.0, 46.0, 48.0, 49.0, 46.0, 65.0, 50.0, 63.0, 53.0, 75.0, 60.0, 47.0, 41.0, 41.0, 43.0, 29.0, 16.0, 21.0, 13.0, 13.0, 15.0, 9.0, 10.0, 4.0, 2.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.843503952026367, -5.640341758728027, -5.4371795654296875, -5.234017372131348, -5.030855178833008, -4.827692985534668, -4.624530792236328, -4.421368598937988, -4.218206405639648, -4.015044212341309, -3.8118820190429688, -3.608719825744629, -3.405557632446289, -3.202395439147949, -2.9992332458496094, -2.7960710525512695, -2.5929086208343506, -2.3897464275360107, -2.186584234237671, -1.983422040939331, -1.7802598476409912, -1.5770975351333618, -1.373935341835022, -1.1707731485366821, -0.9676109552383423, -0.7644487619400024, -0.5612865686416626, -0.358124315738678, -0.15496212244033813, 0.048200130462646484, 0.25136232376098633, 0.45452451705932617, 0.657686710357666, 0.8608489036560059, 1.0640110969543457, 1.2671732902526855, 1.4703354835510254, 1.6734977960586548, 1.8766599893569946, 2.079822063446045, 2.2829842567443848, 2.4861464500427246, 2.6893086433410645, 2.8924708366394043, 3.095633029937744, 3.298795223236084, 3.501957416534424, 3.7051196098327637, 3.9082820415496826, 4.111444473266602, 4.314606666564941, 4.517768859863281, 4.720931053161621, 4.924093246459961, 5.127255439758301, 5.330417633056641, 5.5335798263549805, 5.73674201965332, 5.93990421295166, 6.14306640625, 6.34622859954834, 6.54939079284668, 6.7525529861450195, 6.955715179443359, 7.158877372741699]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 8.0, 13.0, 13.0, 14.0, 19.0, 23.0, 43.0, 60.0, 102.0, 137.0, 224.0, 423.0, 822.0, 2333.0, 9484.0, 61004.0, 489585.0, 421932.0, 50258.0, 8125.0, 2140.0, 800.0, 389.0, 186.0, 135.0, 78.0, 53.0, 45.0, 28.0, 21.0, 11.0, 16.0, 9.0, 9.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.005859375, -0.96710205078125, -0.9283447265625, -0.88958740234375, -0.850830078125, -0.81207275390625, -0.7733154296875, -0.73455810546875, -0.69580078125, -0.65704345703125, -0.6182861328125, -0.57952880859375, -0.540771484375, -0.50201416015625, -0.4632568359375, -0.42449951171875, -0.3857421875, -0.34698486328125, -0.3082275390625, -0.26947021484375, -0.230712890625, -0.19195556640625, -0.1531982421875, -0.11444091796875, -0.07568359375, -0.03692626953125, 0.0018310546875, 0.04058837890625, 0.079345703125, 0.11810302734375, 0.1568603515625, 0.19561767578125, 0.234375, 0.27313232421875, 0.3118896484375, 0.35064697265625, 0.389404296875, 0.42816162109375, 0.4669189453125, 0.50567626953125, 0.54443359375, 0.58319091796875, 0.6219482421875, 0.66070556640625, 0.699462890625, 0.73822021484375, 0.7769775390625, 0.81573486328125, 0.8544921875, 0.89324951171875, 0.9320068359375, 0.97076416015625, 1.009521484375, 1.04827880859375, 1.0870361328125, 1.12579345703125, 1.16455078125, 1.20330810546875, 1.2420654296875, 1.28082275390625, 1.319580078125, 1.35833740234375, 1.3970947265625, 1.43585205078125, 1.474609375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 9.0, 13.0, 19.0, 24.0, 26.0, 38.0, 35.0, 41.0, 51.0, 50.0, 53.0, 47.0, 68.0, 53.0, 59.0, 69.0, 56.0, 44.0, 49.0, 39.0, 35.0, 30.0, 20.0, 18.0, 15.0, 12.0, 10.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.372802734375, -0.3595428466796875, -0.346282958984375, -0.3330230712890625, -0.31976318359375, -0.3065032958984375, -0.293243408203125, -0.2799835205078125, -0.2667236328125, -0.2534637451171875, -0.240203857421875, -0.2269439697265625, -0.21368408203125, -0.2004241943359375, -0.187164306640625, -0.1739044189453125, -0.16064453125, -0.1473846435546875, -0.134124755859375, -0.1208648681640625, -0.10760498046875, -0.0943450927734375, -0.081085205078125, -0.0678253173828125, -0.0545654296875, -0.0413055419921875, -0.028045654296875, -0.0147857666015625, -0.00152587890625, 0.0117340087890625, 0.024993896484375, 0.0382537841796875, 0.051513671875, 0.0647735595703125, 0.078033447265625, 0.0912933349609375, 0.10455322265625, 0.1178131103515625, 0.131072998046875, 0.1443328857421875, 0.1575927734375, 0.1708526611328125, 0.184112548828125, 0.1973724365234375, 0.21063232421875, 0.2238922119140625, 0.237152099609375, 0.2504119873046875, 0.263671875, 0.2769317626953125, 0.290191650390625, 0.3034515380859375, 0.31671142578125, 0.3299713134765625, 0.343231201171875, 0.3564910888671875, 0.3697509765625, 0.3830108642578125, 0.396270751953125, 0.4095306396484375, 0.42279052734375, 0.4360504150390625, 0.449310302734375, 0.4625701904296875, 0.475830078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 10.0, 9.0, 8.0, 15.0, 13.0, 21.0, 19.0, 40.0, 56.0, 88.0, 114.0, 228.0, 374.0, 757.0, 1685.0, 4252.0, 13280.0, 53742.0, 265612.0, 580649.0, 95005.0, 21566.0, 6329.0, 2382.0, 1036.0, 527.0, 257.0, 149.0, 90.0, 50.0, 50.0, 35.0, 23.0, 17.0, 17.0, 10.0, 8.0, 10.0, 5.0, 3.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.009765625, -0.980224609375, -0.95068359375, -0.921142578125, -0.8916015625, -0.862060546875, -0.83251953125, -0.802978515625, -0.7734375, -0.743896484375, -0.71435546875, -0.684814453125, -0.6552734375, -0.625732421875, -0.59619140625, -0.566650390625, -0.537109375, -0.507568359375, -0.47802734375, -0.448486328125, -0.4189453125, -0.389404296875, -0.35986328125, -0.330322265625, -0.30078125, -0.271240234375, -0.24169921875, -0.212158203125, -0.1826171875, -0.153076171875, -0.12353515625, -0.093994140625, -0.064453125, -0.034912109375, -0.00537109375, 0.024169921875, 0.0537109375, 0.083251953125, 0.11279296875, 0.142333984375, 0.171875, 0.201416015625, 0.23095703125, 0.260498046875, 0.2900390625, 0.319580078125, 0.34912109375, 0.378662109375, 0.408203125, 0.437744140625, 0.46728515625, 0.496826171875, 0.5263671875, 0.555908203125, 0.58544921875, 0.614990234375, 0.64453125, 0.674072265625, 0.70361328125, 0.733154296875, 0.7626953125, 0.792236328125, 0.82177734375, 0.851318359375, 0.880859375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 8.0, 5.0, 5.0, 9.0, 5.0, 5.0, 15.0, 14.0, 17.0, 21.0, 25.0, 21.0, 30.0, 36.0, 48.0, 31.0, 39.0, 48.0, 42.0, 64.0, 54.0, 53.0, 43.0, 42.0, 40.0, 39.0, 40.0, 29.0, 29.0, 29.0, 19.0, 14.0, 26.0, 17.0, 8.0, 8.0, 8.0, 5.0, 9.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.279296875, -1.2348480224609375, -1.190399169921875, -1.1459503173828125, -1.10150146484375, -1.0570526123046875, -1.012603759765625, -0.9681549072265625, -0.9237060546875, -0.8792572021484375, -0.834808349609375, -0.7903594970703125, -0.74591064453125, -0.7014617919921875, -0.657012939453125, -0.6125640869140625, -0.568115234375, -0.5236663818359375, -0.479217529296875, -0.4347686767578125, -0.39031982421875, -0.3458709716796875, -0.301422119140625, -0.2569732666015625, -0.2125244140625, -0.1680755615234375, -0.123626708984375, -0.0791778564453125, -0.03472900390625, 0.0097198486328125, 0.054168701171875, 0.0986175537109375, 0.14306640625, 0.1875152587890625, 0.231964111328125, 0.2764129638671875, 0.32086181640625, 0.3653106689453125, 0.409759521484375, 0.4542083740234375, 0.4986572265625, 0.5431060791015625, 0.587554931640625, 0.6320037841796875, 0.67645263671875, 0.7209014892578125, 0.765350341796875, 0.8097991943359375, 0.854248046875, 0.8986968994140625, 0.943145751953125, 0.9875946044921875, 1.03204345703125, 1.0764923095703125, 1.120941162109375, 1.1653900146484375, 1.2098388671875, 1.2542877197265625, 1.298736572265625, 1.3431854248046875, 1.38763427734375, 1.4320831298828125, 1.476531982421875, 1.5209808349609375, 1.5654296875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 5.0, 9.0, 5.0, 12.0, 12.0, 15.0, 21.0, 34.0, 63.0, 69.0, 124.0, 171.0, 324.0, 564.0, 1233.0, 2666.0, 6526.0, 17778.0, 55988.0, 220788.0, 580610.0, 110914.0, 31820.0, 10949.0, 4104.0, 1844.0, 825.0, 432.0, 221.0, 134.0, 110.0, 70.0, 24.0, 22.0, 16.0, 12.0, 5.0, 7.0, 5.0, 9.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.24365234375, -0.2350311279296875, -0.226409912109375, -0.2177886962890625, -0.20916748046875, -0.2005462646484375, -0.191925048828125, -0.1833038330078125, -0.1746826171875, -0.1660614013671875, -0.157440185546875, -0.1488189697265625, -0.14019775390625, -0.1315765380859375, -0.122955322265625, -0.1143341064453125, -0.105712890625, -0.0970916748046875, -0.088470458984375, -0.0798492431640625, -0.07122802734375, -0.0626068115234375, -0.053985595703125, -0.0453643798828125, -0.0367431640625, -0.0281219482421875, -0.019500732421875, -0.0108795166015625, -0.00225830078125, 0.0063629150390625, 0.014984130859375, 0.0236053466796875, 0.0322265625, 0.0408477783203125, 0.049468994140625, 0.0580902099609375, 0.06671142578125, 0.0753326416015625, 0.083953857421875, 0.0925750732421875, 0.1011962890625, 0.1098175048828125, 0.118438720703125, 0.1270599365234375, 0.13568115234375, 0.1443023681640625, 0.152923583984375, 0.1615447998046875, 0.170166015625, 0.1787872314453125, 0.187408447265625, 0.1960296630859375, 0.20465087890625, 0.2132720947265625, 0.221893310546875, 0.2305145263671875, 0.2391357421875, 0.2477569580078125, 0.256378173828125, 0.2649993896484375, 0.27362060546875, 0.2822418212890625, 0.290863037109375, 0.2994842529296875, 0.30810546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 3.0, 5.0, 0.0, 6.0, 3.0, 5.0, 4.0, 9.0, 7.0, 8.0, 9.0, 23.0, 15.0, 29.0, 36.0, 57.0, 101.0, 137.0, 151.0, 112.0, 79.0, 53.0, 56.0, 25.0, 21.0, 10.0, 10.0, 8.0, 4.0, 5.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.914138793945312e-05, -6.59450888633728e-05, -6.274878978729248e-05, -5.955249071121216e-05, -5.6356191635131836e-05, -5.3159892559051514e-05, -4.996359348297119e-05, -4.676729440689087e-05, -4.357099533081055e-05, -4.0374696254730225e-05, -3.71783971786499e-05, -3.398209810256958e-05, -3.078579902648926e-05, -2.7589499950408936e-05, -2.4393200874328613e-05, -2.119690179824829e-05, -1.800060272216797e-05, -1.4804303646087646e-05, -1.1608004570007324e-05, -8.411705493927002e-06, -5.21540641784668e-06, -2.0191073417663574e-06, 1.1771917343139648e-06, 4.373490810394287e-06, 7.569789886474609e-06, 1.0766088962554932e-05, 1.3962388038635254e-05, 1.7158687114715576e-05, 2.03549861907959e-05, 2.355128526687622e-05, 2.6747584342956543e-05, 2.9943883419036865e-05, 3.314018249511719e-05, 3.633648157119751e-05, 3.953278064727783e-05, 4.2729079723358154e-05, 4.5925378799438477e-05, 4.91216778755188e-05, 5.231797695159912e-05, 5.551427602767944e-05, 5.8710575103759766e-05, 6.190687417984009e-05, 6.510317325592041e-05, 6.829947233200073e-05, 7.149577140808105e-05, 7.469207048416138e-05, 7.78883695602417e-05, 8.108466863632202e-05, 8.428096771240234e-05, 8.747726678848267e-05, 9.067356586456299e-05, 9.386986494064331e-05, 9.706616401672363e-05, 0.00010026246309280396, 0.00010345876216888428, 0.0001066550612449646, 0.00010985136032104492, 0.00011304765939712524, 0.00011624395847320557, 0.00011944025754928589, 0.0001226365566253662, 0.00012583285570144653, 0.00012902915477752686, 0.00013222545385360718, 0.0001354217529296875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 8.0, 6.0, 7.0, 10.0, 16.0, 16.0, 35.0, 67.0, 114.0, 185.0, 352.0, 761.0, 1624.0, 4288.0, 13385.0, 50357.0, 248065.0, 602770.0, 92974.0, 22241.0, 6802.0, 2337.0, 1082.0, 460.0, 241.0, 140.0, 78.0, 48.0, 33.0, 13.0, 19.0, 15.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.43310546875, -0.4225940704345703, -0.4120826721191406, -0.40157127380371094, -0.39105987548828125, -0.38054847717285156, -0.3700370788574219, -0.3595256805419922, -0.3490142822265625, -0.3385028839111328, -0.3279914855957031, -0.31748008728027344, -0.30696868896484375, -0.29645729064941406, -0.2859458923339844, -0.2754344940185547, -0.264923095703125, -0.2544116973876953, -0.24390029907226562, -0.23338890075683594, -0.22287750244140625, -0.21236610412597656, -0.20185470581054688, -0.1913433074951172, -0.1808319091796875, -0.1703205108642578, -0.15980911254882812, -0.14929771423339844, -0.13878631591796875, -0.12827491760253906, -0.11776351928710938, -0.10725212097167969, -0.09674072265625, -0.08622932434082031, -0.07571792602539062, -0.06520652770996094, -0.05469512939453125, -0.04418373107910156, -0.033672332763671875, -0.023160934448242188, -0.0126495361328125, -0.0021381378173828125, 0.008373260498046875, 0.018884658813476562, 0.02939605712890625, 0.03990745544433594, 0.050418853759765625, 0.06093025207519531, 0.071441650390625, 0.08195304870605469, 0.09246444702148438, 0.10297584533691406, 0.11348724365234375, 0.12399864196777344, 0.13451004028320312, 0.1450214385986328, 0.1555328369140625, 0.1660442352294922, 0.17655563354492188, 0.18706703186035156, 0.19757843017578125, 0.20808982849121094, 0.21860122680664062, 0.2291126251220703, 0.2396240234375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 11.0, 5.0, 12.0, 20.0, 25.0, 45.0, 45.0, 87.0, 107.0, 124.0, 111.0, 107.0, 81.0, 76.0, 28.0, 28.0, 25.0, 16.0, 17.0, 12.0, 5.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5180549621582031, -0.5019302368164062, -0.4858055114746094, -0.4696807861328125, -0.4535560607910156, -0.43743133544921875, -0.4213066101074219, -0.405181884765625, -0.3890571594238281, -0.37293243408203125, -0.3568077087402344, -0.3406829833984375, -0.3245582580566406, -0.30843353271484375, -0.2923088073730469, -0.27618408203125, -0.2600593566894531, -0.24393463134765625, -0.22780990600585938, -0.2116851806640625, -0.19556045532226562, -0.17943572998046875, -0.16331100463867188, -0.147186279296875, -0.13106155395507812, -0.11493682861328125, -0.09881210327148438, -0.0826873779296875, -0.06656265258789062, -0.05043792724609375, -0.034313201904296875, -0.0181884765625, -0.002063751220703125, 0.01406097412109375, 0.030185699462890625, 0.0463104248046875, 0.062435150146484375, 0.07855987548828125, 0.09468460083007812, 0.110809326171875, 0.12693405151367188, 0.14305877685546875, 0.15918350219726562, 0.1753082275390625, 0.19143295288085938, 0.20755767822265625, 0.22368240356445312, 0.23980712890625, 0.2559318542480469, 0.27205657958984375, 0.2881813049316406, 0.3043060302734375, 0.3204307556152344, 0.33655548095703125, 0.3526802062988281, 0.368804931640625, 0.3849296569824219, 0.40105438232421875, 0.4171791076660156, 0.4333038330078125, 0.4494285583496094, 0.46555328369140625, 0.4816780090332031, 0.497802734375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 7.0, 5.0, 13.0, 20.0, 46.0, 119.0, 211.0, 284.0, 153.0, 76.0, 31.0, 13.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.921339988708496, -11.572976112365723, -11.22461223602295, -10.876248359680176, -10.527884483337402, -10.179520606994629, -9.831157684326172, -9.482793807983398, -9.134429931640625, -8.786066055297852, -8.437702178955078, -8.089338302612305, -7.740974426269531, -7.392610549926758, -7.044247150421143, -6.695883274078369, -6.3475189208984375, -5.999155044555664, -5.650791168212891, -5.302427291870117, -4.954063415527344, -4.60569953918457, -4.257336139678955, -3.9089722633361816, -3.560608386993408, -3.2122445106506348, -2.8638806343078613, -2.515516996383667, -2.1671531200408936, -1.8187892436981201, -1.4704256057739258, -1.1220617294311523, -0.7736978530883789, -0.42533403635025024, -0.07697021961212158, 0.2713935375213623, 0.6197574138641357, 0.9681212902069092, 1.3164849281311035, 1.664848804473877, 2.0132126808166504, 2.361576557159424, 2.7099404335021973, 3.0583040714263916, 3.406667947769165, 3.7550318241119385, 4.103395462036133, 4.451759338378906, 4.80012321472168, 5.148487091064453, 5.496850967407227, 5.84521484375, 6.193578720092773, 6.541942596435547, 6.890305995941162, 7.2386698722839355, 7.587033748626709, 7.935397624969482, 8.283761024475098, 8.632124900817871, 8.980488777160645, 9.328852653503418, 9.677216529846191, 10.025580406188965, 10.373944282531738]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 3.0, 7.0, 5.0, 10.0, 9.0, 12.0, 10.0, 13.0, 15.0, 23.0, 37.0, 22.0, 24.0, 26.0, 31.0, 29.0, 40.0, 50.0, 57.0, 70.0, 75.0, 77.0, 43.0, 43.0, 34.0, 39.0, 35.0, 21.0, 31.0, 17.0, 21.0, 13.0, 16.0, 10.0, 6.0, 9.0, 6.0, 2.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-8.065862655639648, -7.836196422576904, -7.606529712677002, -7.376863479614258, -7.147197246551514, -6.9175310134887695, -6.687864303588867, -6.458198070526123, -6.228531837463379, -5.998865604400635, -5.769198894500732, -5.539532661437988, -5.309866428375244, -5.0802001953125, -4.850533485412598, -4.6208672523498535, -4.391200542449951, -4.161534309387207, -3.931867837905884, -3.7022013664245605, -3.4725351333618164, -3.242868661880493, -3.01320219039917, -2.783535957336426, -2.5538694858551025, -2.3242030143737793, -2.094536781311035, -1.864870309829712, -1.6352039575576782, -1.4055376052856445, -1.1758711338043213, -0.9462047815322876, -0.7165389060974121, -0.48687252402305603, -0.25720614194869995, -0.027539730072021484, 0.2021266222000122, 0.4317929744720459, 0.6614594459533691, 0.8911257982254028, 1.1207921504974365, 1.3504585027694702, 1.580124855041504, 1.8097913265228271, 2.0394577980041504, 2.2691240310668945, 2.4987905025482178, 2.728456974029541, 2.958123207092285, 3.1877896785736084, 3.4174559116363525, 3.647122383117676, 3.87678861618042, 4.106454849243164, 4.336121559143066, 4.5657877922058105, 4.795454025268555, 5.025120258331299, 5.254786968231201, 5.484453201293945, 5.7141194343566895, 5.943785667419434, 6.173452377319336, 6.40311861038208, 6.632785320281982]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 11.0, 11.0, 6.0, 9.0, 31.0, 40.0, 64.0, 109.0, 283.0, 537.0, 1412.0, 4792.0, 26763.0, 573097.0, 3452605.0, 118450.0, 11821.0, 2592.0, 884.0, 339.0, 164.0, 94.0, 42.0, 29.0, 20.0, 16.0, 10.0, 12.0, 9.0, 6.0, 4.0, 4.0, 5.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.82177734375, -0.7955093383789062, -0.7692413330078125, -0.7429733276367188, -0.716705322265625, -0.6904373168945312, -0.6641693115234375, -0.6379013061523438, -0.61163330078125, -0.5853652954101562, -0.5590972900390625, -0.5328292846679688, -0.506561279296875, -0.48029327392578125, -0.4540252685546875, -0.42775726318359375, -0.4014892578125, -0.37522125244140625, -0.3489532470703125, -0.32268524169921875, -0.296417236328125, -0.27014923095703125, -0.2438812255859375, -0.21761322021484375, -0.19134521484375, -0.16507720947265625, -0.1388092041015625, -0.11254119873046875, -0.086273193359375, -0.06000518798828125, -0.0337371826171875, -0.00746917724609375, 0.018798828125, 0.04506683349609375, 0.0713348388671875, 0.09760284423828125, 0.123870849609375, 0.15013885498046875, 0.1764068603515625, 0.20267486572265625, 0.22894287109375, 0.25521087646484375, 0.2814788818359375, 0.30774688720703125, 0.334014892578125, 0.36028289794921875, 0.3865509033203125, 0.41281890869140625, 0.4390869140625, 0.46535491943359375, 0.4916229248046875, 0.5178909301757812, 0.544158935546875, 0.5704269409179688, 0.5966949462890625, 0.6229629516601562, 0.64923095703125, 0.6754989624023438, 0.7017669677734375, 0.7280349731445312, 0.754302978515625, 0.7805709838867188, 0.8068389892578125, 0.8331069946289062, 0.859375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 6.0, 7.0, 11.0, 6.0, 12.0, 18.0, 18.0, 35.0, 39.0, 32.0, 40.0, 64.0, 57.0, 64.0, 60.0, 53.0, 59.0, 62.0, 61.0, 43.0, 55.0, 39.0, 32.0, 27.0, 36.0, 17.0, 12.0, 10.0, 11.0, 10.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.389404296875, -0.3757972717285156, -0.36219024658203125, -0.3485832214355469, -0.3349761962890625, -0.3213691711425781, -0.30776214599609375, -0.2941551208496094, -0.280548095703125, -0.2669410705566406, -0.25333404541015625, -0.23972702026367188, -0.2261199951171875, -0.21251296997070312, -0.19890594482421875, -0.18529891967773438, -0.17169189453125, -0.15808486938476562, -0.14447784423828125, -0.13087081909179688, -0.1172637939453125, -0.10365676879882812, -0.09004974365234375, -0.07644271850585938, -0.062835693359375, -0.049228668212890625, -0.03562164306640625, -0.022014617919921875, -0.0084075927734375, 0.005199432373046875, 0.01880645751953125, 0.032413482666015625, 0.0460205078125, 0.059627532958984375, 0.07323455810546875, 0.08684158325195312, 0.1004486083984375, 0.11405563354492188, 0.12766265869140625, 0.14126968383789062, 0.154876708984375, 0.16848373413085938, 0.18209075927734375, 0.19569778442382812, 0.2093048095703125, 0.22291183471679688, 0.23651885986328125, 0.2501258850097656, 0.26373291015625, 0.2773399353027344, 0.29094696044921875, 0.3045539855957031, 0.3181610107421875, 0.3317680358886719, 0.34537506103515625, 0.3589820861816406, 0.372589111328125, 0.3861961364746094, 0.39980316162109375, 0.4134101867675781, 0.4270172119140625, 0.4406242370605469, 0.45423126220703125, 0.4678382873535156, 0.4814453125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 34.0, 39.0, 47.0, 77.0, 120.0, 216.0, 1441.0, 394313.0, 3794868.0, 2590.0, 241.0, 100.0, 80.0, 50.0, 22.0, 16.0, 13.0, 10.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.845703125, -2.740692138671875, -2.63568115234375, -2.530670166015625, -2.4256591796875, -2.320648193359375, -2.21563720703125, -2.110626220703125, -2.005615234375, -1.900604248046875, -1.79559326171875, -1.690582275390625, -1.5855712890625, -1.480560302734375, -1.37554931640625, -1.270538330078125, -1.16552734375, -1.060516357421875, -0.95550537109375, -0.850494384765625, -0.7454833984375, -0.640472412109375, -0.53546142578125, -0.430450439453125, -0.325439453125, -0.220428466796875, -0.11541748046875, -0.010406494140625, 0.0946044921875, 0.199615478515625, 0.30462646484375, 0.409637451171875, 0.5146484375, 0.619659423828125, 0.72467041015625, 0.829681396484375, 0.9346923828125, 1.039703369140625, 1.14471435546875, 1.249725341796875, 1.354736328125, 1.459747314453125, 1.56475830078125, 1.669769287109375, 1.7747802734375, 1.879791259765625, 1.98480224609375, 2.089813232421875, 2.19482421875, 2.299835205078125, 2.40484619140625, 2.509857177734375, 2.6148681640625, 2.719879150390625, 2.82489013671875, 2.929901123046875, 3.034912109375, 3.139923095703125, 3.24493408203125, 3.349945068359375, 3.4549560546875, 3.559967041015625, 3.66497802734375, 3.769989013671875, 3.875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0, 11.0, 14.0, 31.0, 100.0, 293.0, 1263.0, 1723.0, 408.0, 129.0, 70.0, 19.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.01171875, -2.9528350830078125, -2.893951416015625, -2.8350677490234375, -2.77618408203125, -2.7173004150390625, -2.658416748046875, -2.5995330810546875, -2.5406494140625, -2.4817657470703125, -2.422882080078125, -2.3639984130859375, -2.30511474609375, -2.2462310791015625, -2.187347412109375, -2.1284637451171875, -2.069580078125, -2.0106964111328125, -1.951812744140625, -1.8929290771484375, -1.83404541015625, -1.7751617431640625, -1.716278076171875, -1.6573944091796875, -1.5985107421875, -1.5396270751953125, -1.480743408203125, -1.4218597412109375, -1.36297607421875, -1.3040924072265625, -1.245208740234375, -1.1863250732421875, -1.12744140625, -1.0685577392578125, -1.009674072265625, -0.9507904052734375, -0.89190673828125, -0.8330230712890625, -0.774139404296875, -0.7152557373046875, -0.6563720703125, -0.5974884033203125, -0.538604736328125, -0.4797210693359375, -0.42083740234375, -0.3619537353515625, -0.303070068359375, -0.2441864013671875, -0.185302734375, -0.1264190673828125, -0.067535400390625, -0.0086517333984375, 0.05023193359375, 0.1091156005859375, 0.167999267578125, 0.2268829345703125, 0.2857666015625, 0.3446502685546875, 0.403533935546875, 0.4624176025390625, 0.52130126953125, 0.5801849365234375, 0.639068603515625, 0.6979522705078125, 0.7568359375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 4.0, 17.0, 36.0, 77.0, 202.0, 286.0, 218.0, 85.0, 32.0, 18.0, 10.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.529682159423828, -8.208880424499512, -7.888078212738037, -7.567276477813721, -7.246474266052246, -6.92567253112793, -6.604870796203613, -6.284068584442139, -5.963266372680664, -5.642464637756348, -5.321662425994873, -5.000860691070557, -4.680058479309082, -4.359256744384766, -4.038455009460449, -3.7176527976989746, -3.396851062774658, -3.0760490894317627, -2.755247116088867, -2.434445381164551, -2.113643169403076, -1.7928413152694702, -1.4720394611358643, -1.1512374877929688, -0.8304355144500732, -0.5096335411071777, -0.188831627368927, 0.13197028636932373, 0.45277225971221924, 0.7735742330551147, 1.0943760871887207, 1.4151780605316162, 1.7359800338745117, 2.0567820072174072, 2.3775839805603027, 2.698385715484619, 3.0191879272460938, 3.33998966217041, 3.6607916355133057, 3.981593608856201, 4.302395820617676, 4.623197555541992, 4.943999767303467, 5.264801502227783, 5.585603713989258, 5.906405448913574, 6.227207183837891, 6.548009395599365, 6.868811130523682, 7.189612865447998, 7.510415077209473, 7.831216812133789, 8.152018547058105, 8.472821235656738, 8.793622970581055, 9.114424705505371, 9.435226440429688, 9.756028175354004, 10.07682991027832, 10.397632598876953, 10.71843433380127, 11.039236068725586, 11.360037803649902, 11.680839538574219, 12.001642227172852]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 8.0, 4.0, 5.0, 8.0, 11.0, 12.0, 10.0, 16.0, 13.0, 22.0, 32.0, 31.0, 33.0, 39.0, 44.0, 48.0, 62.0, 48.0, 54.0, 61.0, 46.0, 61.0, 50.0, 46.0, 37.0, 32.0, 28.0, 25.0, 21.0, 20.0, 14.0, 17.0, 9.0, 9.0, 7.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.90915846824646, -3.790902614593506, -3.672646999359131, -3.5543911457061768, -3.4361355304718018, -3.3178796768188477, -3.1996240615844727, -3.0813682079315186, -2.9631123542785645, -2.8448565006256104, -2.7266008853912354, -2.6083450317382812, -2.4900894165039062, -2.371833562850952, -2.253577709197998, -2.135322093963623, -2.017066478729248, -1.8988107442855835, -1.780555009841919, -1.6622991561889648, -1.5440435409545898, -1.4257876873016357, -1.3075319528579712, -1.1892762184143066, -1.071020483970642, -0.9527647495269775, -0.834509015083313, -0.7162532210350037, -0.5979974865913391, -0.47974175214767456, -0.36148595809936523, -0.24323022365570068, -0.12497425079345703, -0.006718501448631287, 0.11153724789619446, 0.2297930121421814, 0.34804874658584595, 0.4663044810295105, 0.5845602750778198, 0.7028160095214844, 0.8210717439651489, 0.9393274784088135, 1.057583212852478, 1.1758389472961426, 1.2940948009490967, 1.4123504161834717, 1.5306062698364258, 1.6488620042800903, 1.7671177387237549, 1.8853734731674194, 2.003629207611084, 2.121885061264038, 2.240140676498413, 2.358396530151367, 2.476652145385742, 2.5949079990386963, 2.7131638526916504, 2.8314197063446045, 2.9496753215789795, 3.0679311752319336, 3.1861867904663086, 3.3044426441192627, 3.422698497772217, 3.540954113006592, 3.659209728240967]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 8.0, 9.0, 1.0, 8.0, 17.0, 19.0, 36.0, 45.0, 74.0, 118.0, 193.0, 329.0, 628.0, 1419.0, 3558.0, 10062.0, 36328.0, 163397.0, 526175.0, 234194.0, 50286.0, 13864.0, 4389.0, 1654.0, 726.0, 373.0, 238.0, 157.0, 74.0, 64.0, 34.0, 24.0, 15.0, 11.0, 9.0, 5.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.03515625, -1.0076370239257812, -0.9801177978515625, -0.9525985717773438, -0.925079345703125, -0.8975601196289062, -0.8700408935546875, -0.8425216674804688, -0.81500244140625, -0.7874832153320312, -0.7599639892578125, -0.7324447631835938, -0.704925537109375, -0.6774063110351562, -0.6498870849609375, -0.6223678588867188, -0.5948486328125, -0.5673294067382812, -0.5398101806640625, -0.5122909545898438, -0.484771728515625, -0.45725250244140625, -0.4297332763671875, -0.40221405029296875, -0.37469482421875, -0.34717559814453125, -0.3196563720703125, -0.29213714599609375, -0.264617919921875, -0.23709869384765625, -0.2095794677734375, -0.18206024169921875, -0.154541015625, -0.12702178955078125, -0.0995025634765625, -0.07198333740234375, -0.044464111328125, -0.01694488525390625, 0.0105743408203125, 0.03809356689453125, 0.06561279296875, 0.09313201904296875, 0.1206512451171875, 0.14817047119140625, 0.175689697265625, 0.20320892333984375, 0.2307281494140625, 0.25824737548828125, 0.2857666015625, 0.31328582763671875, 0.3408050537109375, 0.36832427978515625, 0.395843505859375, 0.42336273193359375, 0.4508819580078125, 0.47840118408203125, 0.50592041015625, 0.5334396362304688, 0.5609588623046875, 0.5884780883789062, 0.615997314453125, 0.6435165405273438, 0.6710357666015625, 0.6985549926757812, 0.72607421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 4.0, 1.0, 8.0, 7.0, 16.0, 5.0, 12.0, 19.0, 18.0, 28.0, 19.0, 30.0, 31.0, 31.0, 64.0, 58.0, 49.0, 44.0, 40.0, 53.0, 55.0, 42.0, 63.0, 44.0, 41.0, 37.0, 38.0, 31.0, 29.0, 24.0, 8.0, 19.0, 9.0, 11.0, 5.0, 2.0, 5.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.317138671875, -0.30498504638671875, -0.2928314208984375, -0.28067779541015625, -0.268524169921875, -0.25637054443359375, -0.2442169189453125, -0.23206329345703125, -0.21990966796875, -0.20775604248046875, -0.1956024169921875, -0.18344879150390625, -0.171295166015625, -0.15914154052734375, -0.1469879150390625, -0.13483428955078125, -0.1226806640625, -0.11052703857421875, -0.0983734130859375, -0.08621978759765625, -0.074066162109375, -0.06191253662109375, -0.0497589111328125, -0.03760528564453125, -0.02545166015625, -0.01329803466796875, -0.0011444091796875, 0.01100921630859375, 0.023162841796875, 0.03531646728515625, 0.0474700927734375, 0.05962371826171875, 0.07177734375, 0.08393096923828125, 0.0960845947265625, 0.10823822021484375, 0.120391845703125, 0.13254547119140625, 0.1446990966796875, 0.15685272216796875, 0.16900634765625, 0.18115997314453125, 0.1933135986328125, 0.20546722412109375, 0.217620849609375, 0.22977447509765625, 0.2419281005859375, 0.25408172607421875, 0.2662353515625, 0.27838897705078125, 0.2905426025390625, 0.30269622802734375, 0.314849853515625, 0.32700347900390625, 0.3391571044921875, 0.35131072998046875, 0.36346435546875, 0.37561798095703125, 0.3877716064453125, 0.39992523193359375, 0.412078857421875, 0.42423248291015625, 0.4363861083984375, 0.44853973388671875, 0.460693359375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 3.0, 5.0, 11.0, 15.0, 19.0, 27.0, 44.0, 68.0, 101.0, 228.0, 449.0, 1130.0, 3972.0, 26355.0, 618393.0, 369456.0, 22588.0, 3650.0, 1083.0, 459.0, 205.0, 117.0, 50.0, 40.0, 20.0, 16.0, 12.0, 9.0, 7.0, 2.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.666015625, -1.612213134765625, -1.55841064453125, -1.504608154296875, -1.4508056640625, -1.397003173828125, -1.34320068359375, -1.289398193359375, -1.235595703125, -1.181793212890625, -1.12799072265625, -1.074188232421875, -1.0203857421875, -0.966583251953125, -0.91278076171875, -0.858978271484375, -0.80517578125, -0.751373291015625, -0.69757080078125, -0.643768310546875, -0.5899658203125, -0.536163330078125, -0.48236083984375, -0.428558349609375, -0.374755859375, -0.320953369140625, -0.26715087890625, -0.213348388671875, -0.1595458984375, -0.105743408203125, -0.05194091796875, 0.001861572265625, 0.0556640625, 0.109466552734375, 0.16326904296875, 0.217071533203125, 0.2708740234375, 0.324676513671875, 0.37847900390625, 0.432281494140625, 0.486083984375, 0.539886474609375, 0.59368896484375, 0.647491455078125, 0.7012939453125, 0.755096435546875, 0.80889892578125, 0.862701416015625, 0.91650390625, 0.970306396484375, 1.02410888671875, 1.077911376953125, 1.1317138671875, 1.185516357421875, 1.23931884765625, 1.293121337890625, 1.346923828125, 1.400726318359375, 1.45452880859375, 1.508331298828125, 1.5621337890625, 1.615936279296875, 1.66973876953125, 1.723541259765625, 1.77734375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 10.0, 7.0, 11.0, 11.0, 19.0, 10.0, 18.0, 26.0, 25.0, 34.0, 41.0, 41.0, 50.0, 43.0, 59.0, 55.0, 63.0, 63.0, 57.0, 39.0, 53.0, 40.0, 30.0, 40.0, 23.0, 30.0, 19.0, 19.0, 12.0, 9.0, 12.0, 6.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7099609375, -1.6599578857421875, -1.609954833984375, -1.5599517822265625, -1.50994873046875, -1.4599456787109375, -1.409942626953125, -1.3599395751953125, -1.3099365234375, -1.2599334716796875, -1.209930419921875, -1.1599273681640625, -1.10992431640625, -1.0599212646484375, -1.009918212890625, -0.9599151611328125, -0.909912109375, -0.8599090576171875, -0.809906005859375, -0.7599029541015625, -0.70989990234375, -0.6598968505859375, -0.609893798828125, -0.5598907470703125, -0.5098876953125, -0.4598846435546875, -0.409881591796875, -0.3598785400390625, -0.30987548828125, -0.2598724365234375, -0.209869384765625, -0.1598663330078125, -0.10986328125, -0.0598602294921875, -0.009857177734375, 0.0401458740234375, 0.09014892578125, 0.1401519775390625, 0.190155029296875, 0.2401580810546875, 0.2901611328125, 0.3401641845703125, 0.390167236328125, 0.4401702880859375, 0.49017333984375, 0.5401763916015625, 0.590179443359375, 0.6401824951171875, 0.690185546875, 0.7401885986328125, 0.790191650390625, 0.8401947021484375, 0.89019775390625, 0.9402008056640625, 0.990203857421875, 1.0402069091796875, 1.0902099609375, 1.1402130126953125, 1.190216064453125, 1.2402191162109375, 1.29022216796875, 1.3402252197265625, 1.390228271484375, 1.4402313232421875, 1.490234375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 8.0, 8.0, 9.0, 11.0, 11.0, 14.0, 25.0, 25.0, 59.0, 68.0, 111.0, 151.0, 238.0, 432.0, 829.0, 1736.0, 3897.0, 10238.0, 33654.0, 167629.0, 708562.0, 86643.0, 21340.0, 7060.0, 2789.0, 1349.0, 667.0, 346.0, 223.0, 136.0, 95.0, 47.0, 41.0, 30.0, 12.0, 17.0, 14.0, 6.0, 4.0, 3.0, 5.0, 2.0, 1.0, 7.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.297607421875, -0.2877922058105469, -0.27797698974609375, -0.2681617736816406, -0.2583465576171875, -0.24853134155273438, -0.23871612548828125, -0.22890090942382812, -0.219085693359375, -0.20927047729492188, -0.19945526123046875, -0.18964004516601562, -0.1798248291015625, -0.17000961303710938, -0.16019439697265625, -0.15037918090820312, -0.14056396484375, -0.13074874877929688, -0.12093353271484375, -0.11111831665039062, -0.1013031005859375, -0.09148788452148438, -0.08167266845703125, -0.07185745239257812, -0.062042236328125, -0.052227020263671875, -0.04241180419921875, -0.032596588134765625, -0.0227813720703125, -0.012966156005859375, -0.00315093994140625, 0.006664276123046875, 0.0164794921875, 0.026294708251953125, 0.03610992431640625, 0.045925140380859375, 0.0557403564453125, 0.06555557250976562, 0.07537078857421875, 0.08518600463867188, 0.095001220703125, 0.10481643676757812, 0.11463165283203125, 0.12444686889648438, 0.1342620849609375, 0.14407730102539062, 0.15389251708984375, 0.16370773315429688, 0.17352294921875, 0.18333816528320312, 0.19315338134765625, 0.20296859741210938, 0.2127838134765625, 0.22259902954101562, 0.23241424560546875, 0.24222946166992188, 0.252044677734375, 0.2618598937988281, 0.27167510986328125, 0.2814903259277344, 0.2913055419921875, 0.3011207580566406, 0.31093597412109375, 0.3207511901855469, 0.33056640625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 12.0, 10.0, 14.0, 14.0, 11.0, 26.0, 34.0, 33.0, 61.0, 74.0, 108.0, 156.0, 126.0, 90.0, 65.0, 39.0, 22.0, 23.0, 19.0, 9.0, 12.0, 10.0, 5.0, 2.0, 7.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.548664093017578e-05, -9.265542030334473e-05, -8.982419967651367e-05, -8.699297904968262e-05, -8.416175842285156e-05, -8.133053779602051e-05, -7.849931716918945e-05, -7.56680965423584e-05, -7.283687591552734e-05, -7.000565528869629e-05, -6.717443466186523e-05, -6.434321403503418e-05, -6.151199340820312e-05, -5.868077278137207e-05, -5.5849552154541016e-05, -5.301833152770996e-05, -5.0187110900878906e-05, -4.735589027404785e-05, -4.45246696472168e-05, -4.169344902038574e-05, -3.886222839355469e-05, -3.603100776672363e-05, -3.319978713989258e-05, -3.0368566513061523e-05, -2.753734588623047e-05, -2.4706125259399414e-05, -2.187490463256836e-05, -1.9043684005737305e-05, -1.621246337890625e-05, -1.3381242752075195e-05, -1.055002212524414e-05, -7.718801498413086e-06, -4.887580871582031e-06, -2.0563602447509766e-06, 7.748603820800781e-07, 3.606081008911133e-06, 6.4373016357421875e-06, 9.268522262573242e-06, 1.2099742889404297e-05, 1.4930963516235352e-05, 1.7762184143066406e-05, 2.059340476989746e-05, 2.3424625396728516e-05, 2.625584602355957e-05, 2.9087066650390625e-05, 3.191828727722168e-05, 3.4749507904052734e-05, 3.758072853088379e-05, 4.0411949157714844e-05, 4.32431697845459e-05, 4.607439041137695e-05, 4.890561103820801e-05, 5.173683166503906e-05, 5.456805229187012e-05, 5.739927291870117e-05, 6.0230493545532227e-05, 6.306171417236328e-05, 6.589293479919434e-05, 6.872415542602539e-05, 7.155537605285645e-05, 7.43865966796875e-05, 7.721781730651855e-05, 8.004903793334961e-05, 8.288025856018066e-05, 8.571147918701172e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 5.0, 3.0, 2.0, 8.0, 4.0, 10.0, 8.0, 20.0, 23.0, 33.0, 69.0, 89.0, 131.0, 194.0, 361.0, 767.0, 1589.0, 3750.0, 12035.0, 50514.0, 579118.0, 337556.0, 44416.0, 11128.0, 3600.0, 1499.0, 702.0, 351.0, 212.0, 120.0, 86.0, 45.0, 33.0, 20.0, 22.0, 11.0, 9.0, 3.0, 4.0, 0.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.304443359375, -0.29315185546875, -0.2818603515625, -0.27056884765625, -0.25927734375, -0.24798583984375, -0.2366943359375, -0.22540283203125, -0.214111328125, -0.20281982421875, -0.1915283203125, -0.18023681640625, -0.1689453125, -0.15765380859375, -0.1463623046875, -0.13507080078125, -0.123779296875, -0.11248779296875, -0.1011962890625, -0.08990478515625, -0.07861328125, -0.06732177734375, -0.0560302734375, -0.04473876953125, -0.033447265625, -0.02215576171875, -0.0108642578125, 0.00042724609375, 0.01171875, 0.02301025390625, 0.0343017578125, 0.04559326171875, 0.056884765625, 0.06817626953125, 0.0794677734375, 0.09075927734375, 0.10205078125, 0.11334228515625, 0.1246337890625, 0.13592529296875, 0.147216796875, 0.15850830078125, 0.1697998046875, 0.18109130859375, 0.1923828125, 0.20367431640625, 0.2149658203125, 0.22625732421875, 0.237548828125, 0.24884033203125, 0.2601318359375, 0.27142333984375, 0.28271484375, 0.29400634765625, 0.3052978515625, 0.31658935546875, 0.327880859375, 0.33917236328125, 0.3504638671875, 0.36175537109375, 0.373046875, 0.38433837890625, 0.3956298828125, 0.40692138671875, 0.418212890625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 5.0, 7.0, 10.0, 8.0, 5.0, 12.0, 19.0, 24.0, 26.0, 39.0, 53.0, 72.0, 88.0, 113.0, 109.0, 107.0, 82.0, 68.0, 38.0, 21.0, 19.0, 15.0, 17.0, 9.0, 8.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.464599609375, -0.4529609680175781, -0.44132232666015625, -0.4296836853027344, -0.4180450439453125, -0.4064064025878906, -0.39476776123046875, -0.3831291198730469, -0.371490478515625, -0.3598518371582031, -0.34821319580078125, -0.3365745544433594, -0.3249359130859375, -0.3132972717285156, -0.30165863037109375, -0.2900199890136719, -0.27838134765625, -0.2667427062988281, -0.25510406494140625, -0.24346542358398438, -0.2318267822265625, -0.22018814086914062, -0.20854949951171875, -0.19691085815429688, -0.185272216796875, -0.17363357543945312, -0.16199493408203125, -0.15035629272460938, -0.1387176513671875, -0.12707901000976562, -0.11544036865234375, -0.10380172729492188, -0.0921630859375, -0.08052444458007812, -0.06888580322265625, -0.057247161865234375, -0.0456085205078125, -0.033969879150390625, -0.02233123779296875, -0.010692596435546875, 0.000946044921875, 0.012584686279296875, 0.02422332763671875, 0.035861968994140625, 0.0475006103515625, 0.059139251708984375, 0.07077789306640625, 0.08241653442382812, 0.09405517578125, 0.10569381713867188, 0.11733245849609375, 0.12897109985351562, 0.1406097412109375, 0.15224838256835938, 0.16388702392578125, 0.17552566528320312, 0.187164306640625, 0.19880294799804688, 0.21044158935546875, 0.22208023071289062, 0.2337188720703125, 0.24535751342773438, 0.25699615478515625, 0.2686347961425781, 0.2802734375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 13.0, 10.0, 21.0, 27.0, 68.0, 112.0, 222.0, 266.0, 129.0, 68.0, 27.0, 16.0, 9.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.044835090637207, -8.753379821777344, -8.46192455291748, -8.1704683303833, -7.8790130615234375, -7.587557792663574, -7.296102523803711, -7.004647254943848, -6.713191509246826, -6.421736240386963, -6.130280494689941, -5.838825225830078, -5.547369956970215, -5.255914211273193, -4.96445894241333, -4.673003196716309, -4.381547927856445, -4.090092658996582, -3.7986369132995605, -3.5071816444396973, -3.215726137161255, -2.9242706298828125, -2.632815361022949, -2.341359853744507, -2.0499043464660645, -1.758448839187622, -1.4669934511184692, -1.1755380630493164, -0.884082555770874, -0.5926270484924316, -0.3011716604232788, -0.009716272354125977, 0.28173828125, 0.5731937289237976, 0.8646491765975952, 1.156104564666748, 1.4475600719451904, 1.7390155792236328, 2.030470848083496, 2.3219263553619385, 2.613381862640381, 2.9048373699188232, 3.1962928771972656, 3.487748146057129, 3.7792036533355713, 4.070659160614014, 4.362114429473877, 4.653570175170898, 4.945025444030762, 5.236480712890625, 5.5279364585876465, 5.81939172744751, 6.110847473144531, 6.4023027420043945, 6.693758010864258, 6.985213279724121, 7.276669025421143, 7.568124294281006, 7.859580039978027, 8.15103530883789, 8.442490577697754, 8.733945846557617, 9.025402069091797, 9.31685733795166, 9.608312606811523]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 3.0, 3.0, 11.0, 8.0, 12.0, 17.0, 16.0, 20.0, 18.0, 27.0, 29.0, 27.0, 31.0, 33.0, 49.0, 67.0, 76.0, 72.0, 74.0, 68.0, 53.0, 35.0, 20.0, 24.0, 32.0, 15.0, 22.0, 19.0, 22.0, 11.0, 11.0, 13.0, 9.0, 10.0, 8.0, 3.0, 7.0, 4.0, 5.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.7383294105529785, -6.555067539215088, -6.3718061447143555, -6.188544273376465, -6.005282402038574, -5.822020530700684, -5.638759136199951, -5.4554972648620605, -5.272235870361328, -5.0889739990234375, -4.905712604522705, -4.7224507331848145, -4.539188861846924, -4.355927467346191, -4.172665596008301, -3.98940372467041, -3.8061418533325195, -3.622880220413208, -3.4396183490753174, -3.256356716156006, -3.0730948448181152, -2.8898332118988037, -2.706571578979492, -2.5233097076416016, -2.34004807472229, -2.1567864418029785, -1.973524570465088, -1.7902629375457764, -1.6070011854171753, -1.4237394332885742, -1.2404778003692627, -1.0572160482406616, -0.8739538192749023, -0.6906920671463013, -0.507430374622345, -0.32416868209838867, -0.1409069299697876, 0.04235482215881348, 0.225616455078125, 0.4088782072067261, 0.5921399593353271, 0.7754017114639282, 0.9586634039878845, 1.1419250965118408, 1.325186848640442, 1.508448600769043, 1.6917102336883545, 1.8749719858169556, 2.0582337379455566, 2.241495370864868, 2.424757242202759, 2.6080188751220703, 2.791280746459961, 2.9745423793792725, 3.157804012298584, 3.3410658836364746, 3.524327516555786, 3.7075891494750977, 3.8908510208129883, 4.074112892150879, 4.257374286651611, 4.440636157989502, 4.623897552490234, 4.807159423828125, 4.990421295166016]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 8.0, 15.0, 22.0, 32.0, 48.0, 101.0, 257.0, 714.0, 2600.0, 16300.0, 639654.0, 3481664.0, 46445.0, 4606.0, 1020.0, 391.0, 146.0, 86.0, 45.0, 41.0, 30.0, 12.0, 8.0, 7.0, 9.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.240234375, -1.19775390625, -1.1552734375, -1.11279296875, -1.0703125, -1.02783203125, -0.9853515625, -0.94287109375, -0.900390625, -0.85791015625, -0.8154296875, -0.77294921875, -0.73046875, -0.68798828125, -0.6455078125, -0.60302734375, -0.560546875, -0.51806640625, -0.4755859375, -0.43310546875, -0.390625, -0.34814453125, -0.3056640625, -0.26318359375, -0.220703125, -0.17822265625, -0.1357421875, -0.09326171875, -0.05078125, -0.00830078125, 0.0341796875, 0.07666015625, 0.119140625, 0.16162109375, 0.2041015625, 0.24658203125, 0.2890625, 0.33154296875, 0.3740234375, 0.41650390625, 0.458984375, 0.50146484375, 0.5439453125, 0.58642578125, 0.62890625, 0.67138671875, 0.7138671875, 0.75634765625, 0.798828125, 0.84130859375, 0.8837890625, 0.92626953125, 0.96875, 1.01123046875, 1.0537109375, 1.09619140625, 1.138671875, 1.18115234375, 1.2236328125, 1.26611328125, 1.30859375, 1.35107421875, 1.3935546875, 1.43603515625, 1.478515625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 13.0, 8.0, 17.0, 25.0, 19.0, 22.0, 27.0, 29.0, 32.0, 48.0, 56.0, 44.0, 62.0, 51.0, 47.0, 41.0, 55.0, 52.0, 52.0, 49.0, 35.0, 38.0, 43.0, 28.0, 21.0, 10.0, 12.0, 16.0, 15.0, 3.0, 7.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.343017578125, -0.33060455322265625, -0.3181915283203125, -0.30577850341796875, -0.293365478515625, -0.28095245361328125, -0.2685394287109375, -0.25612640380859375, -0.24371337890625, -0.23130035400390625, -0.2188873291015625, -0.20647430419921875, -0.194061279296875, -0.18164825439453125, -0.1692352294921875, -0.15682220458984375, -0.1444091796875, -0.13199615478515625, -0.1195831298828125, -0.10717010498046875, -0.094757080078125, -0.08234405517578125, -0.0699310302734375, -0.05751800537109375, -0.04510498046875, -0.03269195556640625, -0.0202789306640625, -0.00786590576171875, 0.004547119140625, 0.01696014404296875, 0.0293731689453125, 0.04178619384765625, 0.05419921875, 0.06661224365234375, 0.0790252685546875, 0.09143829345703125, 0.103851318359375, 0.11626434326171875, 0.1286773681640625, 0.14109039306640625, 0.15350341796875, 0.16591644287109375, 0.1783294677734375, 0.19074249267578125, 0.203155517578125, 0.21556854248046875, 0.2279815673828125, 0.24039459228515625, 0.2528076171875, 0.26522064208984375, 0.2776336669921875, 0.29004669189453125, 0.302459716796875, 0.31487274169921875, 0.3272857666015625, 0.33969879150390625, 0.35211181640625, 0.36452484130859375, 0.3769378662109375, 0.38935089111328125, 0.401763916015625, 0.41417694091796875, 0.4265899658203125, 0.43900299072265625, 0.451416015625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 6.0, 22.0, 38.0, 58.0, 80.0, 124.0, 267.0, 4189.0, 4160283.0, 28274.0, 601.0, 137.0, 87.0, 59.0, 25.0, 18.0, 8.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.23046875, -6.06939697265625, -5.9083251953125, -5.74725341796875, -5.586181640625, -5.42510986328125, -5.2640380859375, -5.10296630859375, -4.94189453125, -4.78082275390625, -4.6197509765625, -4.45867919921875, -4.297607421875, -4.13653564453125, -3.9754638671875, -3.81439208984375, -3.6533203125, -3.49224853515625, -3.3311767578125, -3.17010498046875, -3.009033203125, -2.84796142578125, -2.6868896484375, -2.52581787109375, -2.36474609375, -2.20367431640625, -2.0426025390625, -1.88153076171875, -1.720458984375, -1.55938720703125, -1.3983154296875, -1.23724365234375, -1.076171875, -0.91510009765625, -0.7540283203125, -0.59295654296875, -0.431884765625, -0.27081298828125, -0.1097412109375, 0.05133056640625, 0.21240234375, 0.37347412109375, 0.5345458984375, 0.69561767578125, 0.856689453125, 1.01776123046875, 1.1788330078125, 1.33990478515625, 1.5009765625, 1.66204833984375, 1.8231201171875, 1.98419189453125, 2.145263671875, 2.30633544921875, 2.4674072265625, 2.62847900390625, 2.78955078125, 2.95062255859375, 3.1116943359375, 3.27276611328125, 3.433837890625, 3.59490966796875, 3.7559814453125, 3.91705322265625, 4.078125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 8.0, 20.0, 55.0, 186.0, 901.0, 2146.0, 548.0, 131.0, 40.0, 24.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.40625, -4.322021484375, -4.23779296875, -4.153564453125, -4.0693359375, -3.985107421875, -3.90087890625, -3.816650390625, -3.732421875, -3.648193359375, -3.56396484375, -3.479736328125, -3.3955078125, -3.311279296875, -3.22705078125, -3.142822265625, -3.05859375, -2.974365234375, -2.89013671875, -2.805908203125, -2.7216796875, -2.637451171875, -2.55322265625, -2.468994140625, -2.384765625, -2.300537109375, -2.21630859375, -2.132080078125, -2.0478515625, -1.963623046875, -1.87939453125, -1.795166015625, -1.7109375, -1.626708984375, -1.54248046875, -1.458251953125, -1.3740234375, -1.289794921875, -1.20556640625, -1.121337890625, -1.037109375, -0.952880859375, -0.86865234375, -0.784423828125, -0.7001953125, -0.615966796875, -0.53173828125, -0.447509765625, -0.36328125, -0.279052734375, -0.19482421875, -0.110595703125, -0.0263671875, 0.057861328125, 0.14208984375, 0.226318359375, 0.310546875, 0.394775390625, 0.47900390625, 0.563232421875, 0.6474609375, 0.731689453125, 0.81591796875, 0.900146484375, 0.984375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 5.0, 15.0, 14.0, 63.0, 168.0, 322.0, 261.0, 87.0, 41.0, 17.0, 5.0, 9.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0472211837768555, -4.522011756896973, -3.99680233001709, -3.471592903137207, -2.946383476257324, -2.4211740493774414, -1.8959646224975586, -1.3707551956176758, -0.845545768737793, -0.32033634185791016, 0.20487308502197266, 0.7300825119018555, 1.2552919387817383, 1.780501365661621, 2.305710792541504, 2.8309202194213867, 3.3561296463012695, 3.8813390731811523, 4.406548500061035, 4.931757926940918, 5.456967353820801, 5.982176780700684, 6.507386207580566, 7.032595634460449, 7.557805061340332, 8.083014488220215, 8.608223915100098, 9.13343334197998, 9.658642768859863, 10.183852195739746, 10.709061622619629, 11.234271049499512, 11.759479522705078, 12.284688949584961, 12.809898376464844, 13.335107803344727, 13.86031723022461, 14.385526657104492, 14.910736083984375, 15.435945510864258, 15.96115493774414, 16.486364364624023, 17.011573791503906, 17.53678321838379, 18.061992645263672, 18.587202072143555, 19.112411499023438, 19.63762092590332, 20.162830352783203, 20.688039779663086, 21.21324920654297, 21.73845863342285, 22.263668060302734, 22.788877487182617, 23.3140869140625, 23.839296340942383, 24.364505767822266, 24.88971519470215, 25.41492462158203, 25.940134048461914, 26.465343475341797, 26.99055290222168, 27.515762329101562, 28.040971755981445, 28.566181182861328]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 6.0, 11.0, 11.0, 19.0, 19.0, 16.0, 27.0, 31.0, 32.0, 35.0, 39.0, 40.0, 63.0, 50.0, 48.0, 54.0, 50.0, 44.0, 60.0, 53.0, 48.0, 39.0, 29.0, 36.0, 27.0, 24.0, 26.0, 16.0, 8.0, 11.0, 9.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1863203048706055, -5.015599727630615, -4.844879150390625, -4.674158573150635, -4.5034379959106445, -4.332717418670654, -4.161996841430664, -3.991276502609253, -3.8205559253692627, -3.6498353481292725, -3.4791147708892822, -3.308394432067871, -3.137673854827881, -2.9669532775878906, -2.7962327003479004, -2.62551212310791, -2.45479154586792, -2.2840709686279297, -2.1133503913879395, -1.9426299333572388, -1.7719093561172485, -1.6011887788772583, -1.4304683208465576, -1.2597477436065674, -1.0890271663665771, -0.9183065891265869, -0.7475860714912415, -0.576865553855896, -0.40614497661590576, -0.23542439937591553, -0.06470394134521484, 0.10601663589477539, 0.2767372131347656, 0.44745776057243347, 0.6181783080101013, 0.7888988256454468, 0.959619402885437, 1.1303399801254272, 1.301060438156128, 1.4717810153961182, 1.6425015926361084, 1.8132221698760986, 1.9839427471160889, 2.1546630859375, 2.3253836631774902, 2.4961042404174805, 2.6668248176574707, 2.837545394897461, 3.008265972137451, 3.1789865493774414, 3.3497071266174316, 3.520427703857422, 3.691148281097412, 3.8618688583374023, 4.032588958740234, 4.203310012817383, 4.374030113220215, 4.544750690460205, 4.715471267700195, 4.8861918449401855, 5.056912422180176, 5.227632999420166, 5.398353576660156, 5.569073677062988, 5.739794731140137]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 6.0, 5.0, 2.0, 7.0, 17.0, 16.0, 28.0, 51.0, 66.0, 82.0, 135.0, 230.0, 341.0, 578.0, 1038.0, 1883.0, 3425.0, 7360.0, 17229.0, 46453.0, 146403.0, 426777.0, 268070.0, 79212.0, 27340.0, 10957.0, 5062.0, 2454.0, 1366.0, 704.0, 455.0, 285.0, 169.0, 110.0, 74.0, 60.0, 37.0, 19.0, 21.0, 10.0, 8.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.8984375, -0.8739852905273438, -0.8495330810546875, -0.8250808715820312, -0.800628662109375, -0.7761764526367188, -0.7517242431640625, -0.7272720336914062, -0.70281982421875, -0.6783676147460938, -0.6539154052734375, -0.6294631958007812, -0.605010986328125, -0.5805587768554688, -0.5561065673828125, -0.5316543579101562, -0.5072021484375, -0.48274993896484375, -0.4582977294921875, -0.43384552001953125, -0.409393310546875, -0.38494110107421875, -0.3604888916015625, -0.33603668212890625, -0.31158447265625, -0.28713226318359375, -0.2626800537109375, -0.23822784423828125, -0.213775634765625, -0.18932342529296875, -0.1648712158203125, -0.14041900634765625, -0.115966796875, -0.09151458740234375, -0.0670623779296875, -0.04261016845703125, -0.018157958984375, 0.00629425048828125, 0.0307464599609375, 0.05519866943359375, 0.07965087890625, 0.10410308837890625, 0.1285552978515625, 0.15300750732421875, 0.177459716796875, 0.20191192626953125, 0.2263641357421875, 0.25081634521484375, 0.2752685546875, 0.29972076416015625, 0.3241729736328125, 0.34862518310546875, 0.373077392578125, 0.39752960205078125, 0.4219818115234375, 0.44643402099609375, 0.47088623046875, 0.49533843994140625, 0.5197906494140625, 0.5442428588867188, 0.568695068359375, 0.5931472778320312, 0.6175994873046875, 0.6420516967773438, 0.66650390625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 7.0, 2.0, 5.0, 7.0, 15.0, 12.0, 12.0, 20.0, 20.0, 25.0, 24.0, 40.0, 41.0, 55.0, 51.0, 48.0, 52.0, 47.0, 47.0, 55.0, 49.0, 51.0, 52.0, 46.0, 41.0, 24.0, 32.0, 30.0, 16.0, 20.0, 10.0, 18.0, 10.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.371826171875, -0.3586578369140625, -0.345489501953125, -0.3323211669921875, -0.31915283203125, -0.3059844970703125, -0.292816162109375, -0.2796478271484375, -0.2664794921875, -0.2533111572265625, -0.240142822265625, -0.2269744873046875, -0.21380615234375, -0.2006378173828125, -0.187469482421875, -0.1743011474609375, -0.1611328125, -0.1479644775390625, -0.134796142578125, -0.1216278076171875, -0.10845947265625, -0.0952911376953125, -0.082122802734375, -0.0689544677734375, -0.0557861328125, -0.0426177978515625, -0.029449462890625, -0.0162811279296875, -0.00311279296875, 0.0100555419921875, 0.023223876953125, 0.0363922119140625, 0.049560546875, 0.0627288818359375, 0.075897216796875, 0.0890655517578125, 0.10223388671875, 0.1154022216796875, 0.128570556640625, 0.1417388916015625, 0.1549072265625, 0.1680755615234375, 0.181243896484375, 0.1944122314453125, 0.20758056640625, 0.2207489013671875, 0.233917236328125, 0.2470855712890625, 0.26025390625, 0.2734222412109375, 0.286590576171875, 0.2997589111328125, 0.31292724609375, 0.3260955810546875, 0.339263916015625, 0.3524322509765625, 0.3656005859375, 0.3787689208984375, 0.391937255859375, 0.4051055908203125, 0.41827392578125, 0.4314422607421875, 0.444610595703125, 0.4577789306640625, 0.470947265625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 7.0, 11.0, 13.0, 12.0, 23.0, 43.0, 51.0, 77.0, 132.0, 246.0, 451.0, 756.0, 1685.0, 4669.0, 20962.0, 178005.0, 770202.0, 56233.0, 9681.0, 2780.0, 1114.0, 556.0, 292.0, 198.0, 118.0, 79.0, 41.0, 34.0, 25.0, 16.0, 11.0, 11.0, 1.0, 5.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2822265625, -1.236846923828125, -1.19146728515625, -1.146087646484375, -1.1007080078125, -1.055328369140625, -1.00994873046875, -0.964569091796875, -0.919189453125, -0.873809814453125, -0.82843017578125, -0.783050537109375, -0.7376708984375, -0.692291259765625, -0.64691162109375, -0.601531982421875, -0.55615234375, -0.510772705078125, -0.46539306640625, -0.420013427734375, -0.3746337890625, -0.329254150390625, -0.28387451171875, -0.238494873046875, -0.193115234375, -0.147735595703125, -0.10235595703125, -0.056976318359375, -0.0115966796875, 0.033782958984375, 0.07916259765625, 0.124542236328125, 0.169921875, 0.215301513671875, 0.26068115234375, 0.306060791015625, 0.3514404296875, 0.396820068359375, 0.44219970703125, 0.487579345703125, 0.532958984375, 0.578338623046875, 0.62371826171875, 0.669097900390625, 0.7144775390625, 0.759857177734375, 0.80523681640625, 0.850616455078125, 0.89599609375, 0.941375732421875, 0.98675537109375, 1.032135009765625, 1.0775146484375, 1.122894287109375, 1.16827392578125, 1.213653564453125, 1.259033203125, 1.304412841796875, 1.34979248046875, 1.395172119140625, 1.4405517578125, 1.485931396484375, 1.53131103515625, 1.576690673828125, 1.6220703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 8.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 14.0, 17.0, 11.0, 23.0, 14.0, 15.0, 18.0, 22.0, 31.0, 38.0, 39.0, 32.0, 37.0, 34.0, 45.0, 49.0, 58.0, 44.0, 36.0, 48.0, 41.0, 41.0, 37.0, 30.0, 29.0, 23.0, 9.0, 26.0, 21.0, 16.0, 13.0, 20.0, 11.0, 6.0, 5.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-1.142578125, -1.1016693115234375, -1.060760498046875, -1.0198516845703125, -0.97894287109375, -0.9380340576171875, -0.897125244140625, -0.8562164306640625, -0.8153076171875, -0.7743988037109375, -0.733489990234375, -0.6925811767578125, -0.65167236328125, -0.6107635498046875, -0.569854736328125, -0.5289459228515625, -0.488037109375, -0.4471282958984375, -0.406219482421875, -0.3653106689453125, -0.32440185546875, -0.2834930419921875, -0.242584228515625, -0.2016754150390625, -0.1607666015625, -0.1198577880859375, -0.078948974609375, -0.0380401611328125, 0.00286865234375, 0.0437774658203125, 0.084686279296875, 0.1255950927734375, 0.16650390625, 0.2074127197265625, 0.248321533203125, 0.2892303466796875, 0.33013916015625, 0.3710479736328125, 0.411956787109375, 0.4528656005859375, 0.4937744140625, 0.5346832275390625, 0.575592041015625, 0.6165008544921875, 0.65740966796875, 0.6983184814453125, 0.739227294921875, 0.7801361083984375, 0.821044921875, 0.8619537353515625, 0.902862548828125, 0.9437713623046875, 0.98468017578125, 1.0255889892578125, 1.066497802734375, 1.1074066162109375, 1.1483154296875, 1.1892242431640625, 1.230133056640625, 1.2710418701171875, 1.31195068359375, 1.3528594970703125, 1.393768310546875, 1.4346771240234375, 1.4755859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 6.0, 13.0, 8.0, 16.0, 25.0, 38.0, 46.0, 91.0, 173.0, 397.0, 1073.0, 4610.0, 31167.0, 887756.0, 110097.0, 9812.0, 2107.0, 595.0, 236.0, 98.0, 67.0, 32.0, 23.0, 22.0, 7.0, 6.0, 8.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.666015625, -0.64501953125, -0.6240234375, -0.60302734375, -0.58203125, -0.56103515625, -0.5400390625, -0.51904296875, -0.498046875, -0.47705078125, -0.4560546875, -0.43505859375, -0.4140625, -0.39306640625, -0.3720703125, -0.35107421875, -0.330078125, -0.30908203125, -0.2880859375, -0.26708984375, -0.24609375, -0.22509765625, -0.2041015625, -0.18310546875, -0.162109375, -0.14111328125, -0.1201171875, -0.09912109375, -0.078125, -0.05712890625, -0.0361328125, -0.01513671875, 0.005859375, 0.02685546875, 0.0478515625, 0.06884765625, 0.08984375, 0.11083984375, 0.1318359375, 0.15283203125, 0.173828125, 0.19482421875, 0.2158203125, 0.23681640625, 0.2578125, 0.27880859375, 0.2998046875, 0.32080078125, 0.341796875, 0.36279296875, 0.3837890625, 0.40478515625, 0.42578125, 0.44677734375, 0.4677734375, 0.48876953125, 0.509765625, 0.53076171875, 0.5517578125, 0.57275390625, 0.59375, 0.61474609375, 0.6357421875, 0.65673828125, 0.677734375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 6.0, 5.0, 16.0, 16.0, 11.0, 37.0, 53.0, 77.0, 180.0, 261.0, 157.0, 72.0, 27.0, 15.0, 16.0, 14.0, 9.0, 5.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00021958351135253906, -0.0002137012779712677, -0.00020781904458999634, -0.00020193681120872498, -0.0001960545778274536, -0.00019017234444618225, -0.0001842901110649109, -0.00017840787768363953, -0.00017252564430236816, -0.0001666434109210968, -0.00016076117753982544, -0.00015487894415855408, -0.00014899671077728271, -0.00014311447739601135, -0.00013723224401474, -0.00013135001063346863, -0.00012546777725219727, -0.0001195855438709259, -0.00011370331048965454, -0.00010782107710838318, -0.00010193884372711182, -9.605661034584045e-05, -9.017437696456909e-05, -8.429214358329773e-05, -7.840991020202637e-05, -7.2527676820755e-05, -6.664544343948364e-05, -6.076321005821228e-05, -5.488097667694092e-05, -4.8998743295669556e-05, -4.311650991439819e-05, -3.723427653312683e-05, -3.135204315185547e-05, -2.5469809770584106e-05, -1.9587576389312744e-05, -1.3705343008041382e-05, -7.82310962677002e-06, -1.9408762454986572e-06, 3.941357135772705e-06, 9.823590517044067e-06, 1.570582389831543e-05, 2.1588057279586792e-05, 2.7470290660858154e-05, 3.3352524042129517e-05, 3.923475742340088e-05, 4.511699080467224e-05, 5.0999224185943604e-05, 5.6881457567214966e-05, 6.276369094848633e-05, 6.864592432975769e-05, 7.452815771102905e-05, 8.041039109230042e-05, 8.629262447357178e-05, 9.217485785484314e-05, 9.80570912361145e-05, 0.00010393932461738586, 0.00010982155799865723, 0.00011570379137992859, 0.00012158602476119995, 0.0001274682581424713, 0.00013335049152374268, 0.00013923272490501404, 0.0001451149582862854, 0.00015099719166755676, 0.00015687942504882812]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 0.0, 9.0, 5.0, 7.0, 16.0, 23.0, 25.0, 51.0, 72.0, 115.0, 248.0, 473.0, 993.0, 2643.0, 8416.0, 36158.0, 664892.0, 293493.0, 29753.0, 7087.0, 2227.0, 882.0, 418.0, 221.0, 136.0, 69.0, 41.0, 33.0, 16.0, 13.0, 7.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.418701171875, -0.4042320251464844, -0.38976287841796875, -0.3752937316894531, -0.3608245849609375, -0.3463554382324219, -0.33188629150390625, -0.3174171447753906, -0.302947998046875, -0.2884788513183594, -0.27400970458984375, -0.2595405578613281, -0.2450714111328125, -0.23060226440429688, -0.21613311767578125, -0.20166397094726562, -0.18719482421875, -0.17272567749023438, -0.15825653076171875, -0.14378738403320312, -0.1293182373046875, -0.11484909057617188, -0.10037994384765625, -0.08591079711914062, -0.071441650390625, -0.056972503662109375, -0.04250335693359375, -0.028034210205078125, -0.0135650634765625, 0.000904083251953125, 0.01537322998046875, 0.029842376708984375, 0.0443115234375, 0.058780670166015625, 0.07324981689453125, 0.08771896362304688, 0.1021881103515625, 0.11665725708007812, 0.13112640380859375, 0.14559555053710938, 0.160064697265625, 0.17453384399414062, 0.18900299072265625, 0.20347213745117188, 0.2179412841796875, 0.23241043090820312, 0.24687957763671875, 0.2613487243652344, 0.27581787109375, 0.2902870178222656, 0.30475616455078125, 0.3192253112792969, 0.3336944580078125, 0.3481636047363281, 0.36263275146484375, 0.3771018981933594, 0.391571044921875, 0.4060401916503906, 0.42050933837890625, 0.4349784851074219, 0.4494476318359375, 0.4639167785644531, 0.47838592529296875, 0.4928550720214844, 0.50732421875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 6.0, 4.0, 3.0, 3.0, 3.0, 6.0, 2.0, 4.0, 13.0, 10.0, 15.0, 10.0, 17.0, 21.0, 30.0, 32.0, 59.0, 61.0, 77.0, 77.0, 94.0, 88.0, 77.0, 56.0, 61.0, 30.0, 26.0, 15.0, 18.0, 16.0, 13.0, 13.0, 11.0, 2.0, 7.0, 7.0, 2.0, 7.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.365478515625, -0.35546875, -0.345458984375, -0.33544921875, -0.325439453125, -0.3154296875, -0.305419921875, -0.29541015625, -0.285400390625, -0.275390625, -0.265380859375, -0.25537109375, -0.245361328125, -0.2353515625, -0.225341796875, -0.21533203125, -0.205322265625, -0.1953125, -0.185302734375, -0.17529296875, -0.165283203125, -0.1552734375, -0.145263671875, -0.13525390625, -0.125244140625, -0.115234375, -0.105224609375, -0.09521484375, -0.085205078125, -0.0751953125, -0.065185546875, -0.05517578125, -0.045166015625, -0.03515625, -0.025146484375, -0.01513671875, -0.005126953125, 0.0048828125, 0.014892578125, 0.02490234375, 0.034912109375, 0.044921875, 0.054931640625, 0.06494140625, 0.074951171875, 0.0849609375, 0.094970703125, 0.10498046875, 0.114990234375, 0.125, 0.135009765625, 0.14501953125, 0.155029296875, 0.1650390625, 0.175048828125, 0.18505859375, 0.195068359375, 0.205078125, 0.215087890625, 0.22509765625, 0.235107421875, 0.2451171875, 0.255126953125, 0.26513671875, 0.275146484375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 7.0, 6.0, 14.0, 14.0, 62.0, 83.0, 259.0, 304.0, 131.0, 53.0, 41.0, 18.0, 8.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.180699348449707, -14.828330039978027, -14.475959777832031, -14.123590469360352, -13.771220207214355, -13.418850898742676, -13.06648063659668, -12.714111328125, -12.36174201965332, -12.00937271118164, -11.657002449035645, -11.304633140563965, -10.952262878417969, -10.599893569946289, -10.24752426147461, -9.895153999328613, -9.542783737182617, -9.190414428710938, -8.838044166564941, -8.485674858093262, -8.133304595947266, -7.780935287475586, -7.428565502166748, -7.07619571685791, -6.723825931549072, -6.371456146240234, -6.0190863609313965, -5.666716575622559, -5.314347267150879, -4.961977005004883, -4.609607696533203, -4.257237911224365, -3.904867172241211, -3.552497386932373, -3.200127601623535, -2.8477580547332764, -2.4953882694244385, -2.1430184841156006, -1.7906489372253418, -1.438279151916504, -1.085909366607666, -0.7335396409034729, -0.3811699151992798, -0.028800249099731445, 0.32356953620910645, 0.6759393215179443, 1.0283088684082031, 1.380678653717041, 1.733048439025879, 2.085418224334717, 2.4377880096435547, 2.7901575565338135, 3.1425273418426514, 3.4948971271514893, 3.847266674041748, 4.199636459350586, 4.552006244659424, 4.904376029968262, 5.2567458152771, 5.6091156005859375, 5.961484909057617, 6.313855171203613, 6.666224479675293, 7.018594264984131, 7.370964050292969]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 7.0, 4.0, 6.0, 13.0, 11.0, 9.0, 18.0, 15.0, 18.0, 26.0, 16.0, 36.0, 31.0, 30.0, 65.0, 71.0, 67.0, 63.0, 67.0, 83.0, 71.0, 48.0, 33.0, 34.0, 22.0, 23.0, 20.0, 12.0, 19.0, 14.0, 12.0, 6.0, 10.0, 4.0, 3.0, 3.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.743718147277832, -6.538629055023193, -6.333540439605713, -6.128451347351074, -5.9233622550964355, -5.718273162841797, -5.513184547424316, -5.308095455169678, -5.103006362915039, -4.8979172706604, -4.69282865524292, -4.487739562988281, -4.282650470733643, -4.077561378479004, -3.8724727630615234, -3.6673836708068848, -3.4622950553894043, -3.2572062015533447, -3.052117109298706, -2.8470282554626465, -2.641939163208008, -2.4368503093719482, -2.2317614555358887, -2.02667236328125, -1.8215835094451904, -1.6164945363998413, -1.4114055633544922, -1.2063167095184326, -1.0012277364730835, -0.7961387634277344, -0.5910499095916748, -0.3859609365463257, -0.18087148666381836, 0.024217456579208374, 0.2293063998222351, 0.43439531326293945, 0.6394842863082886, 0.8445732593536377, 1.0496621131896973, 1.2547510862350464, 1.4598400592803955, 1.6649290323257446, 1.8700180053710938, 2.0751068592071533, 2.280195713043213, 2.4852848052978516, 2.690373659133911, 2.8954625129699707, 3.1005516052246094, 3.305640459060669, 3.5107295513153076, 3.715818405151367, 3.920907497406006, 4.1259965896606445, 4.331085205078125, 4.536174297332764, 4.741263389587402, 4.946352481842041, 5.1514410972595215, 5.35653018951416, 5.561619281768799, 5.7667083740234375, 5.971796989440918, 6.176886081695557, 6.381974697113037]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 9.0, 10.0, 11.0, 20.0, 24.0, 45.0, 81.0, 122.0, 251.0, 429.0, 869.0, 1721.0, 4017.0, 10872.0, 37081.0, 194090.0, 1855969.0, 1837738.0, 196283.0, 36192.0, 10661.0, 4011.0, 1723.0, 887.0, 469.0, 262.0, 163.0, 84.0, 61.0, 36.0, 28.0, 20.0, 14.0, 5.0, 5.0, 5.0, 3.0, 8.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92333984375, -0.8935546875, -0.86376953125, -0.833984375, -0.80419921875, -0.7744140625, -0.74462890625, -0.71484375, -0.68505859375, -0.6552734375, -0.62548828125, -0.595703125, -0.56591796875, -0.5361328125, -0.50634765625, -0.4765625, -0.44677734375, -0.4169921875, -0.38720703125, -0.357421875, -0.32763671875, -0.2978515625, -0.26806640625, -0.23828125, -0.20849609375, -0.1787109375, -0.14892578125, -0.119140625, -0.08935546875, -0.0595703125, -0.02978515625, 0.0, 0.02978515625, 0.0595703125, 0.08935546875, 0.119140625, 0.14892578125, 0.1787109375, 0.20849609375, 0.23828125, 0.26806640625, 0.2978515625, 0.32763671875, 0.357421875, 0.38720703125, 0.4169921875, 0.44677734375, 0.4765625, 0.50634765625, 0.5361328125, 0.56591796875, 0.595703125, 0.62548828125, 0.6552734375, 0.68505859375, 0.71484375, 0.74462890625, 0.7744140625, 0.80419921875, 0.833984375, 0.86376953125, 0.8935546875, 0.92333984375, 0.953125, 0.98291015625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 2.0, 4.0, 6.0, 5.0, 14.0, 11.0, 12.0, 17.0, 26.0, 14.0, 25.0, 34.0, 37.0, 31.0, 47.0, 47.0, 47.0, 37.0, 41.0, 52.0, 54.0, 46.0, 46.0, 44.0, 46.0, 43.0, 36.0, 39.0, 24.0, 24.0, 20.0, 15.0, 9.0, 11.0, 9.0, 13.0, 6.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.37060546875, -0.3587989807128906, -0.34699249267578125, -0.3351860046386719, -0.3233795166015625, -0.3115730285644531, -0.29976654052734375, -0.2879600524902344, -0.276153564453125, -0.2643470764160156, -0.25254058837890625, -0.24073410034179688, -0.2289276123046875, -0.21712112426757812, -0.20531463623046875, -0.19350814819335938, -0.18170166015625, -0.16989517211914062, -0.15808868408203125, -0.14628219604492188, -0.1344757080078125, -0.12266921997070312, -0.11086273193359375, -0.09905624389648438, -0.087249755859375, -0.07544326782226562, -0.06363677978515625, -0.051830291748046875, -0.0400238037109375, -0.028217315673828125, -0.01641082763671875, -0.004604339599609375, 0.0072021484375, 0.019008636474609375, 0.03081512451171875, 0.042621612548828125, 0.0544281005859375, 0.06623458862304688, 0.07804107666015625, 0.08984756469726562, 0.101654052734375, 0.11346054077148438, 0.12526702880859375, 0.13707351684570312, 0.1488800048828125, 0.16068649291992188, 0.17249298095703125, 0.18429946899414062, 0.19610595703125, 0.20791244506835938, 0.21971893310546875, 0.23152542114257812, 0.2433319091796875, 0.2551383972167969, 0.26694488525390625, 0.2787513732910156, 0.290557861328125, 0.3023643493652344, 0.31417083740234375, 0.3259773254394531, 0.3377838134765625, 0.3495903015136719, 0.36139678955078125, 0.3732032775878906, 0.385009765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 10.0, 16.0, 27.0, 62.0, 135.0, 385.0, 1338.0, 13730.0, 4127094.0, 48648.0, 2005.0, 499.0, 153.0, 90.0, 36.0, 21.0, 15.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16796875, -3.9915771484375, -3.815185546875, -3.6387939453125, -3.46240234375, -3.2860107421875, -3.109619140625, -2.9332275390625, -2.7568359375, -2.5804443359375, -2.404052734375, -2.2276611328125, -2.05126953125, -1.8748779296875, -1.698486328125, -1.5220947265625, -1.345703125, -1.1693115234375, -0.992919921875, -0.8165283203125, -0.64013671875, -0.4637451171875, -0.287353515625, -0.1109619140625, 0.0654296875, 0.2418212890625, 0.418212890625, 0.5946044921875, 0.77099609375, 0.9473876953125, 1.123779296875, 1.3001708984375, 1.4765625, 1.6529541015625, 1.829345703125, 2.0057373046875, 2.18212890625, 2.3585205078125, 2.534912109375, 2.7113037109375, 2.8876953125, 3.0640869140625, 3.240478515625, 3.4168701171875, 3.59326171875, 3.7696533203125, 3.946044921875, 4.1224365234375, 4.298828125, 4.4752197265625, 4.651611328125, 4.8280029296875, 5.00439453125, 5.1807861328125, 5.357177734375, 5.5335693359375, 5.7099609375, 5.8863525390625, 6.062744140625, 6.2391357421875, 6.41552734375, 6.5919189453125, 6.768310546875, 6.9447021484375, 7.12109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 9.0, 27.0, 47.0, 74.0, 156.0, 306.0, 644.0, 1190.0, 888.0, 380.0, 174.0, 85.0, 49.0, 23.0, 11.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.763671875, -3.670989990234375, -3.57830810546875, -3.485626220703125, -3.3929443359375, -3.300262451171875, -3.20758056640625, -3.114898681640625, -3.022216796875, -2.929534912109375, -2.83685302734375, -2.744171142578125, -2.6514892578125, -2.558807373046875, -2.46612548828125, -2.373443603515625, -2.28076171875, -2.188079833984375, -2.09539794921875, -2.002716064453125, -1.9100341796875, -1.817352294921875, -1.72467041015625, -1.631988525390625, -1.539306640625, -1.446624755859375, -1.35394287109375, -1.261260986328125, -1.1685791015625, -1.075897216796875, -0.98321533203125, -0.890533447265625, -0.7978515625, -0.705169677734375, -0.61248779296875, -0.519805908203125, -0.4271240234375, -0.334442138671875, -0.24176025390625, -0.149078369140625, -0.056396484375, 0.036285400390625, 0.12896728515625, 0.221649169921875, 0.3143310546875, 0.407012939453125, 0.49969482421875, 0.592376708984375, 0.68505859375, 0.777740478515625, 0.87042236328125, 0.963104248046875, 1.0557861328125, 1.148468017578125, 1.24114990234375, 1.333831787109375, 1.426513671875, 1.519195556640625, 1.61187744140625, 1.704559326171875, 1.7972412109375, 1.889923095703125, 1.98260498046875, 2.075286865234375, 2.16796875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 5.0, 9.0, 8.0, 10.0, 25.0, 55.0, 83.0, 172.0, 184.0, 173.0, 91.0, 70.0, 41.0, 27.0, 8.0, 15.0, 4.0, 5.0, 4.0, 4.0, 3.0, 0.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.804410934448242, -22.21473503112793, -21.62506103515625, -21.035385131835938, -20.445709228515625, -19.856033325195312, -19.266357421875, -18.67668342590332, -18.087007522583008, -17.497331619262695, -16.907657623291016, -16.317981719970703, -15.72830581665039, -15.138629913330078, -14.548954963684082, -13.959280014038086, -13.369604110717773, -12.779928207397461, -12.190253257751465, -11.600578308105469, -11.010902404785156, -10.421226501464844, -9.831551551818848, -9.241876602172852, -8.652200698852539, -8.062524795532227, -7.4728498458862305, -6.883174419403076, -6.293498992919922, -5.703823566436768, -5.114148139953613, -4.524472713470459, -3.934795379638672, -3.3451199531555176, -2.7554445266723633, -2.165769100189209, -1.5760936737060547, -0.9864182472229004, -0.3967428207397461, 0.1929326057434082, 0.7826080322265625, 1.3722834587097168, 1.961958885192871, 2.5516343116760254, 3.1413097381591797, 3.730985164642334, 4.320660591125488, 4.910336017608643, 5.500011444091797, 6.089686870574951, 6.6793622970581055, 7.26903772354126, 7.858713150024414, 8.448389053344727, 9.038064002990723, 9.627738952636719, 10.217414855957031, 10.807090759277344, 11.39676570892334, 11.986440658569336, 12.576116561889648, 13.165792465209961, 13.755467414855957, 14.345142364501953, 14.934818267822266]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 4.0, 8.0, 7.0, 19.0, 18.0, 24.0, 29.0, 39.0, 58.0, 57.0, 77.0, 118.0, 90.0, 102.0, 82.0, 64.0, 48.0, 42.0, 35.0, 28.0, 24.0, 15.0, 7.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.61494255065918, -16.147159576416016, -15.679378509521484, -15.211596488952637, -14.743814468383789, -14.276032447814941, -13.808250427246094, -13.34046745300293, -12.872686386108398, -12.40490436553955, -11.937122344970703, -11.469340324401855, -11.001558303833008, -10.53377628326416, -10.065994262695312, -9.598211288452148, -9.1304292678833, -8.662647247314453, -8.194865226745605, -7.727083206176758, -7.25930118560791, -6.7915191650390625, -6.323736667633057, -5.855954647064209, -5.388172626495361, -4.920390605926514, -4.452608585357666, -3.9848263263702393, -3.5170443058013916, -3.049262285232544, -2.581480026245117, -2.1136980056762695, -1.6459150314331055, -1.1781330108642578, -0.7103508710861206, -0.2425687313079834, 0.22521328926086426, 0.6929953098297119, 1.1607775688171387, 1.6285595893859863, 2.096341609954834, 2.5641236305236816, 3.0319056510925293, 3.499687910079956, 3.9674699306488037, 4.4352521896362305, 4.903034210205078, 5.370816230773926, 5.838598251342773, 6.306380271911621, 6.774162292480469, 7.241944313049316, 7.709726333618164, 8.177508354187012, 8.64529037475586, 9.113073348999023, 9.580854415893555, 10.048636436462402, 10.51641845703125, 10.984200477600098, 11.451982498168945, 11.919764518737793, 12.38754653930664, 12.855329513549805, 13.323111534118652]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 6.0, 4.0, 8.0, 10.0, 20.0, 32.0, 50.0, 86.0, 179.0, 301.0, 604.0, 1472.0, 4139.0, 14445.0, 81976.0, 702673.0, 205189.0, 26918.0, 6488.0, 2200.0, 871.0, 393.0, 206.0, 97.0, 67.0, 39.0, 22.0, 22.0, 11.0, 9.0, 6.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0537109375, -1.0182342529296875, -0.982757568359375, -0.9472808837890625, -0.91180419921875, -0.8763275146484375, -0.840850830078125, -0.8053741455078125, -0.7698974609375, -0.7344207763671875, -0.698944091796875, -0.6634674072265625, -0.62799072265625, -0.5925140380859375, -0.557037353515625, -0.5215606689453125, -0.486083984375, -0.4506072998046875, -0.415130615234375, -0.3796539306640625, -0.34417724609375, -0.3087005615234375, -0.273223876953125, -0.2377471923828125, -0.2022705078125, -0.1667938232421875, -0.131317138671875, -0.0958404541015625, -0.06036376953125, -0.0248870849609375, 0.010589599609375, 0.0460662841796875, 0.08154296875, 0.1170196533203125, 0.152496337890625, 0.1879730224609375, 0.22344970703125, 0.2589263916015625, 0.294403076171875, 0.3298797607421875, 0.3653564453125, 0.4008331298828125, 0.436309814453125, 0.4717864990234375, 0.50726318359375, 0.5427398681640625, 0.578216552734375, 0.6136932373046875, 0.649169921875, 0.6846466064453125, 0.720123291015625, 0.7555999755859375, 0.79107666015625, 0.8265533447265625, 0.862030029296875, 0.8975067138671875, 0.9329833984375, 0.9684600830078125, 1.003936767578125, 1.0394134521484375, 1.07489013671875, 1.1103668212890625, 1.145843505859375, 1.1813201904296875, 1.216796875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 13.0, 14.0, 21.0, 34.0, 45.0, 61.0, 105.0, 95.0, 120.0, 113.0, 115.0, 95.0, 58.0, 46.0, 26.0, 21.0, 16.0, 5.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4228515625, -1.38629150390625, -1.3497314453125, -1.31317138671875, -1.276611328125, -1.24005126953125, -1.2034912109375, -1.16693115234375, -1.13037109375, -1.09381103515625, -1.0572509765625, -1.02069091796875, -0.984130859375, -0.94757080078125, -0.9110107421875, -0.87445068359375, -0.837890625, -0.80133056640625, -0.7647705078125, -0.72821044921875, -0.691650390625, -0.65509033203125, -0.6185302734375, -0.58197021484375, -0.54541015625, -0.50885009765625, -0.4722900390625, -0.43572998046875, -0.399169921875, -0.36260986328125, -0.3260498046875, -0.28948974609375, -0.2529296875, -0.21636962890625, -0.1798095703125, -0.14324951171875, -0.106689453125, -0.07012939453125, -0.0335693359375, 0.00299072265625, 0.03955078125, 0.07611083984375, 0.1126708984375, 0.14923095703125, 0.185791015625, 0.22235107421875, 0.2589111328125, 0.29547119140625, 0.33203125, 0.36859130859375, 0.4051513671875, 0.44171142578125, 0.478271484375, 0.51483154296875, 0.5513916015625, 0.58795166015625, 0.62451171875, 0.66107177734375, 0.6976318359375, 0.73419189453125, 0.770751953125, 0.80731201171875, 0.8438720703125, 0.88043212890625, 0.9169921875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 6.0, 7.0, 8.0, 13.0, 18.0, 17.0, 26.0, 27.0, 35.0, 60.0, 100.0, 144.0, 238.0, 438.0, 853.0, 1975.0, 6507.0, 34324.0, 817026.0, 162298.0, 17340.0, 4071.0, 1422.0, 632.0, 343.0, 193.0, 126.0, 80.0, 53.0, 37.0, 27.0, 14.0, 19.0, 16.0, 14.0, 12.0, 10.0, 4.0, 3.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.1650390625, -1.130584716796875, -1.09613037109375, -1.061676025390625, -1.0272216796875, -0.992767333984375, -0.95831298828125, -0.923858642578125, -0.889404296875, -0.854949951171875, -0.82049560546875, -0.786041259765625, -0.7515869140625, -0.717132568359375, -0.68267822265625, -0.648223876953125, -0.61376953125, -0.579315185546875, -0.54486083984375, -0.510406494140625, -0.4759521484375, -0.441497802734375, -0.40704345703125, -0.372589111328125, -0.338134765625, -0.303680419921875, -0.26922607421875, -0.234771728515625, -0.2003173828125, -0.165863037109375, -0.13140869140625, -0.096954345703125, -0.0625, -0.028045654296875, 0.00640869140625, 0.040863037109375, 0.0753173828125, 0.109771728515625, 0.14422607421875, 0.178680419921875, 0.213134765625, 0.247589111328125, 0.28204345703125, 0.316497802734375, 0.3509521484375, 0.385406494140625, 0.41986083984375, 0.454315185546875, 0.48876953125, 0.523223876953125, 0.55767822265625, 0.592132568359375, 0.6265869140625, 0.661041259765625, 0.69549560546875, 0.729949951171875, 0.764404296875, 0.798858642578125, 0.83331298828125, 0.867767333984375, 0.9022216796875, 0.936676025390625, 0.97113037109375, 1.005584716796875, 1.0400390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 7.0, 11.0, 9.0, 13.0, 20.0, 16.0, 20.0, 27.0, 35.0, 35.0, 37.0, 41.0, 53.0, 58.0, 85.0, 81.0, 62.0, 68.0, 36.0, 50.0, 38.0, 30.0, 20.0, 28.0, 12.0, 15.0, 9.0, 12.0, 18.0, 7.0, 9.0, 6.0, 8.0, 2.0, 4.0, 2.0, 1.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.24609375, -2.17864990234375, -2.1112060546875, -2.04376220703125, -1.976318359375, -1.90887451171875, -1.8414306640625, -1.77398681640625, -1.70654296875, -1.63909912109375, -1.5716552734375, -1.50421142578125, -1.436767578125, -1.36932373046875, -1.3018798828125, -1.23443603515625, -1.1669921875, -1.09954833984375, -1.0321044921875, -0.96466064453125, -0.897216796875, -0.82977294921875, -0.7623291015625, -0.69488525390625, -0.62744140625, -0.55999755859375, -0.4925537109375, -0.42510986328125, -0.357666015625, -0.29022216796875, -0.2227783203125, -0.15533447265625, -0.087890625, -0.02044677734375, 0.0469970703125, 0.11444091796875, 0.181884765625, 0.24932861328125, 0.3167724609375, 0.38421630859375, 0.45166015625, 0.51910400390625, 0.5865478515625, 0.65399169921875, 0.721435546875, 0.78887939453125, 0.8563232421875, 0.92376708984375, 0.9912109375, 1.05865478515625, 1.1260986328125, 1.19354248046875, 1.260986328125, 1.32843017578125, 1.3958740234375, 1.46331787109375, 1.53076171875, 1.59820556640625, 1.6656494140625, 1.73309326171875, 1.800537109375, 1.86798095703125, 1.9354248046875, 2.00286865234375, 2.0703125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 2.0, 2.0, 5.0, 6.0, 8.0, 7.0, 10.0, 9.0, 17.0, 13.0, 21.0, 32.0, 33.0, 34.0, 57.0, 86.0, 137.0, 197.0, 341.0, 498.0, 996.0, 1765.0, 3751.0, 9124.0, 28469.0, 165787.0, 767752.0, 46214.0, 13038.0, 4979.0, 2226.0, 1118.0, 658.0, 375.0, 236.0, 151.0, 100.0, 79.0, 58.0, 35.0, 29.0, 14.0, 16.0, 15.0, 7.0, 2.0, 6.0, 7.0, 6.0, 7.0, 5.0, 3.0, 1.0, 3.0, 3.0, 5.0, 3.0], "bins": [-0.1251220703125, -0.12134933471679688, -0.11757659912109375, -0.11380386352539062, -0.1100311279296875, -0.10625839233398438, -0.10248565673828125, -0.09871292114257812, -0.094940185546875, -0.09116744995117188, -0.08739471435546875, -0.08362197875976562, -0.0798492431640625, -0.07607650756835938, -0.07230377197265625, -0.06853103637695312, -0.06475830078125, -0.060985565185546875, -0.05721282958984375, -0.053440093994140625, -0.0496673583984375, -0.045894622802734375, -0.04212188720703125, -0.038349151611328125, -0.034576416015625, -0.030803680419921875, -0.02703094482421875, -0.023258209228515625, -0.0194854736328125, -0.015712738037109375, -0.01194000244140625, -0.008167266845703125, -0.00439453125, -0.000621795654296875, 0.00315093994140625, 0.006923675537109375, 0.0106964111328125, 0.014469146728515625, 0.01824188232421875, 0.022014617919921875, 0.025787353515625, 0.029560089111328125, 0.03333282470703125, 0.037105560302734375, 0.0408782958984375, 0.044651031494140625, 0.04842376708984375, 0.052196502685546875, 0.05596923828125, 0.059741973876953125, 0.06351470947265625, 0.06728744506835938, 0.0710601806640625, 0.07483291625976562, 0.07860565185546875, 0.08237838745117188, 0.086151123046875, 0.08992385864257812, 0.09369659423828125, 0.09746932983398438, 0.1012420654296875, 0.10501480102539062, 0.10878753662109375, 0.11256027221679688, 0.1163330078125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 4.0, 6.0, 5.0, 4.0, 8.0, 11.0, 17.0, 18.0, 23.0, 19.0, 42.0, 44.0, 48.0, 77.0, 81.0, 99.0, 94.0, 103.0, 65.0, 53.0, 38.0, 30.0, 21.0, 13.0, 10.0, 17.0, 11.0, 7.0, 6.0, 2.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.933906555175781e-05, -3.825034946203232e-05, -3.7161633372306824e-05, -3.607291728258133e-05, -3.4984201192855835e-05, -3.389548510313034e-05, -3.2806769013404846e-05, -3.171805292367935e-05, -3.062933683395386e-05, -2.9540620744228363e-05, -2.845190465450287e-05, -2.7363188564777374e-05, -2.627447247505188e-05, -2.5185756385326385e-05, -2.409704029560089e-05, -2.3008324205875397e-05, -2.1919608116149902e-05, -2.0830892026424408e-05, -1.9742175936698914e-05, -1.865345984697342e-05, -1.7564743757247925e-05, -1.647602766752243e-05, -1.5387311577796936e-05, -1.4298595488071442e-05, -1.3209879398345947e-05, -1.2121163308620453e-05, -1.1032447218894958e-05, -9.943731129169464e-06, -8.85501503944397e-06, -7.766298949718475e-06, -6.677582859992981e-06, -5.5888667702674866e-06, -4.500150680541992e-06, -3.411434590816498e-06, -2.3227185010910034e-06, -1.234002411365509e-06, -1.4528632164001465e-07, 9.434297680854797e-07, 2.032145857810974e-06, 3.1208619475364685e-06, 4.209578037261963e-06, 5.298294126987457e-06, 6.387010216712952e-06, 7.475726306438446e-06, 8.56444239616394e-06, 9.653158485889435e-06, 1.074187457561493e-05, 1.1830590665340424e-05, 1.2919306755065918e-05, 1.4008022844791412e-05, 1.5096738934516907e-05, 1.61854550242424e-05, 1.7274171113967896e-05, 1.836288720369339e-05, 1.9451603293418884e-05, 2.054031938314438e-05, 2.1629035472869873e-05, 2.2717751562595367e-05, 2.3806467652320862e-05, 2.4895183742046356e-05, 2.598389983177185e-05, 2.7072615921497345e-05, 2.816133201122284e-05, 2.9250048100948334e-05, 3.0338764190673828e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 0.0, 4.0, 6.0, 11.0, 11.0, 10.0, 19.0, 32.0, 36.0, 53.0, 80.0, 102.0, 155.0, 260.0, 434.0, 787.0, 1351.0, 2306.0, 4573.0, 9862.0, 24107.0, 83287.0, 762770.0, 107502.0, 28373.0, 11285.0, 5140.0, 2476.0, 1399.0, 806.0, 465.0, 302.0, 174.0, 116.0, 86.0, 42.0, 37.0, 27.0, 25.0, 8.0, 8.0, 10.0, 9.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.102294921875, -0.09905529022216797, -0.09581565856933594, -0.0925760269165039, -0.08933639526367188, -0.08609676361083984, -0.08285713195800781, -0.07961750030517578, -0.07637786865234375, -0.07313823699951172, -0.06989860534667969, -0.06665897369384766, -0.06341934204101562, -0.060179710388183594, -0.05694007873535156, -0.05370044708251953, -0.0504608154296875, -0.04722118377685547, -0.04398155212402344, -0.040741920471191406, -0.037502288818359375, -0.034262657165527344, -0.031023025512695312, -0.02778339385986328, -0.02454376220703125, -0.02130413055419922, -0.018064498901367188, -0.014824867248535156, -0.011585235595703125, -0.008345603942871094, -0.0051059722900390625, -0.0018663406372070312, 0.001373291015625, 0.004612922668457031, 0.007852554321289062, 0.011092185974121094, 0.014331817626953125, 0.017571449279785156, 0.020811080932617188, 0.02405071258544922, 0.02729034423828125, 0.03052997589111328, 0.03376960754394531, 0.037009239196777344, 0.040248870849609375, 0.043488502502441406, 0.04672813415527344, 0.04996776580810547, 0.0532073974609375, 0.05644702911376953, 0.05968666076660156, 0.0629262924194336, 0.06616592407226562, 0.06940555572509766, 0.07264518737792969, 0.07588481903076172, 0.07912445068359375, 0.08236408233642578, 0.08560371398925781, 0.08884334564208984, 0.09208297729492188, 0.0953226089477539, 0.09856224060058594, 0.10180187225341797, 0.10504150390625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 4.0, 11.0, 8.0, 10.0, 11.0, 10.0, 12.0, 22.0, 31.0, 29.0, 24.0, 56.0, 72.0, 103.0, 99.0, 95.0, 88.0, 86.0, 47.0, 49.0, 28.0, 14.0, 21.0, 13.0, 9.0, 7.0, 13.0, 6.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2066650390625, -0.20105552673339844, -0.19544601440429688, -0.1898365020751953, -0.18422698974609375, -0.1786174774169922, -0.17300796508789062, -0.16739845275878906, -0.1617889404296875, -0.15617942810058594, -0.15056991577148438, -0.1449604034423828, -0.13935089111328125, -0.1337413787841797, -0.12813186645507812, -0.12252235412597656, -0.116912841796875, -0.11130332946777344, -0.10569381713867188, -0.10008430480957031, -0.09447479248046875, -0.08886528015136719, -0.08325576782226562, -0.07764625549316406, -0.0720367431640625, -0.06642723083496094, -0.060817718505859375, -0.05520820617675781, -0.04959869384765625, -0.04398918151855469, -0.038379669189453125, -0.03277015686035156, -0.02716064453125, -0.021551132202148438, -0.015941619873046875, -0.010332107543945312, -0.00472259521484375, 0.0008869171142578125, 0.006496429443359375, 0.012105941772460938, 0.0177154541015625, 0.023324966430664062, 0.028934478759765625, 0.03454399108886719, 0.04015350341796875, 0.04576301574707031, 0.051372528076171875, 0.05698204040527344, 0.062591552734375, 0.06820106506347656, 0.07381057739257812, 0.07942008972167969, 0.08502960205078125, 0.09063911437988281, 0.09624862670898438, 0.10185813903808594, 0.1074676513671875, 0.11307716369628906, 0.11868667602539062, 0.12429618835449219, 0.12990570068359375, 0.1355152130126953, 0.14112472534179688, 0.14673423767089844, 0.15234375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 19.0, 38.0, 82.0, 271.0, 464.0, 75.0, 30.0, 11.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.785268783569336, -19.27933120727539, -18.773391723632812, -18.267452239990234, -17.76151466369629, -17.255577087402344, -16.749637603759766, -16.243698120117188, -15.737760543823242, -15.23182201385498, -14.725883483886719, -14.219944953918457, -13.714006423950195, -13.208067893981934, -12.702129364013672, -12.19619083404541, -11.690252304077148, -11.184313774108887, -10.678375244140625, -10.172436714172363, -9.666498184204102, -9.16055965423584, -8.654621124267578, -8.148682594299316, -7.642744064331055, -7.136805534362793, -6.630867004394531, -6.1249284744262695, -5.618989944458008, -5.113051414489746, -4.607112884521484, -4.101174354553223, -3.595235824584961, -3.089297294616699, -2.5833587646484375, -2.077420234680176, -1.571481704711914, -1.0655431747436523, -0.5596046447753906, -0.053666114807128906, 0.4522724151611328, 0.9582109451293945, 1.4641494750976562, 1.970088005065918, 2.4760265350341797, 2.9819650650024414, 3.487903594970703, 3.993842124938965, 4.499780654907227, 5.005719184875488, 5.51165771484375, 6.017596244812012, 6.523534774780273, 7.029473304748535, 7.535411834716797, 8.041350364685059, 8.54728889465332, 9.053227424621582, 9.559165954589844, 10.065104484558105, 10.571043014526367, 11.076981544494629, 11.58292007446289, 12.088858604431152, 12.594797134399414]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 10.0, 7.0, 11.0, 10.0, 15.0, 17.0, 26.0, 19.0, 24.0, 37.0, 37.0, 62.0, 107.0, 168.0, 130.0, 69.0, 44.0, 38.0, 20.0, 20.0, 22.0, 15.0, 14.0, 13.0, 9.0, 8.0, 6.0, 5.0, 6.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.757657051086426, -5.540931701660156, -5.324206352233887, -5.107481002807617, -4.8907551765441895, -4.67402982711792, -4.45730447769165, -4.240579128265381, -4.023853302001953, -3.8071279525756836, -3.590402364730835, -3.3736770153045654, -3.156951427459717, -2.9402260780334473, -2.7235007286071777, -2.506775379180908, -2.2900500297546387, -2.073324680328369, -1.8565990924835205, -1.639873743057251, -1.423148274421692, -1.2064228057861328, -0.9896974563598633, -0.7729719877243042, -0.5562465190887451, -0.3395210802555084, -0.12279564142227173, 0.09392976760864258, 0.31065523624420166, 0.5273807048797607, 0.7441060543060303, 0.9608315229415894, 1.1775569915771484, 1.3942824602127075, 1.6110079288482666, 1.8277332782745361, 2.0444588661193848, 2.2611842155456543, 2.477909564971924, 2.6946349143981934, 2.911360502243042, 3.1280858516693115, 3.34481143951416, 3.5615367889404297, 3.778262138366699, 3.994987726211548, 4.211712837219238, 4.428438663482666, 4.6451640129089355, 4.861889362335205, 5.078614711761475, 5.295340538024902, 5.512065887451172, 5.728791236877441, 5.945516586303711, 6.1622419357299805, 6.37896728515625, 6.5956926345825195, 6.812417984008789, 7.029143333435059, 7.245869159698486, 7.462594509124756, 7.679319858551025, 7.896045207977295, 8.112771034240723]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 1.0, 2.0, 3.0, 10.0, 10.0, 6.0, 9.0, 16.0, 13.0, 15.0, 13.0, 19.0, 18.0, 28.0, 26.0, 30.0, 35.0, 59.0, 235.0, 127.0, 48.0, 35.0, 31.0, 27.0, 20.0, 19.0, 27.0, 17.0, 10.0, 17.0, 13.0, 10.0, 8.0, 9.0, 10.0, 3.0, 6.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.446533203125, -0.43294525146484375, -0.4193572998046875, -0.40576934814453125, -0.392181396484375, -0.37859344482421875, -0.3650054931640625, -0.35141754150390625, -0.33782958984375, -0.32424163818359375, -0.3106536865234375, -0.29706573486328125, -0.283477783203125, -0.26988983154296875, -0.2563018798828125, -0.24271392822265625, -0.2291259765625, -0.21553802490234375, -0.2019500732421875, -0.18836212158203125, -0.174774169921875, -0.16118621826171875, -0.1475982666015625, -0.13401031494140625, -0.12042236328125, -0.10683441162109375, -0.0932464599609375, -0.07965850830078125, -0.066070556640625, -0.05248260498046875, -0.0388946533203125, -0.02530670166015625, -0.01171875, 0.00186920166015625, 0.0154571533203125, 0.02904510498046875, 0.042633056640625, 0.05622100830078125, 0.0698089599609375, 0.08339691162109375, 0.09698486328125, 0.11057281494140625, 0.1241607666015625, 0.13774871826171875, 0.151336669921875, 0.16492462158203125, 0.1785125732421875, 0.19210052490234375, 0.2056884765625, 0.21927642822265625, 0.2328643798828125, 0.24645233154296875, 0.260040283203125, 0.27362823486328125, 0.2872161865234375, 0.30080413818359375, 0.31439208984375, 0.32798004150390625, 0.3415679931640625, 0.35515594482421875, 0.368743896484375, 0.38233184814453125, 0.3959197998046875, 0.40950775146484375, 0.423095703125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 9.0, 7.0, 1.0, 2.0, 3.0, 5.0, 6.0, 11.0, 17.0, 30.0, 63.0, 131.0, 307.0, 1012.0, 6654.0, 8359688.0, 18215.0, 1716.0, 384.0, 171.0, 77.0, 26.0, 15.0, 14.0, 8.0, 5.0, 7.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.210654258728027, -5.9687347412109375, -5.726815223693848, -5.484895706176758, -5.242976188659668, -5.001056671142578, -4.759137153625488, -4.51721715927124, -4.27529764175415, -4.0333781242370605, -3.7914586067199707, -3.549539089202881, -3.307619333267212, -3.065699815750122, -2.8237802982330322, -2.5818605422973633, -2.3399412631988525, -2.0980217456817627, -1.8561021089553833, -1.6141825914382935, -1.372262954711914, -1.1303434371948242, -0.8884239196777344, -0.646504282951355, -0.40458476543426514, -0.1626652032136917, 0.07925435900688171, 0.32117390632629395, 0.5630934834480286, 0.8050130605697632, 1.046932578086853, 1.2888522148132324, 1.5307717323303223, 1.772691249847412, 2.014610767364502, 2.256530284881592, 2.4984500408172607, 2.7403695583343506, 2.9822890758514404, 3.2242088317871094, 3.466128349304199, 3.708047866821289, 3.949967384338379, 4.191886901855469, 4.433806419372559, 4.675725936889648, 4.917645454406738, 5.159565448760986, 5.401484489440918, 5.643404006958008, 5.885323524475098, 6.1272430419921875, 6.369162559509277, 6.611082077026367, 6.853001594543457, 7.094921588897705, 7.336841106414795, 7.578760623931885, 7.820680141448975, 8.062600135803223, 8.304519653320312, 8.546439170837402, 8.788358688354492, 9.030278205871582, 9.272197723388672]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 4.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 5.0, 3.0, 2.0, 7.0, 4.0, 6.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.100747108459473, -6.846602916717529, -6.592458724975586, -6.338314533233643, -6.084170341491699, -5.830026149749756, -5.5758819580078125, -5.321737766265869, -5.067593574523926, -4.813449382781982, -4.559305191040039, -4.305160999298096, -4.051016807556152, -3.796872615814209, -3.5427284240722656, -3.2885842323303223, -3.034440040588379, -2.7802958488464355, -2.526151657104492, -2.272007465362549, -2.0178632736206055, -1.763719081878662, -1.5095748901367188, -1.2554306983947754, -1.001286506652832, -0.7471423149108887, -0.4929981231689453, -0.23885393142700195, 0.015290260314941406, 0.26943445205688477, 0.5235786437988281, 0.7777228355407715, 1.0318660736083984, 1.2860102653503418, 1.5401544570922852, 1.7942986488342285, 2.048442840576172, 2.3025870323181152, 2.5567312240600586, 2.810875415802002, 3.0650196075439453, 3.3191637992858887, 3.573307991027832, 3.8274521827697754, 4.081596374511719, 4.335740566253662, 4.5898847579956055, 4.844028949737549, 5.098173141479492, 5.3523173332214355, 5.606461524963379, 5.860605716705322, 6.114749908447266, 6.368894100189209, 6.623038291931152, 6.877182483673096, 7.131326675415039, 7.385470867156982, 7.639615058898926, 7.893759250640869, 8.147903442382812, 8.402048110961914, 8.6561918258667, 8.910335540771484, 9.164480209350586]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 9.0, 25.0, 23.0, 34.0, 54.0, 96.0, 200.0, 372.0, 1043.0, 3369.0, 15236.0, 83808.0, 292086.0, 103736.0, 18331.0, 3932.0, 1080.0, 387.0, 178.0, 100.0, 67.0, 41.0, 30.0, 13.0, 8.0, 5.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.41015625, -6.22467041015625, -6.0391845703125, -5.85369873046875, -5.668212890625, -5.48272705078125, -5.2972412109375, -5.11175537109375, -4.92626953125, -4.74078369140625, -4.5552978515625, -4.36981201171875, -4.184326171875, -3.99884033203125, -3.8133544921875, -3.62786865234375, -3.4423828125, -3.25689697265625, -3.0714111328125, -2.88592529296875, -2.700439453125, -2.51495361328125, -2.3294677734375, -2.14398193359375, -1.95849609375, -1.77301025390625, -1.5875244140625, -1.40203857421875, -1.216552734375, -1.03106689453125, -0.8455810546875, -0.66009521484375, -0.474609375, -0.28912353515625, -0.1036376953125, 0.08184814453125, 0.267333984375, 0.45281982421875, 0.6383056640625, 0.82379150390625, 1.00927734375, 1.19476318359375, 1.3802490234375, 1.56573486328125, 1.751220703125, 1.93670654296875, 2.1221923828125, 2.30767822265625, 2.4931640625, 2.67864990234375, 2.8641357421875, 3.04962158203125, 3.235107421875, 3.42059326171875, 3.6060791015625, 3.79156494140625, 3.97705078125, 4.16253662109375, 4.3480224609375, 4.53350830078125, 4.718994140625, 4.90447998046875, 5.0899658203125, 5.27545166015625, 5.4609375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 6.0, 13.0, 25.0, 30.0, 31.0, 38.0, 60.0, 72.0, 100.0, 110.0, 104.0, 92.0, 77.0, 59.0, 59.0, 38.0, 18.0, 17.0, 20.0, 12.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89794921875, -0.8699569702148438, -0.8419647216796875, -0.8139724731445312, -0.785980224609375, -0.7579879760742188, -0.7299957275390625, -0.7020034790039062, -0.67401123046875, -0.6460189819335938, -0.6180267333984375, -0.5900344848632812, -0.562042236328125, -0.5340499877929688, -0.5060577392578125, -0.47806549072265625, -0.4500732421875, -0.42208099365234375, -0.3940887451171875, -0.36609649658203125, -0.338104248046875, -0.31011199951171875, -0.2821197509765625, -0.25412750244140625, -0.22613525390625, -0.19814300537109375, -0.1701507568359375, -0.14215850830078125, -0.114166259765625, -0.08617401123046875, -0.0581817626953125, -0.03018951416015625, -0.002197265625, 0.02579498291015625, 0.0537872314453125, 0.08177947998046875, 0.109771728515625, 0.13776397705078125, 0.1657562255859375, 0.19374847412109375, 0.22174072265625, 0.24973297119140625, 0.2777252197265625, 0.30571746826171875, 0.333709716796875, 0.36170196533203125, 0.3896942138671875, 0.41768646240234375, 0.4456787109375, 0.47367095947265625, 0.5016632080078125, 0.5296554565429688, 0.557647705078125, 0.5856399536132812, 0.6136322021484375, 0.6416244506835938, 0.66961669921875, 0.6976089477539062, 0.7256011962890625, 0.7535934448242188, 0.781585693359375, 0.8095779418945312, 0.8375701904296875, 0.8655624389648438, 0.8935546875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 5.0, 4.0, 5.0, 12.0, 16.0, 29.0, 56.0, 83.0, 91.0, 61.0, 45.0, 24.0, 15.0, 6.0, 5.0, 7.0, 8.0, 7.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.62237548828125, -3.473726749420166, -3.325077772140503, -3.176429033279419, -3.027780055999756, -2.879131317138672, -2.730482578277588, -2.581833839416504, -2.433184862136841, -2.284536123275757, -2.1358871459960938, -1.9872384071350098, -1.8385895490646362, -1.6899406909942627, -1.5412919521331787, -1.3926430940628052, -1.2439942359924316, -1.095345377922058, -0.9466965794563293, -0.7980477809906006, -0.649398922920227, -0.5007500648498535, -0.35210126638412476, -0.203452467918396, -0.05480360984802246, 0.09384521842002869, 0.24249404668807983, 0.391142874956131, 0.5397917032241821, 0.6884405612945557, 0.8370893597602844, 0.9857381582260132, 1.1343865394592285, 1.283035397529602, 1.4316842555999756, 1.5803329944610596, 1.728981852531433, 1.8776307106018066, 2.0262794494628906, 2.1749281883239746, 2.3235771656036377, 2.4722259044647217, 2.6208748817443848, 2.7695236206054688, 2.9181723594665527, 3.066821336746216, 3.2154700756073, 3.364119052886963, 3.512767791748047, 3.661416530609131, 3.810065507888794, 3.958714246749878, 4.107363224029541, 4.256011962890625, 4.404660701751709, 4.553309440612793, 4.701958656311035, 4.850607395172119, 4.999256134033203, 5.147905349731445, 5.296554088592529, 5.445202827453613, 5.593851566314697, 5.742500305175781, 5.891149044036865]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 9.0, 3.0, 5.0, 3.0, 4.0, 8.0, 12.0, 24.0, 50.0, 67.0, 79.0, 71.0, 55.0, 23.0, 15.0, 6.0, 1.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2175278663635254, -3.1092283725738525, -3.0009288787841797, -2.892629384994507, -2.784329891204834, -2.676030397415161, -2.5677309036254883, -2.4594314098358154, -2.3511319160461426, -2.2428324222564697, -2.134532928466797, -2.026233434677124, -1.9179339408874512, -1.8096344470977783, -1.7013349533081055, -1.5930354595184326, -1.4847360849380493, -1.3764365911483765, -1.2681370973587036, -1.1598376035690308, -1.051538109779358, -0.9432386755943298, -0.834939181804657, -0.7266396880149841, -0.6183401942253113, -0.5100407004356384, -0.4017412066459656, -0.2934417426586151, -0.18514224886894226, -0.0768427848815918, 0.031456708908081055, 0.1397562026977539, 0.24805569648742676, 0.3563551902770996, 0.46465468406677246, 0.5729541778564453, 0.6812536716461182, 0.7895531058311462, 0.8978525996208191, 1.0061521530151367, 1.1144516468048096, 1.2227511405944824, 1.3310506343841553, 1.4393501281738281, 1.547649621963501, 1.6559491157531738, 1.7642486095428467, 1.8725481033325195, 1.9808474779129028, 2.089146852493286, 2.197446346282959, 2.305745840072632, 2.4140453338623047, 2.5223448276519775, 2.6306443214416504, 2.7389438152313232, 2.847243309020996, 2.955542802810669, 3.063842296600342, 3.1721417903900146, 3.2804412841796875, 3.3887407779693604, 3.497040271759033, 3.605339765548706, 3.713639259338379]}, "eval/loss": 5.143069744110107, "eval/wer": 1.9922848076160253, "eval/runtime": 936.1477, "eval/samples_per_second": 2.822, "eval/steps_per_second": 0.354, "train/train_runtime": 6254.5702, "train/train_samples_per_second": 4.563, "train/train_steps_per_second": 0.143, "train/total_flos": 0.0, "train/train_loss": 4.602872911590097} \ No newline at end of file +{"train/loss": 3.9886, "train/learning_rate": 1.5306122448979589e-06, "train/epoch": 1.0, "train/global_step": 892, "_runtime": 7667, "_timestamp": 1646228994, "_step": 894, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 4.0, 15.0, 91.0, 568.0, 276.0, 52.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.2979507446289, -57.26783752441406, -42.23772430419922, -27.20760726928711, -12.177494049072266, 2.8526229858398438, 17.882736206054688, 32.91284942626953, 47.942962646484375, 62.97307586669922, 78.00318908691406, 93.03330993652344, 108.06341552734375, 123.09353637695312, 138.1236572265625, 153.1537628173828, 168.18386840820312, 183.2139892578125, 198.2440948486328, 213.2742156982422, 228.3043212890625, 243.33444213867188, 258.36456298828125, 273.3946533203125, 288.4248046875, 303.4549255371094, 318.48504638671875, 333.51513671875, 348.5452575683594, 363.57537841796875, 378.6054992675781, 393.6356201171875, 408.6656799316406, 423.69580078125, 438.7259216308594, 453.7560119628906, 468.7861328125, 483.8162536621094, 498.84637451171875, 513.87646484375, 528.9066162109375, 543.9367065429688, 558.9668579101562, 573.9969482421875, 589.027099609375, 604.0571899414062, 619.0872802734375, 634.117431640625, 649.1475219726562, 664.1776123046875, 679.207763671875, 694.2378540039062, 709.2680053710938, 724.298095703125, 739.3281860351562, 754.3583374023438, 769.388427734375, 784.4185180664062, 799.4486694335938, 814.478759765625, 829.5089111328125, 844.5390014648438, 859.569091796875, 874.5992431640625, 889.6293334960938]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 6.0, 7.0, 11.0, 9.0, 13.0, 8.0, 12.0, 14.0, 11.0, 21.0, 29.0, 24.0, 17.0, 27.0, 32.0, 42.0, 41.0, 35.0, 69.0, 50.0, 54.0, 33.0, 43.0, 40.0, 34.0, 33.0, 37.0, 44.0, 17.0, 16.0, 17.0, 22.0, 23.0, 20.0, 12.0, 13.0, 9.0, 12.0, 11.0, 7.0, 7.0, 3.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0], "bins": [-187.4065704345703, -181.70559692382812, -176.00462341308594, -170.3036346435547, -164.6026611328125, -158.9016876220703, -153.20071411132812, -147.49972534179688, -141.7987518310547, -136.0977783203125, -130.3968048095703, -124.6958236694336, -118.99484252929688, -113.29386901855469, -107.5928955078125, -101.89191436767578, -96.1909408569336, -90.4899673461914, -84.78898620605469, -79.0880126953125, -73.38703155517578, -67.6860580444336, -61.98508071899414, -56.28410339355469, -50.583126068115234, -44.88214874267578, -39.18117141723633, -33.480194091796875, -27.779218673706055, -22.0782413482666, -16.37726593017578, -10.676288604736328, -4.975311279296875, 0.7256655693054199, 6.426642417907715, 12.127618789672852, 17.828596115112305, 23.529573440551758, 29.230548858642578, 34.93152618408203, 40.632503509521484, 46.33348083496094, 52.03445816040039, 57.735435485839844, 63.43640899658203, 69.13739013671875, 74.83836364746094, 80.53933715820312, 86.24031829833984, 91.94129180908203, 97.64227294921875, 103.34324645996094, 109.04422760009766, 114.74520111083984, 120.44618225097656, 126.14715576171875, 131.84812927246094, 137.54910278320312, 143.2500762939453, 148.95106506347656, 154.65203857421875, 160.35301208496094, 166.05398559570312, 171.75497436523438, 177.45594787597656]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 10.0, 4.0, 6.0, 9.0, 17.0, 11.0, 17.0, 11.0, 8.0, 17.0, 17.0, 17.0, 22.0, 21.0, 39.0, 37.0, 37.0, 35.0, 45.0, 41.0, 44.0, 35.0, 36.0, 53.0, 30.0, 37.0, 40.0, 27.0, 28.0, 31.0, 37.0, 21.0, 20.0, 20.0, 12.0, 14.0, 16.0, 14.0, 13.0, 6.0, 9.0, 4.0, 2.0, 11.0, 3.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.8203125, -2.726715087890625, -2.63311767578125, -2.539520263671875, -2.4459228515625, -2.352325439453125, -2.25872802734375, -2.165130615234375, -2.071533203125, -1.977935791015625, -1.88433837890625, -1.790740966796875, -1.6971435546875, -1.603546142578125, -1.50994873046875, -1.416351318359375, -1.32275390625, -1.229156494140625, -1.13555908203125, -1.041961669921875, -0.9483642578125, -0.854766845703125, -0.76116943359375, -0.667572021484375, -0.573974609375, -0.480377197265625, -0.38677978515625, -0.293182373046875, -0.1995849609375, -0.105987548828125, -0.01239013671875, 0.081207275390625, 0.1748046875, 0.268402099609375, 0.36199951171875, 0.455596923828125, 0.5491943359375, 0.642791748046875, 0.73638916015625, 0.829986572265625, 0.923583984375, 1.017181396484375, 1.11077880859375, 1.204376220703125, 1.2979736328125, 1.391571044921875, 1.48516845703125, 1.578765869140625, 1.67236328125, 1.765960693359375, 1.85955810546875, 1.953155517578125, 2.0467529296875, 2.140350341796875, 2.23394775390625, 2.327545166015625, 2.421142578125, 2.514739990234375, 2.60833740234375, 2.701934814453125, 2.7955322265625, 2.889129638671875, 2.98272705078125, 3.076324462890625, 3.169921875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 6.0, 8.0, 8.0, 12.0, 9.0, 14.0, 17.0, 22.0, 32.0, 43.0, 66.0, 68.0, 99.0, 132.0, 171.0, 248.0, 312.0, 466.0, 683.0, 1046.0, 1649.0, 2886.0, 5272.0, 10830.0, 25433.0, 75018.0, 590166.0, 3261944.0, 143562.0, 40160.0, 15802.0, 7394.0, 3940.0, 2196.0, 1401.0, 849.0, 662.0, 447.0, 294.0, 227.0, 149.0, 118.0, 105.0, 77.0, 48.0, 37.0, 36.0, 31.0, 16.0, 24.0, 14.0, 16.0, 8.0, 8.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 5.0], "bins": [-30.125, -29.12841796875, -28.1318359375, -27.13525390625, -26.138671875, -25.14208984375, -24.1455078125, -23.14892578125, -22.15234375, -21.15576171875, -20.1591796875, -19.16259765625, -18.166015625, -17.16943359375, -16.1728515625, -15.17626953125, -14.1796875, -13.18310546875, -12.1865234375, -11.18994140625, -10.193359375, -9.19677734375, -8.2001953125, -7.20361328125, -6.20703125, -5.21044921875, -4.2138671875, -3.21728515625, -2.220703125, -1.22412109375, -0.2275390625, 0.76904296875, 1.765625, 2.76220703125, 3.7587890625, 4.75537109375, 5.751953125, 6.74853515625, 7.7451171875, 8.74169921875, 9.73828125, 10.73486328125, 11.7314453125, 12.72802734375, 13.724609375, 14.72119140625, 15.7177734375, 16.71435546875, 17.7109375, 18.70751953125, 19.7041015625, 20.70068359375, 21.697265625, 22.69384765625, 23.6904296875, 24.68701171875, 25.68359375, 26.68017578125, 27.6767578125, 28.67333984375, 29.669921875, 30.66650390625, 31.6630859375, 32.65966796875, 33.65625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 9.0, 6.0, 16.0, 15.0, 16.0, 28.0, 48.0, 48.0, 78.0, 105.0, 139.0, 186.0, 281.0, 453.0, 722.0, 656.0, 386.0, 244.0, 162.0, 107.0, 98.0, 65.0, 65.0, 48.0, 25.0, 14.0, 17.0, 10.0, 13.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.25, -19.572021484375, -18.89404296875, -18.216064453125, -17.5380859375, -16.860107421875, -16.18212890625, -15.504150390625, -14.826171875, -14.148193359375, -13.47021484375, -12.792236328125, -12.1142578125, -11.436279296875, -10.75830078125, -10.080322265625, -9.40234375, -8.724365234375, -8.04638671875, -7.368408203125, -6.6904296875, -6.012451171875, -5.33447265625, -4.656494140625, -3.978515625, -3.300537109375, -2.62255859375, -1.944580078125, -1.2666015625, -0.588623046875, 0.08935546875, 0.767333984375, 1.4453125, 2.123291015625, 2.80126953125, 3.479248046875, 4.1572265625, 4.835205078125, 5.51318359375, 6.191162109375, 6.869140625, 7.547119140625, 8.22509765625, 8.903076171875, 9.5810546875, 10.259033203125, 10.93701171875, 11.614990234375, 12.29296875, 12.970947265625, 13.64892578125, 14.326904296875, 15.0048828125, 15.682861328125, 16.36083984375, 17.038818359375, 17.716796875, 18.394775390625, 19.07275390625, 19.750732421875, 20.4287109375, 21.106689453125, 21.78466796875, 22.462646484375, 23.140625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 7.0, 11.0, 13.0, 23.0, 30.0, 35.0, 48.0, 64.0, 93.0, 157.0, 237.0, 358.0, 670.0, 1683.0, 5761.0, 30858.0, 307033.0, 3546984.0, 263835.0, 27888.0, 5292.0, 1521.0, 598.0, 341.0, 235.0, 168.0, 96.0, 63.0, 52.0, 38.0, 32.0, 14.0, 12.0, 10.0, 8.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-55.03125, -53.28271484375, -51.5341796875, -49.78564453125, -48.037109375, -46.28857421875, -44.5400390625, -42.79150390625, -41.04296875, -39.29443359375, -37.5458984375, -35.79736328125, -34.048828125, -32.30029296875, -30.5517578125, -28.80322265625, -27.0546875, -25.30615234375, -23.5576171875, -21.80908203125, -20.060546875, -18.31201171875, -16.5634765625, -14.81494140625, -13.06640625, -11.31787109375, -9.5693359375, -7.82080078125, -6.072265625, -4.32373046875, -2.5751953125, -0.82666015625, 0.921875, 2.67041015625, 4.4189453125, 6.16748046875, 7.916015625, 9.66455078125, 11.4130859375, 13.16162109375, 14.91015625, 16.65869140625, 18.4072265625, 20.15576171875, 21.904296875, 23.65283203125, 25.4013671875, 27.14990234375, 28.8984375, 30.64697265625, 32.3955078125, 34.14404296875, 35.892578125, 37.64111328125, 39.3896484375, 41.13818359375, 42.88671875, 44.63525390625, 46.3837890625, 48.13232421875, 49.880859375, 51.62939453125, 53.3779296875, 55.12646484375, 56.875]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 14.0, 105.0, 385.0, 399.0, 89.0, 13.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-215.84393310546875, -206.4600830078125, -197.07623291015625, -187.69239807128906, -178.3085479736328, -168.92469787597656, -159.54086303710938, -150.15701293945312, -140.77316284179688, -131.38931274414062, -122.0054702758789, -112.62162780761719, -103.23777770996094, -93.85392761230469, -84.47008514404297, -75.08624267578125, -65.702392578125, -56.318546295166016, -46.93470001220703, -37.55085372924805, -28.167007446289062, -18.783161163330078, -9.399314880371094, -0.015472412109375, 9.368377685546875, 18.75222396850586, 28.136070251464844, 37.51991653442383, 46.90376281738281, 56.2876091003418, 65.67145538330078, 75.0552978515625, 84.43914794921875, 93.822998046875, 103.20684051513672, 112.59068298339844, 121.97453308105469, 131.35838317871094, 140.74221801757812, 150.12606811523438, 159.50991821289062, 168.89376831054688, 178.27761840820312, 187.6614532470703, 197.04530334472656, 206.4291534423828, 215.81298828125, 225.19683837890625, 234.5806884765625, 243.96453857421875, 253.348388671875, 262.73223876953125, 272.1160888671875, 281.4999084472656, 290.8837585449219, 300.2676086425781, 309.6514587402344, 319.0353088378906, 328.4191589355469, 337.8030090332031, 347.18682861328125, 356.5706787109375, 365.95452880859375, 375.33837890625, 384.72222900390625]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 2.0, 7.0, 5.0, 8.0, 12.0, 14.0, 10.0, 20.0, 23.0, 21.0, 22.0, 18.0, 32.0, 22.0, 22.0, 30.0, 43.0, 42.0, 39.0, 37.0, 31.0, 35.0, 31.0, 38.0, 38.0, 33.0, 32.0, 28.0, 32.0, 26.0, 19.0, 37.0, 20.0, 25.0, 10.0, 15.0, 17.0, 16.0, 17.0, 9.0, 10.0, 13.0, 8.0, 7.0, 2.0, 5.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-61.95584487915039, -60.02712631225586, -58.098411560058594, -56.16969299316406, -54.24097442626953, -52.312255859375, -50.38353729248047, -48.4548225402832, -46.52610397338867, -44.59738540649414, -42.668670654296875, -40.739952087402344, -38.81123352050781, -36.88251495361328, -34.95379638671875, -33.025081634521484, -31.096363067626953, -29.167644500732422, -27.238927841186523, -25.310211181640625, -23.381492614746094, -21.452774047851562, -19.524057388305664, -17.595340728759766, -15.666622161865234, -13.73790454864502, -11.809186935424805, -9.88046932220459, -7.951751708984375, -6.02303409576416, -4.094316482543945, -2.1655988693237305, -0.23688507080078125, 1.6918325424194336, 3.6205501556396484, 5.549267768859863, 7.477985382080078, 9.406702995300293, 11.335420608520508, 13.264138221740723, 15.192855834960938, 17.12157440185547, 19.050291061401367, 20.979007720947266, 22.907726287841797, 24.836444854736328, 26.765161514282227, 28.693878173828125, 30.622596740722656, 32.55131530761719, 34.48003387451172, 36.408748626708984, 38.337467193603516, 40.26618576049805, 42.19490051269531, 44.123619079589844, 46.052337646484375, 47.981056213378906, 49.90977478027344, 51.8384895324707, 53.767208099365234, 55.695926666259766, 57.62464141845703, 59.55335998535156, 61.482078552246094]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 3.0, 5.0, 7.0, 7.0, 17.0, 10.0, 21.0, 22.0, 19.0, 16.0, 28.0, 29.0, 38.0, 39.0, 35.0, 37.0, 35.0, 40.0, 35.0, 49.0, 40.0, 39.0, 53.0, 35.0, 34.0, 28.0, 38.0, 29.0, 24.0, 31.0, 24.0, 20.0, 18.0, 24.0, 13.0, 5.0, 7.0, 14.0, 8.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.40625, -3.29998779296875, -3.1937255859375, -3.08746337890625, -2.981201171875, -2.87493896484375, -2.7686767578125, -2.66241455078125, -2.55615234375, -2.44989013671875, -2.3436279296875, -2.23736572265625, -2.131103515625, -2.02484130859375, -1.9185791015625, -1.81231689453125, -1.7060546875, -1.59979248046875, -1.4935302734375, -1.38726806640625, -1.281005859375, -1.17474365234375, -1.0684814453125, -0.96221923828125, -0.85595703125, -0.74969482421875, -0.6434326171875, -0.53717041015625, -0.430908203125, -0.32464599609375, -0.2183837890625, -0.11212158203125, -0.005859375, 0.10040283203125, 0.2066650390625, 0.31292724609375, 0.419189453125, 0.52545166015625, 0.6317138671875, 0.73797607421875, 0.84423828125, 0.95050048828125, 1.0567626953125, 1.16302490234375, 1.269287109375, 1.37554931640625, 1.4818115234375, 1.58807373046875, 1.6943359375, 1.80059814453125, 1.9068603515625, 2.01312255859375, 2.119384765625, 2.22564697265625, 2.3319091796875, 2.43817138671875, 2.54443359375, 2.65069580078125, 2.7569580078125, 2.86322021484375, 2.969482421875, 3.07574462890625, 3.1820068359375, 3.28826904296875, 3.39453125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 8.0, 8.0, 13.0, 16.0, 19.0, 18.0, 37.0, 46.0, 81.0, 109.0, 140.0, 212.0, 287.0, 386.0, 585.0, 879.0, 1182.0, 1779.0, 2635.0, 4106.0, 6326.0, 10356.0, 18347.0, 35125.0, 74670.0, 167542.0, 303342.0, 218033.0, 99117.0, 45615.0, 22942.0, 12542.0, 7568.0, 4718.0, 3067.0, 2073.0, 1438.0, 912.0, 677.0, 463.0, 324.0, 246.0, 158.0, 121.0, 82.0, 59.0, 45.0, 35.0, 33.0, 20.0, 5.0, 7.0, 7.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56103515625, -0.5427474975585938, -0.5244598388671875, -0.5061721801757812, -0.487884521484375, -0.46959686279296875, -0.4513092041015625, -0.43302154541015625, -0.41473388671875, -0.39644622802734375, -0.3781585693359375, -0.35987091064453125, -0.341583251953125, -0.32329559326171875, -0.3050079345703125, -0.28672027587890625, -0.2684326171875, -0.25014495849609375, -0.2318572998046875, -0.21356964111328125, -0.195281982421875, -0.17699432373046875, -0.1587066650390625, -0.14041900634765625, -0.12213134765625, -0.10384368896484375, -0.0855560302734375, -0.06726837158203125, -0.048980712890625, -0.03069305419921875, -0.0124053955078125, 0.00588226318359375, 0.024169921875, 0.04245758056640625, 0.0607452392578125, 0.07903289794921875, 0.097320556640625, 0.11560821533203125, 0.1338958740234375, 0.15218353271484375, 0.17047119140625, 0.18875885009765625, 0.2070465087890625, 0.22533416748046875, 0.243621826171875, 0.26190948486328125, 0.2801971435546875, 0.29848480224609375, 0.3167724609375, 0.33506011962890625, 0.3533477783203125, 0.37163543701171875, 0.389923095703125, 0.40821075439453125, 0.4264984130859375, 0.44478607177734375, 0.46307373046875, 0.48136138916015625, 0.4996490478515625, 0.5179367065429688, 0.536224365234375, 0.5545120239257812, 0.5727996826171875, 0.5910873413085938, 0.609375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 7.0, 6.0, 7.0, 7.0, 13.0, 13.0, 19.0, 12.0, 14.0, 21.0, 22.0, 36.0, 31.0, 43.0, 37.0, 39.0, 41.0, 30.0, 35.0, 44.0, 1074.0, 35.0, 36.0, 38.0, 33.0, 46.0, 31.0, 29.0, 25.0, 34.0, 25.0, 27.0, 13.0, 19.0, 18.0, 11.0, 5.0, 13.0, 6.0, 5.0, 6.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-2.453125, -2.38079833984375, -2.3084716796875, -2.23614501953125, -2.163818359375, -2.09149169921875, -2.0191650390625, -1.94683837890625, -1.87451171875, -1.80218505859375, -1.7298583984375, -1.65753173828125, -1.585205078125, -1.51287841796875, -1.4405517578125, -1.36822509765625, -1.2958984375, -1.22357177734375, -1.1512451171875, -1.07891845703125, -1.006591796875, -0.93426513671875, -0.8619384765625, -0.78961181640625, -0.71728515625, -0.64495849609375, -0.5726318359375, -0.50030517578125, -0.427978515625, -0.35565185546875, -0.2833251953125, -0.21099853515625, -0.138671875, -0.06634521484375, 0.0059814453125, 0.07830810546875, 0.150634765625, 0.22296142578125, 0.2952880859375, 0.36761474609375, 0.43994140625, 0.51226806640625, 0.5845947265625, 0.65692138671875, 0.729248046875, 0.80157470703125, 0.8739013671875, 0.94622802734375, 1.0185546875, 1.09088134765625, 1.1632080078125, 1.23553466796875, 1.307861328125, 1.38018798828125, 1.4525146484375, 1.52484130859375, 1.59716796875, 1.66949462890625, 1.7418212890625, 1.81414794921875, 1.886474609375, 1.95880126953125, 2.0311279296875, 2.10345458984375, 2.17578125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 10.0, 7.0, 22.0, 28.0, 42.0, 71.0, 83.0, 142.0, 184.0, 326.0, 467.0, 802.0, 1226.0, 1775.0, 2914.0, 4930.0, 7982.0, 13186.0, 22162.0, 38312.0, 67263.0, 124524.0, 346759.0, 1153099.0, 135616.0, 73224.0, 41065.0, 24111.0, 14278.0, 8553.0, 5093.0, 3245.0, 2003.0, 1289.0, 800.0, 532.0, 306.0, 226.0, 154.0, 113.0, 83.0, 40.0, 19.0, 23.0, 14.0, 9.0, 5.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0], "bins": [-0.318115234375, -0.30849456787109375, -0.2988739013671875, -0.28925323486328125, -0.279632568359375, -0.27001190185546875, -0.2603912353515625, -0.25077056884765625, -0.24114990234375, -0.23152923583984375, -0.2219085693359375, -0.21228790283203125, -0.202667236328125, -0.19304656982421875, -0.1834259033203125, -0.17380523681640625, -0.1641845703125, -0.15456390380859375, -0.1449432373046875, -0.13532257080078125, -0.125701904296875, -0.11608123779296875, -0.1064605712890625, -0.09683990478515625, -0.08721923828125, -0.07759857177734375, -0.0679779052734375, -0.05835723876953125, -0.048736572265625, -0.03911590576171875, -0.0294952392578125, -0.01987457275390625, -0.01025390625, -0.00063323974609375, 0.0089874267578125, 0.01860809326171875, 0.028228759765625, 0.03784942626953125, 0.0474700927734375, 0.05709075927734375, 0.06671142578125, 0.07633209228515625, 0.0859527587890625, 0.09557342529296875, 0.105194091796875, 0.11481475830078125, 0.1244354248046875, 0.13405609130859375, 0.1436767578125, 0.15329742431640625, 0.1629180908203125, 0.17253875732421875, 0.182159423828125, 0.19178009033203125, 0.2014007568359375, 0.21102142333984375, 0.22064208984375, 0.23026275634765625, 0.2398834228515625, 0.24950408935546875, 0.259124755859375, 0.26874542236328125, 0.2783660888671875, 0.28798675537109375, 0.297607421875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 5.0, 3.0, 4.0, 11.0, 8.0, 9.0, 17.0, 12.0, 24.0, 30.0, 34.0, 39.0, 40.0, 68.0, 108.0, 178.0, 100.0, 71.0, 35.0, 40.0, 26.0, 26.0, 20.0, 15.0, 7.0, 10.0, 10.0, 6.0, 6.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.017913818359375, -0.01740741729736328, -0.016901016235351562, -0.016394615173339844, -0.015888214111328125, -0.015381813049316406, -0.014875411987304688, -0.014369010925292969, -0.01386260986328125, -0.013356208801269531, -0.012849807739257812, -0.012343406677246094, -0.011837005615234375, -0.011330604553222656, -0.010824203491210938, -0.010317802429199219, -0.0098114013671875, -0.009305000305175781, -0.008798599243164062, -0.008292198181152344, -0.007785797119140625, -0.007279396057128906, -0.0067729949951171875, -0.006266593933105469, -0.00576019287109375, -0.005253791809082031, -0.0047473907470703125, -0.004240989685058594, -0.003734588623046875, -0.0032281875610351562, -0.0027217864990234375, -0.0022153854370117188, -0.001708984375, -0.0012025833129882812, -0.0006961822509765625, -0.00018978118896484375, 0.000316619873046875, 0.0008230209350585938, 0.0013294219970703125, 0.0018358230590820312, 0.00234222412109375, 0.0028486251831054688, 0.0033550262451171875, 0.0038614273071289062, 0.004367828369140625, 0.004874229431152344, 0.0053806304931640625, 0.005887031555175781, 0.0063934326171875, 0.006899833679199219, 0.0074062347412109375, 0.007912635803222656, 0.008419036865234375, 0.008925437927246094, 0.009431838989257812, 0.009938240051269531, 0.01044464111328125, 0.010951042175292969, 0.011457443237304688, 0.011963844299316406, 0.012470245361328125, 0.012976646423339844, 0.013483047485351562, 0.013989448547363281, 0.014495849609375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 6.0, 12.0, 9.0, 15.0, 20.0, 16.0, 13.0, 21.0, 33.0, 36.0, 54.0, 54.0, 83.0, 126.0, 126.0, 183.0, 315.0, 2369.0, 959639.0, 83637.0, 814.0, 230.0, 172.0, 118.0, 101.0, 63.0, 57.0, 37.0, 42.0, 20.0, 22.0, 13.0, 17.0, 12.0, 9.0, 8.0, 12.0, 10.0, 7.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.29931640625, -0.29046630859375, -0.2816162109375, -0.27276611328125, -0.263916015625, -0.25506591796875, -0.2462158203125, -0.23736572265625, -0.228515625, -0.21966552734375, -0.2108154296875, -0.20196533203125, -0.193115234375, -0.18426513671875, -0.1754150390625, -0.16656494140625, -0.15771484375, -0.14886474609375, -0.1400146484375, -0.13116455078125, -0.122314453125, -0.11346435546875, -0.1046142578125, -0.09576416015625, -0.0869140625, -0.07806396484375, -0.0692138671875, -0.06036376953125, -0.051513671875, -0.04266357421875, -0.0338134765625, -0.02496337890625, -0.01611328125, -0.00726318359375, 0.0015869140625, 0.01043701171875, 0.019287109375, 0.02813720703125, 0.0369873046875, 0.04583740234375, 0.0546875, 0.06353759765625, 0.0723876953125, 0.08123779296875, 0.090087890625, 0.09893798828125, 0.1077880859375, 0.11663818359375, 0.12548828125, 0.13433837890625, 0.1431884765625, 0.15203857421875, 0.160888671875, 0.16973876953125, 0.1785888671875, 0.18743896484375, 0.1962890625, 0.20513916015625, 0.2139892578125, 0.22283935546875, 0.231689453125, 0.24053955078125, 0.2493896484375, 0.25823974609375, 0.26708984375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 51.0, 864.0, 85.0, 12.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08904317021369934, -0.08130837976932526, -0.07357358187437057, -0.0658387839794159, -0.05810399353504181, -0.050369199365377426, -0.04263440519571304, -0.03489961102604866, -0.027164816856384277, -0.019430022686719894, -0.011695228517055511, -0.0039604343473911285, 0.0037743598222732544, 0.011509153991937637, 0.01924394816160202, 0.026978742331266403, 0.034713536500930786, 0.04244833067059517, 0.05018312484025955, 0.057917919009923935, 0.06565271317958832, 0.0733875036239624, 0.08112230151891708, 0.08885709941387177, 0.09659188985824585, 0.10432668030261993, 0.11206147819757462, 0.1197962760925293, 0.12753106653690338, 0.13526585698127747, 0.14300066232681274, 0.15073545277118683, 0.1584702432155609, 0.166205033659935, 0.17393982410430908, 0.18167462944984436, 0.18940941989421844, 0.19714421033859253, 0.2048790156841278, 0.2126138061285019, 0.22034859657287598, 0.22808338701725006, 0.23581817746162415, 0.24355298280715942, 0.2512877583503723, 0.2590225636959076, 0.26675736904144287, 0.27449214458465576, 0.28222694993019104, 0.2899617552757263, 0.2976965308189392, 0.3054313361644745, 0.31316614151000977, 0.32090091705322266, 0.32863572239875793, 0.3363704979419708, 0.3441053032875061, 0.3518401086330414, 0.3595748841762543, 0.36730968952178955, 0.37504446506500244, 0.3827792704105377, 0.390514075756073, 0.3982488512992859, 0.40598365664482117]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 11.0, 10.0, 18.0, 17.0, 20.0, 23.0, 30.0, 36.0, 31.0, 27.0, 42.0, 52.0, 48.0, 49.0, 37.0, 50.0, 49.0, 58.0, 47.0, 44.0, 49.0, 44.0, 37.0, 24.0, 31.0, 21.0, 12.0, 12.0, 15.0, 16.0, 17.0, 2.0, 7.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027567923069000244, -0.026634935289621353, -0.02570194937288761, -0.02476896345615387, -0.02383597567677498, -0.022902987897396088, -0.021970001980662346, -0.021037016063928604, -0.020104028284549713, -0.019171040505170822, -0.01823805458843708, -0.01730506867170334, -0.016372080892324448, -0.015439094044268131, -0.014506107196211815, -0.013573120348155499, -0.012640133500099182, -0.011707146652042866, -0.01077415980398655, -0.009841172955930233, -0.008908186107873917, -0.0079751992598176, -0.007042212411761284, -0.0061092255637049675, -0.005176238715648651, -0.004243251867592335, -0.0033102650195360184, -0.002377278171479702, -0.0014442913234233856, -0.0005113044753670692, 0.00042168237268924713, 0.0013546692207455635, 0.00228765606880188, 0.0032206429168581963, 0.004153629764914513, 0.005086616612970829, 0.006019603461027145, 0.006952590309083462, 0.007885577157139778, 0.008818564005196095, 0.009751550853252411, 0.010684537701308727, 0.011617524549365044, 0.01255051139742136, 0.013483498245477676, 0.014416485093533993, 0.01534947194159031, 0.01628245785832405, 0.017215445637702942, 0.018148433417081833, 0.019081419333815575, 0.020014405250549316, 0.020947393029928207, 0.0218803808093071, 0.02281336672604084, 0.023746352642774582, 0.024679340422153473, 0.025612328201532364, 0.026545314118266106, 0.027478300034999847, 0.02841128781437874, 0.02934427559375763, 0.03027726151049137, 0.031210247427225113, 0.032143235206604004]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 3.0, 5.0, 7.0, 7.0, 17.0, 10.0, 21.0, 22.0, 19.0, 16.0, 28.0, 29.0, 38.0, 40.0, 34.0, 37.0, 36.0, 39.0, 35.0, 49.0, 40.0, 39.0, 53.0, 35.0, 34.0, 28.0, 38.0, 28.0, 25.0, 31.0, 24.0, 20.0, 18.0, 24.0, 13.0, 5.0, 7.0, 14.0, 8.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.40625, -3.29998779296875, -3.1937255859375, -3.08746337890625, -2.981201171875, -2.87493896484375, -2.7686767578125, -2.66241455078125, -2.55615234375, -2.44989013671875, -2.3436279296875, -2.23736572265625, -2.131103515625, -2.02484130859375, -1.9185791015625, -1.81231689453125, -1.7060546875, -1.59979248046875, -1.4935302734375, -1.38726806640625, -1.281005859375, -1.17474365234375, -1.0684814453125, -0.96221923828125, -0.85595703125, -0.74969482421875, -0.6434326171875, -0.53717041015625, -0.430908203125, -0.32464599609375, -0.2183837890625, -0.11212158203125, -0.005859375, 0.10040283203125, 0.2066650390625, 0.31292724609375, 0.419189453125, 0.52545166015625, 0.6317138671875, 0.73797607421875, 0.84423828125, 0.95050048828125, 1.0567626953125, 1.16302490234375, 1.269287109375, 1.37554931640625, 1.4818115234375, 1.58807373046875, 1.6943359375, 1.80059814453125, 1.9068603515625, 2.01312255859375, 2.119384765625, 2.22564697265625, 2.3319091796875, 2.43817138671875, 2.54443359375, 2.65069580078125, 2.7569580078125, 2.86322021484375, 2.969482421875, 3.07574462890625, 3.1820068359375, 3.28826904296875, 3.39453125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 9.0, 18.0, 21.0, 14.0, 41.0, 55.0, 58.0, 94.0, 134.0, 187.0, 228.0, 374.0, 481.0, 682.0, 1021.0, 1544.0, 2413.0, 3721.0, 6144.0, 10769.0, 21208.0, 50146.0, 175080.0, 507438.0, 169333.0, 48739.0, 20760.0, 10801.0, 6135.0, 3617.0, 2309.0, 1575.0, 1020.0, 705.0, 465.0, 336.0, 226.0, 176.0, 136.0, 94.0, 68.0, 40.0, 28.0, 35.0, 20.0, 16.0, 6.0, 9.0, 7.0, 3.0, 4.0, 5.0, 2.0, 0.0, 4.0], "bins": [-11.6875, -11.3277587890625, -10.968017578125, -10.6082763671875, -10.24853515625, -9.8887939453125, -9.529052734375, -9.1693115234375, -8.8095703125, -8.4498291015625, -8.090087890625, -7.7303466796875, -7.37060546875, -7.0108642578125, -6.651123046875, -6.2913818359375, -5.931640625, -5.5718994140625, -5.212158203125, -4.8524169921875, -4.49267578125, -4.1329345703125, -3.773193359375, -3.4134521484375, -3.0537109375, -2.6939697265625, -2.334228515625, -1.9744873046875, -1.61474609375, -1.2550048828125, -0.895263671875, -0.5355224609375, -0.17578125, 0.1839599609375, 0.543701171875, 0.9034423828125, 1.26318359375, 1.6229248046875, 1.982666015625, 2.3424072265625, 2.7021484375, 3.0618896484375, 3.421630859375, 3.7813720703125, 4.14111328125, 4.5008544921875, 4.860595703125, 5.2203369140625, 5.580078125, 5.9398193359375, 6.299560546875, 6.6593017578125, 7.01904296875, 7.3787841796875, 7.738525390625, 8.0982666015625, 8.4580078125, 8.8177490234375, 9.177490234375, 9.5372314453125, 9.89697265625, 10.2567138671875, 10.616455078125, 10.9761962890625, 11.3359375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 5.0, 6.0, 4.0, 6.0, 5.0, 9.0, 11.0, 15.0, 7.0, 14.0, 17.0, 21.0, 27.0, 22.0, 31.0, 25.0, 37.0, 40.0, 65.0, 76.0, 102.0, 169.0, 1449.0, 280.0, 127.0, 70.0, 65.0, 38.0, 33.0, 44.0, 32.0, 43.0, 31.0, 23.0, 17.0, 21.0, 13.0, 9.0, 7.0, 6.0, 7.0, 7.0, 7.0, 0.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0390625, -13.6234130859375, -13.207763671875, -12.7921142578125, -12.37646484375, -11.9608154296875, -11.545166015625, -11.1295166015625, -10.7138671875, -10.2982177734375, -9.882568359375, -9.4669189453125, -9.05126953125, -8.6356201171875, -8.219970703125, -7.8043212890625, -7.388671875, -6.9730224609375, -6.557373046875, -6.1417236328125, -5.72607421875, -5.3104248046875, -4.894775390625, -4.4791259765625, -4.0634765625, -3.6478271484375, -3.232177734375, -2.8165283203125, -2.40087890625, -1.9852294921875, -1.569580078125, -1.1539306640625, -0.73828125, -0.3226318359375, 0.093017578125, 0.5086669921875, 0.92431640625, 1.3399658203125, 1.755615234375, 2.1712646484375, 2.5869140625, 3.0025634765625, 3.418212890625, 3.8338623046875, 4.24951171875, 4.6651611328125, 5.080810546875, 5.4964599609375, 5.912109375, 6.3277587890625, 6.743408203125, 7.1590576171875, 7.57470703125, 7.9903564453125, 8.406005859375, 8.8216552734375, 9.2373046875, 9.6529541015625, 10.068603515625, 10.4842529296875, 10.89990234375, 11.3155517578125, 11.731201171875, 12.1468505859375, 12.5625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 8.0, 8.0, 8.0, 7.0, 8.0, 11.0, 15.0, 14.0, 27.0, 22.0, 26.0, 35.0, 43.0, 46.0, 92.0, 192.0, 511.0, 2076.0, 32795.0, 3012639.0, 92088.0, 3691.0, 697.0, 240.0, 109.0, 65.0, 40.0, 22.0, 27.0, 20.0, 15.0, 17.0, 10.0, 8.0, 11.0, 9.0, 10.0, 9.0, 9.0, 2.0, 10.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-56.90625, -55.04833984375, -53.1904296875, -51.33251953125, -49.474609375, -47.61669921875, -45.7587890625, -43.90087890625, -42.04296875, -40.18505859375, -38.3271484375, -36.46923828125, -34.611328125, -32.75341796875, -30.8955078125, -29.03759765625, -27.1796875, -25.32177734375, -23.4638671875, -21.60595703125, -19.748046875, -17.89013671875, -16.0322265625, -14.17431640625, -12.31640625, -10.45849609375, -8.6005859375, -6.74267578125, -4.884765625, -3.02685546875, -1.1689453125, 0.68896484375, 2.546875, 4.40478515625, 6.2626953125, 8.12060546875, 9.978515625, 11.83642578125, 13.6943359375, 15.55224609375, 17.41015625, 19.26806640625, 21.1259765625, 22.98388671875, 24.841796875, 26.69970703125, 28.5576171875, 30.41552734375, 32.2734375, 34.13134765625, 35.9892578125, 37.84716796875, 39.705078125, 41.56298828125, 43.4208984375, 45.27880859375, 47.13671875, 48.99462890625, 50.8525390625, 52.71044921875, 54.568359375, 56.42626953125, 58.2841796875, 60.14208984375, 62.0]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 981.0, 33.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1167.9273681640625, -1144.395751953125, -1120.8641357421875, -1097.33251953125, -1073.8009033203125, -1050.269287109375, -1026.737548828125, -1003.2059936523438, -979.67431640625, -956.1427001953125, -932.611083984375, -909.0794677734375, -885.5477905273438, -862.0161743164062, -838.4845581054688, -814.9529418945312, -791.4213256835938, -767.8897094726562, -744.3580932617188, -720.826416015625, -697.2947998046875, -673.76318359375, -650.2315673828125, -626.699951171875, -603.1683349609375, -579.63671875, -556.1051025390625, -532.573486328125, -509.04180908203125, -485.51019287109375, -461.97857666015625, -438.44696044921875, -414.9153137207031, -391.3836975097656, -367.85205078125, -344.3204345703125, -320.788818359375, -297.2571716308594, -273.7255554199219, -250.1939239501953, -226.66229248046875, -203.1306610107422, -179.59902954101562, -156.06741333007812, -132.53578186035156, -109.004150390625, -85.4725341796875, -61.94090270996094, -38.409271240234375, -14.877643585205078, 8.653984069824219, 32.18560791015625, 55.71723937988281, 79.24887084960938, 102.78048706054688, 126.31211853027344, 149.84375, 173.37538146972656, 196.90701293945312, 220.43862915039062, 243.9702606201172, 267.50189208984375, 291.03350830078125, 314.56512451171875, 338.0967712402344]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 8.0, 5.0, 9.0, 22.0, 21.0, 27.0, 27.0, 30.0, 36.0, 53.0, 50.0, 41.0, 49.0, 63.0, 64.0, 50.0, 66.0, 49.0, 57.0, 59.0, 29.0, 36.0, 31.0, 27.0, 20.0, 21.0, 10.0, 12.0, 9.0, 9.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-68.7646484375, -66.6091079711914, -64.45357513427734, -62.298038482666016, -60.14250183105469, -57.986961364746094, -55.831424713134766, -53.67588806152344, -51.52035140991211, -49.36481475830078, -47.20927810668945, -45.053741455078125, -42.89820098876953, -40.74266815185547, -38.587127685546875, -36.43159103393555, -34.27605438232422, -32.12051773071289, -29.964981079101562, -27.8094425201416, -25.653905868530273, -23.498369216918945, -21.342830657958984, -19.187294006347656, -17.031757354736328, -14.876220703125, -12.720683097839355, -10.565145492553711, -8.409608840942383, -6.254072189331055, -4.09853458404541, -1.9429969787597656, 0.21253204345703125, 2.3680691719055176, 4.523606300354004, 6.67914342880249, 8.834680557250977, 10.990217208862305, 13.14575481414795, 15.301292419433594, 17.456829071044922, 19.61236572265625, 21.767902374267578, 23.92344093322754, 26.078977584838867, 28.234514236450195, 30.390052795410156, 32.545589447021484, 34.70112609863281, 36.85666275024414, 39.01219940185547, 41.1677360534668, 43.323272705078125, 45.47881317138672, 47.63434982299805, 49.789886474609375, 51.9454231262207, 54.10095977783203, 56.25649642944336, 58.41203308105469, 60.56757354736328, 62.723106384277344, 64.87864685058594, 67.0341796875, 69.1897201538086]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 1.0, 3.0, 6.0, 7.0, 8.0, 17.0, 14.0, 12.0, 20.0, 14.0, 17.0, 29.0, 34.0, 41.0, 29.0, 32.0, 33.0, 48.0, 32.0, 38.0, 47.0, 35.0, 44.0, 42.0, 34.0, 45.0, 33.0, 39.0, 29.0, 31.0, 20.0, 30.0, 24.0, 18.0, 13.0, 16.0, 17.0, 6.0, 4.0, 10.0, 8.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.216796875, -3.107757568359375, -2.99871826171875, -2.889678955078125, -2.7806396484375, -2.671600341796875, -2.56256103515625, -2.453521728515625, -2.344482421875, -2.235443115234375, -2.12640380859375, -2.017364501953125, -1.9083251953125, -1.799285888671875, -1.69024658203125, -1.581207275390625, -1.47216796875, -1.363128662109375, -1.25408935546875, -1.145050048828125, -1.0360107421875, -0.926971435546875, -0.81793212890625, -0.708892822265625, -0.599853515625, -0.490814208984375, -0.38177490234375, -0.272735595703125, -0.1636962890625, -0.054656982421875, 0.05438232421875, 0.163421630859375, 0.2724609375, 0.381500244140625, 0.49053955078125, 0.599578857421875, 0.7086181640625, 0.817657470703125, 0.92669677734375, 1.035736083984375, 1.144775390625, 1.253814697265625, 1.36285400390625, 1.471893310546875, 1.5809326171875, 1.689971923828125, 1.79901123046875, 1.908050537109375, 2.01708984375, 2.126129150390625, 2.23516845703125, 2.344207763671875, 2.4532470703125, 2.562286376953125, 2.67132568359375, 2.780364990234375, 2.889404296875, 2.998443603515625, 3.10748291015625, 3.216522216796875, 3.3255615234375, 3.434600830078125, 3.54364013671875, 3.652679443359375, 3.76171875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 6.0, 11.0, 9.0, 17.0, 20.0, 40.0, 60.0, 93.0, 123.0, 251.0, 366.0, 720.0, 1286.0, 2245.0, 4614.0, 9925.0, 23941.0, 75934.0, 940691.0, 2957046.0, 118879.0, 33522.0, 12841.0, 5538.0, 2682.0, 1391.0, 785.0, 467.0, 284.0, 163.0, 118.0, 52.0, 48.0, 31.0, 30.0, 13.0, 13.0, 12.0, 5.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.03125, -25.1064453125, -24.181640625, -23.2568359375, -22.33203125, -21.4072265625, -20.482421875, -19.5576171875, -18.6328125, -17.7080078125, -16.783203125, -15.8583984375, -14.93359375, -14.0087890625, -13.083984375, -12.1591796875, -11.234375, -10.3095703125, -9.384765625, -8.4599609375, -7.53515625, -6.6103515625, -5.685546875, -4.7607421875, -3.8359375, -2.9111328125, -1.986328125, -1.0615234375, -0.13671875, 0.7880859375, 1.712890625, 2.6376953125, 3.5625, 4.4873046875, 5.412109375, 6.3369140625, 7.26171875, 8.1865234375, 9.111328125, 10.0361328125, 10.9609375, 11.8857421875, 12.810546875, 13.7353515625, 14.66015625, 15.5849609375, 16.509765625, 17.4345703125, 18.359375, 19.2841796875, 20.208984375, 21.1337890625, 22.05859375, 22.9833984375, 23.908203125, 24.8330078125, 25.7578125, 26.6826171875, 27.607421875, 28.5322265625, 29.45703125, 30.3818359375, 31.306640625, 32.2314453125, 33.15625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 3.0, 7.0, 5.0, 6.0, 14.0, 19.0, 12.0, 16.0, 20.0, 31.0, 55.0, 37.0, 72.0, 84.0, 130.0, 146.0, 222.0, 328.0, 495.0, 648.0, 521.0, 358.0, 230.0, 149.0, 106.0, 95.0, 48.0, 46.0, 38.0, 31.0, 24.0, 23.0, 15.0, 7.0, 12.0, 4.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.203125, -14.68896484375, -14.1748046875, -13.66064453125, -13.146484375, -12.63232421875, -12.1181640625, -11.60400390625, -11.08984375, -10.57568359375, -10.0615234375, -9.54736328125, -9.033203125, -8.51904296875, -8.0048828125, -7.49072265625, -6.9765625, -6.46240234375, -5.9482421875, -5.43408203125, -4.919921875, -4.40576171875, -3.8916015625, -3.37744140625, -2.86328125, -2.34912109375, -1.8349609375, -1.32080078125, -0.806640625, -0.29248046875, 0.2216796875, 0.73583984375, 1.25, 1.76416015625, 2.2783203125, 2.79248046875, 3.306640625, 3.82080078125, 4.3349609375, 4.84912109375, 5.36328125, 5.87744140625, 6.3916015625, 6.90576171875, 7.419921875, 7.93408203125, 8.4482421875, 8.96240234375, 9.4765625, 9.99072265625, 10.5048828125, 11.01904296875, 11.533203125, 12.04736328125, 12.5615234375, 13.07568359375, 13.58984375, 14.10400390625, 14.6181640625, 15.13232421875, 15.646484375, 16.16064453125, 16.6748046875, 17.18896484375, 17.703125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 8.0, 12.0, 13.0, 13.0, 42.0, 59.0, 103.0, 174.0, 272.0, 398.0, 687.0, 1099.0, 1831.0, 3011.0, 5147.0, 8631.0, 15425.0, 29657.0, 62882.0, 157555.0, 658881.0, 2515382.0, 484784.0, 132264.0, 55288.0, 26700.0, 14053.0, 7995.0, 4736.0, 2764.0, 1755.0, 1046.0, 675.0, 367.0, 247.0, 132.0, 81.0, 61.0, 30.0, 14.0, 8.0, 6.0, 1.0, 4.0, 2.0, 1.0], "bins": [-30.09375, -29.330322265625, -28.56689453125, -27.803466796875, -27.0400390625, -26.276611328125, -25.51318359375, -24.749755859375, -23.986328125, -23.222900390625, -22.45947265625, -21.696044921875, -20.9326171875, -20.169189453125, -19.40576171875, -18.642333984375, -17.87890625, -17.115478515625, -16.35205078125, -15.588623046875, -14.8251953125, -14.061767578125, -13.29833984375, -12.534912109375, -11.771484375, -11.008056640625, -10.24462890625, -9.481201171875, -8.7177734375, -7.954345703125, -7.19091796875, -6.427490234375, -5.6640625, -4.900634765625, -4.13720703125, -3.373779296875, -2.6103515625, -1.846923828125, -1.08349609375, -0.320068359375, 0.443359375, 1.206787109375, 1.97021484375, 2.733642578125, 3.4970703125, 4.260498046875, 5.02392578125, 5.787353515625, 6.55078125, 7.314208984375, 8.07763671875, 8.841064453125, 9.6044921875, 10.367919921875, 11.13134765625, 11.894775390625, 12.658203125, 13.421630859375, 14.18505859375, 14.948486328125, 15.7119140625, 16.475341796875, 17.23876953125, 18.002197265625, 18.765625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 9.0, 13.0, 21.0, 17.0, 34.0, 63.0, 80.0, 103.0, 136.0, 133.0, 114.0, 99.0, 71.0, 41.0, 31.0, 14.0, 9.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-148.42059326171875, -145.14511108398438, -141.86962890625, -138.59414672851562, -135.3186798095703, -132.04319763183594, -128.76771545410156, -125.49223327636719, -122.21675109863281, -118.94126892089844, -115.6657943725586, -112.39031219482422, -109.11483001708984, -105.83935546875, -102.56387329101562, -99.28839111328125, -96.01290893554688, -92.7374267578125, -89.46195220947266, -86.18647003173828, -82.9109878540039, -79.63551330566406, -76.36003112792969, -73.08454895019531, -69.80907440185547, -66.5335922241211, -63.258113861083984, -59.982635498046875, -56.7071533203125, -53.43167495727539, -50.15619659423828, -46.880714416503906, -43.6052360534668, -40.32975769042969, -37.05427551269531, -33.7787971496582, -30.503314971923828, -27.22783660888672, -23.952356338500977, -20.676876068115234, -17.401395797729492, -14.12591552734375, -10.850435256958008, -7.574955940246582, -4.29947566986084, -1.023996353149414, 2.251483917236328, 5.52696418762207, 8.802444458007812, 12.077924728393555, 15.353404998779297, 18.628883361816406, 21.90436553955078, 25.17984390258789, 28.455324172973633, 31.730804443359375, 35.00628662109375, 38.28176498413086, 41.557247161865234, 44.832725524902344, 48.10820770263672, 51.38368606567383, 54.65916442871094, 57.93464660644531, 61.21012496948242]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 10.0, 13.0, 7.0, 14.0, 14.0, 16.0, 20.0, 21.0, 31.0, 41.0, 26.0, 34.0, 34.0, 48.0, 42.0, 47.0, 39.0, 57.0, 42.0, 44.0, 46.0, 40.0, 44.0, 37.0, 36.0, 26.0, 27.0, 25.0, 25.0, 15.0, 15.0, 11.0, 8.0, 10.0, 8.0, 6.0, 6.0, 3.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.133914947509766, -55.247379302978516, -53.360843658447266, -51.474308013916016, -49.587772369384766, -47.701236724853516, -45.814697265625, -43.92816162109375, -42.0416259765625, -40.15509033203125, -38.2685546875, -36.38201904296875, -34.4954833984375, -32.60894775390625, -30.722410202026367, -28.835874557495117, -26.9493408203125, -25.06280517578125, -23.17626953125, -21.28973388671875, -19.4031982421875, -17.51666259765625, -15.630125045776367, -13.743589401245117, -11.857053756713867, -9.970518112182617, -8.083982467651367, -6.197445869445801, -4.310910224914551, -2.424374580383301, -0.5378379821777344, 1.3486976623535156, 3.2352294921875, 5.12176513671875, 7.008301258087158, 8.894837379455566, 10.781373023986816, 12.667908668518066, 14.554445266723633, 16.440980911254883, 18.327516555786133, 20.214052200317383, 22.100587844848633, 23.987125396728516, 25.873661041259766, 27.760196685791016, 29.646732330322266, 31.533267974853516, 33.419803619384766, 35.306339263916016, 37.192874908447266, 39.079410552978516, 40.965946197509766, 42.852481842041016, 44.73902130126953, 46.62555694580078, 48.51209259033203, 50.39862823486328, 52.28516387939453, 54.17169952392578, 56.05823516845703, 57.94477081298828, 59.83130645751953, 61.71784210205078, 63.60437774658203]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 9.0, 6.0, 10.0, 8.0, 7.0, 9.0, 20.0, 18.0, 22.0, 28.0, 23.0, 33.0, 33.0, 34.0, 39.0, 38.0, 45.0, 46.0, 57.0, 49.0, 48.0, 57.0, 44.0, 33.0, 28.0, 34.0, 27.0, 31.0, 29.0, 20.0, 25.0, 11.0, 13.0, 13.0, 10.0, 11.0, 7.0, 8.0, 4.0, 2.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.896484375, -3.768280029296875, -3.64007568359375, -3.511871337890625, -3.3836669921875, -3.255462646484375, -3.12725830078125, -2.999053955078125, -2.870849609375, -2.742645263671875, -2.61444091796875, -2.486236572265625, -2.3580322265625, -2.229827880859375, -2.10162353515625, -1.973419189453125, -1.84521484375, -1.717010498046875, -1.58880615234375, -1.460601806640625, -1.3323974609375, -1.204193115234375, -1.07598876953125, -0.947784423828125, -0.819580078125, -0.691375732421875, -0.56317138671875, -0.434967041015625, -0.3067626953125, -0.178558349609375, -0.05035400390625, 0.077850341796875, 0.2060546875, 0.334259033203125, 0.46246337890625, 0.590667724609375, 0.7188720703125, 0.847076416015625, 0.97528076171875, 1.103485107421875, 1.231689453125, 1.359893798828125, 1.48809814453125, 1.616302490234375, 1.7445068359375, 1.872711181640625, 2.00091552734375, 2.129119873046875, 2.25732421875, 2.385528564453125, 2.51373291015625, 2.641937255859375, 2.7701416015625, 2.898345947265625, 3.02655029296875, 3.154754638671875, 3.282958984375, 3.411163330078125, 3.53936767578125, 3.667572021484375, 3.7957763671875, 3.923980712890625, 4.05218505859375, 4.180389404296875, 4.30859375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 0.0, 12.0, 15.0, 25.0, 28.0, 43.0, 56.0, 93.0, 119.0, 151.0, 212.0, 347.0, 434.0, 629.0, 895.0, 1201.0, 1830.0, 2794.0, 4239.0, 6700.0, 11037.0, 19025.0, 35404.0, 67529.0, 133831.0, 245926.0, 239278.0, 129626.0, 64652.0, 34002.0, 18206.0, 10755.0, 6538.0, 4061.0, 2680.0, 1788.0, 1297.0, 905.0, 652.0, 402.0, 310.0, 244.0, 156.0, 126.0, 93.0, 53.0, 37.0, 45.0, 25.0, 15.0, 8.0, 10.0, 9.0, 2.0, 4.0, 0.0, 2.0], "bins": [-0.587890625, -0.5700607299804688, -0.5522308349609375, -0.5344009399414062, -0.516571044921875, -0.49874114990234375, -0.4809112548828125, -0.46308135986328125, -0.44525146484375, -0.42742156982421875, -0.4095916748046875, -0.39176177978515625, -0.373931884765625, -0.35610198974609375, -0.3382720947265625, -0.32044219970703125, -0.3026123046875, -0.28478240966796875, -0.2669525146484375, -0.24912261962890625, -0.231292724609375, -0.21346282958984375, -0.1956329345703125, -0.17780303955078125, -0.15997314453125, -0.14214324951171875, -0.1243133544921875, -0.10648345947265625, -0.088653564453125, -0.07082366943359375, -0.0529937744140625, -0.03516387939453125, -0.017333984375, 0.00049591064453125, 0.0183258056640625, 0.03615570068359375, 0.053985595703125, 0.07181549072265625, 0.0896453857421875, 0.10747528076171875, 0.12530517578125, 0.14313507080078125, 0.1609649658203125, 0.17879486083984375, 0.196624755859375, 0.21445465087890625, 0.2322845458984375, 0.25011444091796875, 0.2679443359375, 0.28577423095703125, 0.3036041259765625, 0.32143402099609375, 0.339263916015625, 0.35709381103515625, 0.3749237060546875, 0.39275360107421875, 0.41058349609375, 0.42841339111328125, 0.4462432861328125, 0.46407318115234375, 0.481903076171875, 0.49973297119140625, 0.5175628662109375, 0.5353927612304688, 0.55322265625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 6.0, 8.0, 5.0, 16.0, 18.0, 17.0, 17.0, 24.0, 20.0, 32.0, 29.0, 41.0, 32.0, 40.0, 39.0, 51.0, 45.0, 40.0, 1075.0, 54.0, 37.0, 51.0, 49.0, 34.0, 31.0, 26.0, 25.0, 29.0, 26.0, 18.0, 21.0, 13.0, 12.0, 12.0, 9.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.396484375, -2.308258056640625, -2.22003173828125, -2.131805419921875, -2.0435791015625, -1.955352783203125, -1.86712646484375, -1.778900146484375, -1.690673828125, -1.602447509765625, -1.51422119140625, -1.425994873046875, -1.3377685546875, -1.249542236328125, -1.16131591796875, -1.073089599609375, -0.98486328125, -0.896636962890625, -0.80841064453125, -0.720184326171875, -0.6319580078125, -0.543731689453125, -0.45550537109375, -0.367279052734375, -0.279052734375, -0.190826416015625, -0.10260009765625, -0.014373779296875, 0.0738525390625, 0.162078857421875, 0.25030517578125, 0.338531494140625, 0.4267578125, 0.514984130859375, 0.60321044921875, 0.691436767578125, 0.7796630859375, 0.867889404296875, 0.95611572265625, 1.044342041015625, 1.132568359375, 1.220794677734375, 1.30902099609375, 1.397247314453125, 1.4854736328125, 1.573699951171875, 1.66192626953125, 1.750152587890625, 1.83837890625, 1.926605224609375, 2.01483154296875, 2.103057861328125, 2.1912841796875, 2.279510498046875, 2.36773681640625, 2.455963134765625, 2.544189453125, 2.632415771484375, 2.72064208984375, 2.808868408203125, 2.8970947265625, 2.985321044921875, 3.07354736328125, 3.161773681640625, 3.25]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 2.0, 5.0, 7.0, 7.0, 20.0, 30.0, 60.0, 81.0, 112.0, 179.0, 327.0, 551.0, 842.0, 1349.0, 2204.0, 3655.0, 5900.0, 10170.0, 16764.0, 28867.0, 49793.0, 91480.0, 170362.0, 1294631.0, 187207.0, 100478.0, 54734.0, 31362.0, 18310.0, 11026.0, 6517.0, 3889.0, 2364.0, 1483.0, 899.0, 551.0, 359.0, 212.0, 129.0, 76.0, 57.0, 35.0, 25.0, 8.0, 9.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.315185546875, -0.30487823486328125, -0.2945709228515625, -0.28426361083984375, -0.273956298828125, -0.26364898681640625, -0.2533416748046875, -0.24303436279296875, -0.23272705078125, -0.22241973876953125, -0.2121124267578125, -0.20180511474609375, -0.191497802734375, -0.18119049072265625, -0.1708831787109375, -0.16057586669921875, -0.1502685546875, -0.13996124267578125, -0.1296539306640625, -0.11934661865234375, -0.109039306640625, -0.09873199462890625, -0.0884246826171875, -0.07811737060546875, -0.06781005859375, -0.05750274658203125, -0.0471954345703125, -0.03688812255859375, -0.026580810546875, -0.01627349853515625, -0.0059661865234375, 0.00434112548828125, 0.0146484375, 0.02495574951171875, 0.0352630615234375, 0.04557037353515625, 0.055877685546875, 0.06618499755859375, 0.0764923095703125, 0.08679962158203125, 0.09710693359375, 0.10741424560546875, 0.1177215576171875, 0.12802886962890625, 0.138336181640625, 0.14864349365234375, 0.1589508056640625, 0.16925811767578125, 0.1795654296875, 0.18987274169921875, 0.2001800537109375, 0.21048736572265625, 0.220794677734375, 0.23110198974609375, 0.2414093017578125, 0.25171661376953125, 0.26202392578125, 0.27233123779296875, 0.2826385498046875, 0.29294586181640625, 0.303253173828125, 0.31356048583984375, 0.3238677978515625, 0.33417510986328125, 0.344482421875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 5.0, 3.0, 4.0, 4.0, 4.0, 4.0, 6.0, 7.0, 13.0, 7.0, 23.0, 36.0, 39.0, 51.0, 55.0, 127.0, 194.0, 134.0, 66.0, 58.0, 46.0, 31.0, 14.0, 15.0, 4.0, 5.0, 7.0, 9.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0108795166015625, -0.010485172271728516, -0.010090827941894531, -0.009696483612060547, -0.009302139282226562, -0.008907794952392578, -0.008513450622558594, -0.00811910629272461, -0.007724761962890625, -0.007330417633056641, -0.006936073303222656, -0.006541728973388672, -0.0061473846435546875, -0.005753040313720703, -0.005358695983886719, -0.004964351654052734, -0.00457000732421875, -0.004175662994384766, -0.0037813186645507812, -0.003386974334716797, -0.0029926300048828125, -0.002598285675048828, -0.0022039413452148438, -0.0018095970153808594, -0.001415252685546875, -0.0010209083557128906, -0.0006265640258789062, -0.00023221969604492188, 0.0001621246337890625, 0.0005564689636230469, 0.0009508132934570312, 0.0013451576232910156, 0.001739501953125, 0.0021338462829589844, 0.0025281906127929688, 0.002922534942626953, 0.0033168792724609375, 0.003711223602294922, 0.004105567932128906, 0.004499912261962891, 0.004894256591796875, 0.005288600921630859, 0.005682945251464844, 0.006077289581298828, 0.0064716339111328125, 0.006865978240966797, 0.007260322570800781, 0.007654666900634766, 0.00804901123046875, 0.008443355560302734, 0.008837699890136719, 0.009232044219970703, 0.009626388549804688, 0.010020732879638672, 0.010415077209472656, 0.01080942153930664, 0.011203765869140625, 0.01159811019897461, 0.011992454528808594, 0.012386798858642578, 0.012781143188476562, 0.013175487518310547, 0.013569831848144531, 0.013964176177978516, 0.0143585205078125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 3.0, 1.0, 10.0, 11.0, 13.0, 19.0, 22.0, 46.0, 54.0, 102.0, 154.0, 350.0, 7394.0, 1007657.0, 31598.0, 570.0, 197.0, 94.0, 74.0, 39.0, 25.0, 23.0, 12.0, 8.0, 8.0, 12.0, 8.0, 7.0, 4.0, 2.0, 5.0, 1.0, 3.0, 6.0, 0.0, 2.0, 2.0, 2.0, 4.0], "bins": [-0.357666015625, -0.3484077453613281, -0.33914947509765625, -0.3298912048339844, -0.3206329345703125, -0.3113746643066406, -0.30211639404296875, -0.2928581237792969, -0.283599853515625, -0.2743415832519531, -0.26508331298828125, -0.2558250427246094, -0.2465667724609375, -0.23730850219726562, -0.22805023193359375, -0.21879196166992188, -0.20953369140625, -0.20027542114257812, -0.19101715087890625, -0.18175888061523438, -0.1725006103515625, -0.16324234008789062, -0.15398406982421875, -0.14472579956054688, -0.135467529296875, -0.12620925903320312, -0.11695098876953125, -0.10769271850585938, -0.0984344482421875, -0.08917617797851562, -0.07991790771484375, -0.07065963745117188, -0.0614013671875, -0.052143096923828125, -0.04288482666015625, -0.033626556396484375, -0.0243682861328125, -0.015110015869140625, -0.00585174560546875, 0.003406524658203125, 0.012664794921875, 0.021923065185546875, 0.03118133544921875, 0.040439605712890625, 0.0496978759765625, 0.058956146240234375, 0.06821441650390625, 0.07747268676757812, 0.08673095703125, 0.09598922729492188, 0.10524749755859375, 0.11450576782226562, 0.1237640380859375, 0.13302230834960938, 0.14228057861328125, 0.15153884887695312, 0.160797119140625, 0.17005538940429688, 0.17931365966796875, 0.18857192993164062, 0.1978302001953125, 0.20708847045898438, 0.21634674072265625, 0.22560501098632812, 0.23486328125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 10.0, 30.0, 310.0, 578.0, 71.0, 19.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1947118639945984, -0.18916688859462738, -0.18362189829349518, -0.17807692289352417, -0.17253194749355316, -0.16698697209358215, -0.16144198179244995, -0.15589700639247894, -0.15035203099250793, -0.14480705559253693, -0.13926206529140472, -0.13371708989143372, -0.1281721144914627, -0.1226271316409111, -0.1170821487903595, -0.11153717339038849, -0.10599218308925629, -0.10044720023870468, -0.09490222483873367, -0.08935724198818207, -0.08381226658821106, -0.07826728373765945, -0.07272230088710785, -0.06717732548713684, -0.061632342636585236, -0.05608736351132393, -0.05054238438606262, -0.04499740153551102, -0.03945242241024971, -0.0339074432849884, -0.028362460434436798, -0.02281748130917549, -0.01727248728275299, -0.01172750722616911, -0.006182527169585228, -0.000637546181678772, 0.004907432943582535, 0.010452412068843842, 0.015997394919395447, 0.021542374044656754, 0.02708735316991806, 0.03263233229517937, 0.038177311420440674, 0.04372229427099228, 0.049267273396253586, 0.05481225252151489, 0.0603572353720665, 0.0659022182226181, 0.07144719362258911, 0.07699217647314072, 0.08253715187311172, 0.08808213472366333, 0.09362711012363434, 0.09917209297418594, 0.10471707582473755, 0.11026205122470856, 0.11580703407526016, 0.12135201692581177, 0.12689699232578278, 0.13244196772575378, 0.137986958026886, 0.143531933426857, 0.149076908826828, 0.1546218991279602, 0.1601668745279312]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 3.0, 8.0, 11.0, 15.0, 12.0, 13.0, 12.0, 21.0, 31.0, 35.0, 29.0, 32.0, 37.0, 34.0, 43.0, 35.0, 42.0, 39.0, 51.0, 44.0, 42.0, 53.0, 44.0, 47.0, 30.0, 36.0, 41.0, 26.0, 21.0, 27.0, 22.0, 20.0, 14.0, 9.0, 7.0, 8.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016757488250732422, -0.016219746321439743, -0.015682004392147064, -0.015144262462854385, -0.014606520533561707, -0.014068778604269028, -0.013531036674976349, -0.01299329474568367, -0.012455552816390991, -0.011917810887098312, -0.011380068957805634, -0.010842327028512955, -0.010304585099220276, -0.009766843169927597, -0.009229101240634918, -0.00869135931134224, -0.00815361738204956, -0.007615875452756882, -0.007078133523464203, -0.006540391594171524, -0.006002649664878845, -0.005464907735586166, -0.0049271658062934875, -0.004389423877000809, -0.00385168194770813, -0.003313940018415451, -0.002776198089122772, -0.0022384561598300934, -0.0017007142305374146, -0.0011629723012447357, -0.0006252303719520569, -8.748844265937805e-05, 0.0004502534866333008, 0.0009879954159259796, 0.0015257373452186584, 0.0020634792745113373, 0.002601221203804016, 0.003138963133096695, 0.0036767050623893738, 0.004214446991682053, 0.0047521889209747314, 0.00528993085026741, 0.005827672779560089, 0.006365414708852768, 0.006903156638145447, 0.007440898567438126, 0.007978640496730804, 0.008516382426023483, 0.009054124355316162, 0.009591866284608841, 0.01012960821390152, 0.010667350143194199, 0.011205092072486877, 0.011742834001779556, 0.012280575931072235, 0.012818317860364914, 0.013356059789657593, 0.013893801718950272, 0.01443154364824295, 0.01496928557753563, 0.015507027506828308, 0.016044769436120987, 0.016582511365413666, 0.017120253294706345, 0.017657995223999023]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 9.0, 6.0, 10.0, 8.0, 7.0, 9.0, 20.0, 18.0, 22.0, 28.0, 23.0, 33.0, 33.0, 34.0, 39.0, 39.0, 44.0, 45.0, 58.0, 49.0, 48.0, 57.0, 44.0, 33.0, 28.0, 34.0, 27.0, 31.0, 29.0, 20.0, 25.0, 11.0, 13.0, 13.0, 10.0, 11.0, 7.0, 8.0, 4.0, 2.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.896484375, -3.768280029296875, -3.64007568359375, -3.511871337890625, -3.3836669921875, -3.255462646484375, -3.12725830078125, -2.999053955078125, -2.870849609375, -2.742645263671875, -2.61444091796875, -2.486236572265625, -2.3580322265625, -2.229827880859375, -2.10162353515625, -1.973419189453125, -1.84521484375, -1.717010498046875, -1.58880615234375, -1.460601806640625, -1.3323974609375, -1.204193115234375, -1.07598876953125, -0.947784423828125, -0.819580078125, -0.691375732421875, -0.56317138671875, -0.434967041015625, -0.3067626953125, -0.178558349609375, -0.05035400390625, 0.077850341796875, 0.2060546875, 0.334259033203125, 0.46246337890625, 0.590667724609375, 0.7188720703125, 0.847076416015625, 0.97528076171875, 1.103485107421875, 1.231689453125, 1.359893798828125, 1.48809814453125, 1.616302490234375, 1.7445068359375, 1.872711181640625, 2.00091552734375, 2.129119873046875, 2.25732421875, 2.385528564453125, 2.51373291015625, 2.641937255859375, 2.7701416015625, 2.898345947265625, 3.02655029296875, 3.154754638671875, 3.282958984375, 3.411163330078125, 3.53936767578125, 3.667572021484375, 3.7957763671875, 3.923980712890625, 4.05218505859375, 4.180389404296875, 4.30859375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 1.0, 2.0, 6.0, 14.0, 18.0, 27.0, 30.0, 32.0, 53.0, 57.0, 96.0, 137.0, 205.0, 300.0, 417.0, 777.0, 1419.0, 2962.0, 9700.0, 410442.0, 603140.0, 11409.0, 3380.0, 1578.0, 883.0, 491.0, 327.0, 204.0, 125.0, 94.0, 65.0, 37.0, 29.0, 20.0, 19.0, 17.0, 13.0, 8.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.828125, -19.189453125, -18.55078125, -17.912109375, -17.2734375, -16.634765625, -15.99609375, -15.357421875, -14.71875, -14.080078125, -13.44140625, -12.802734375, -12.1640625, -11.525390625, -10.88671875, -10.248046875, -9.609375, -8.970703125, -8.33203125, -7.693359375, -7.0546875, -6.416015625, -5.77734375, -5.138671875, -4.5, -3.861328125, -3.22265625, -2.583984375, -1.9453125, -1.306640625, -0.66796875, -0.029296875, 0.609375, 1.248046875, 1.88671875, 2.525390625, 3.1640625, 3.802734375, 4.44140625, 5.080078125, 5.71875, 6.357421875, 6.99609375, 7.634765625, 8.2734375, 8.912109375, 9.55078125, 10.189453125, 10.828125, 11.466796875, 12.10546875, 12.744140625, 13.3828125, 14.021484375, 14.66015625, 15.298828125, 15.9375, 16.576171875, 17.21484375, 17.853515625, 18.4921875, 19.130859375, 19.76953125, 20.408203125, 21.046875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 10.0, 6.0, 12.0, 11.0, 9.0, 6.0, 13.0, 19.0, 22.0, 26.0, 27.0, 37.0, 31.0, 31.0, 31.0, 42.0, 60.0, 125.0, 364.0, 1499.0, 133.0, 73.0, 59.0, 48.0, 45.0, 26.0, 25.0, 40.0, 23.0, 26.0, 30.0, 19.0, 20.0, 13.0, 10.0, 15.0, 12.0, 6.0, 12.0, 8.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0], "bins": [-14.75, -14.3304443359375, -13.910888671875, -13.4913330078125, -13.07177734375, -12.6522216796875, -12.232666015625, -11.8131103515625, -11.3935546875, -10.9739990234375, -10.554443359375, -10.1348876953125, -9.71533203125, -9.2957763671875, -8.876220703125, -8.4566650390625, -8.037109375, -7.6175537109375, -7.197998046875, -6.7784423828125, -6.35888671875, -5.9393310546875, -5.519775390625, -5.1002197265625, -4.6806640625, -4.2611083984375, -3.841552734375, -3.4219970703125, -3.00244140625, -2.5828857421875, -2.163330078125, -1.7437744140625, -1.32421875, -0.9046630859375, -0.485107421875, -0.0655517578125, 0.35400390625, 0.7735595703125, 1.193115234375, 1.6126708984375, 2.0322265625, 2.4517822265625, 2.871337890625, 3.2908935546875, 3.71044921875, 4.1300048828125, 4.549560546875, 4.9691162109375, 5.388671875, 5.8082275390625, 6.227783203125, 6.6473388671875, 7.06689453125, 7.4864501953125, 7.906005859375, 8.3255615234375, 8.7451171875, 9.1646728515625, 9.584228515625, 10.0037841796875, 10.42333984375, 10.8428955078125, 11.262451171875, 11.6820068359375, 12.1015625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 5.0, 2.0, 6.0, 8.0, 9.0, 13.0, 17.0, 13.0, 15.0, 27.0, 23.0, 41.0, 43.0, 70.0, 106.0, 156.0, 399.0, 1081.0, 2973.0, 9197.0, 614319.0, 2499552.0, 11925.0, 3452.0, 1253.0, 463.0, 184.0, 107.0, 65.0, 39.0, 32.0, 22.0, 14.0, 13.0, 15.0, 13.0, 9.0, 9.0, 8.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-33.84375, -32.82080078125, -31.7978515625, -30.77490234375, -29.751953125, -28.72900390625, -27.7060546875, -26.68310546875, -25.66015625, -24.63720703125, -23.6142578125, -22.59130859375, -21.568359375, -20.54541015625, -19.5224609375, -18.49951171875, -17.4765625, -16.45361328125, -15.4306640625, -14.40771484375, -13.384765625, -12.36181640625, -11.3388671875, -10.31591796875, -9.29296875, -8.27001953125, -7.2470703125, -6.22412109375, -5.201171875, -4.17822265625, -3.1552734375, -2.13232421875, -1.109375, -0.08642578125, 0.9365234375, 1.95947265625, 2.982421875, 4.00537109375, 5.0283203125, 6.05126953125, 7.07421875, 8.09716796875, 9.1201171875, 10.14306640625, 11.166015625, 12.18896484375, 13.2119140625, 14.23486328125, 15.2578125, 16.28076171875, 17.3037109375, 18.32666015625, 19.349609375, 20.37255859375, 21.3955078125, 22.41845703125, 23.44140625, 24.46435546875, 25.4873046875, 26.51025390625, 27.533203125, 28.55615234375, 29.5791015625, 30.60205078125, 31.625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 114.0, 743.0, 150.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-216.32150268554688, -211.6716766357422, -207.0218505859375, -202.3720245361328, -197.72219848632812, -193.07237243652344, -188.42254638671875, -183.772705078125, -179.12289428710938, -174.4730682373047, -169.8232421875, -165.1734161376953, -160.52359008789062, -155.87376403808594, -151.22393798828125, -146.5740966796875, -141.9242706298828, -137.27444458007812, -132.62461853027344, -127.97479248046875, -123.32496643066406, -118.67514038085938, -114.02530670166016, -109.37548065185547, -104.72565460205078, -100.0758285522461, -95.4260025024414, -90.77617645263672, -86.1263427734375, -81.47651672363281, -76.82669067382812, -72.17686462402344, -67.52702331542969, -62.877197265625, -58.22737121582031, -53.57754135131836, -48.92771530151367, -44.277889251708984, -39.62805938720703, -34.978233337402344, -30.328407287597656, -25.67858123779297, -21.02875328063965, -16.378925323486328, -11.72909927368164, -7.079273223876953, -2.429445266723633, 2.2203826904296875, 6.870208740234375, 11.520035743713379, 16.169862747192383, 20.819690704345703, 25.46951675415039, 30.119342803955078, 34.76917266845703, 39.41899871826172, 44.068824768066406, 48.718650817871094, 53.36847686767578, 58.018306732177734, 62.66813278198242, 67.31796264648438, 71.96778869628906, 76.61761474609375, 81.26744079589844]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 3.0, 6.0, 4.0, 10.0, 11.0, 8.0, 8.0, 10.0, 16.0, 17.0, 22.0, 17.0, 29.0, 37.0, 38.0, 39.0, 42.0, 38.0, 36.0, 42.0, 33.0, 52.0, 39.0, 40.0, 45.0, 39.0, 34.0, 28.0, 36.0, 33.0, 33.0, 31.0, 24.0, 17.0, 14.0, 15.0, 8.0, 10.0, 12.0, 4.0, 2.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.88842010498047, -45.42708206176758, -43.96574401855469, -42.5044059753418, -41.043067932128906, -39.581729888916016, -38.120391845703125, -36.6590576171875, -35.197715759277344, -33.73637771606445, -32.27503967285156, -30.813701629638672, -29.35236358642578, -27.89102554321289, -26.429689407348633, -24.968351364135742, -23.507015228271484, -22.045677185058594, -20.584339141845703, -19.123001098632812, -17.661663055419922, -16.20032501220703, -14.738988876342773, -13.277650833129883, -11.816312789916992, -10.354974746704102, -8.893636703491211, -7.432299613952637, -5.970961570739746, -4.5096235275268555, -3.0482864379882812, -1.5869483947753906, -0.12561416625976562, 1.335723638534546, 2.7970614433288574, 4.25839900970459, 5.7197370529174805, 7.181075096130371, 8.642412185668945, 10.103750228881836, 11.565088272094727, 13.026426315307617, 14.487764358520508, 15.949101448059082, 17.410438537597656, 18.871776580810547, 20.333114624023438, 21.794452667236328, 23.25579071044922, 24.71712875366211, 26.178466796875, 27.63980484008789, 29.10114288330078, 30.562480926513672, 32.02381896972656, 33.48515319824219, 34.946495056152344, 36.407833099365234, 37.869171142578125, 39.330509185791016, 40.791847229003906, 42.2531852722168, 43.71452331542969, 45.17585754394531, 46.6371955871582]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 10.0, 10.0, 5.0, 9.0, 11.0, 20.0, 21.0, 21.0, 28.0, 31.0, 31.0, 35.0, 36.0, 36.0, 40.0, 49.0, 42.0, 45.0, 66.0, 42.0, 46.0, 45.0, 38.0, 34.0, 29.0, 28.0, 32.0, 23.0, 23.0, 23.0, 7.0, 12.0, 15.0, 9.0, 8.0, 12.0, 5.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.09765625, -3.9661865234375, -3.834716796875, -3.7032470703125, -3.57177734375, -3.4403076171875, -3.308837890625, -3.1773681640625, -3.0458984375, -2.9144287109375, -2.782958984375, -2.6514892578125, -2.52001953125, -2.3885498046875, -2.257080078125, -2.1256103515625, -1.994140625, -1.8626708984375, -1.731201171875, -1.5997314453125, -1.46826171875, -1.3367919921875, -1.205322265625, -1.0738525390625, -0.9423828125, -0.8109130859375, -0.679443359375, -0.5479736328125, -0.41650390625, -0.2850341796875, -0.153564453125, -0.0220947265625, 0.109375, 0.2408447265625, 0.372314453125, 0.5037841796875, 0.63525390625, 0.7667236328125, 0.898193359375, 1.0296630859375, 1.1611328125, 1.2926025390625, 1.424072265625, 1.5555419921875, 1.68701171875, 1.8184814453125, 1.949951171875, 2.0814208984375, 2.212890625, 2.3443603515625, 2.475830078125, 2.6072998046875, 2.73876953125, 2.8702392578125, 3.001708984375, 3.1331787109375, 3.2646484375, 3.3961181640625, 3.527587890625, 3.6590576171875, 3.79052734375, 3.9219970703125, 4.053466796875, 4.1849365234375, 4.31640625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 7.0, 13.0, 20.0, 19.0, 35.0, 44.0, 83.0, 140.0, 259.0, 396.0, 646.0, 1294.0, 2435.0, 5017.0, 11924.0, 32546.0, 144737.0, 3452370.0, 459640.0, 52791.0, 16562.0, 6684.0, 3057.0, 1535.0, 797.0, 439.0, 288.0, 184.0, 103.0, 62.0, 44.0, 27.0, 20.0, 17.0, 11.0, 10.0, 5.0, 5.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.65625, -26.724853515625, -25.79345703125, -24.862060546875, -23.9306640625, -22.999267578125, -22.06787109375, -21.136474609375, -20.205078125, -19.273681640625, -18.34228515625, -17.410888671875, -16.4794921875, -15.548095703125, -14.61669921875, -13.685302734375, -12.75390625, -11.822509765625, -10.89111328125, -9.959716796875, -9.0283203125, -8.096923828125, -7.16552734375, -6.234130859375, -5.302734375, -4.371337890625, -3.43994140625, -2.508544921875, -1.5771484375, -0.645751953125, 0.28564453125, 1.217041015625, 2.1484375, 3.079833984375, 4.01123046875, 4.942626953125, 5.8740234375, 6.805419921875, 7.73681640625, 8.668212890625, 9.599609375, 10.531005859375, 11.46240234375, 12.393798828125, 13.3251953125, 14.256591796875, 15.18798828125, 16.119384765625, 17.05078125, 17.982177734375, 18.91357421875, 19.844970703125, 20.7763671875, 21.707763671875, 22.63916015625, 23.570556640625, 24.501953125, 25.433349609375, 26.36474609375, 27.296142578125, 28.2275390625, 29.158935546875, 30.09033203125, 31.021728515625, 31.953125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 1.0, 7.0, 6.0, 5.0, 14.0, 11.0, 22.0, 20.0, 33.0, 37.0, 44.0, 49.0, 68.0, 80.0, 132.0, 180.0, 254.0, 424.0, 607.0, 607.0, 475.0, 272.0, 176.0, 129.0, 89.0, 77.0, 58.0, 44.0, 33.0, 21.0, 20.0, 26.0, 14.0, 10.0, 10.0, 3.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.8359375, -15.3272705078125, -14.818603515625, -14.3099365234375, -13.80126953125, -13.2926025390625, -12.783935546875, -12.2752685546875, -11.7666015625, -11.2579345703125, -10.749267578125, -10.2406005859375, -9.73193359375, -9.2232666015625, -8.714599609375, -8.2059326171875, -7.697265625, -7.1885986328125, -6.679931640625, -6.1712646484375, -5.66259765625, -5.1539306640625, -4.645263671875, -4.1365966796875, -3.6279296875, -3.1192626953125, -2.610595703125, -2.1019287109375, -1.59326171875, -1.0845947265625, -0.575927734375, -0.0672607421875, 0.44140625, 0.9500732421875, 1.458740234375, 1.9674072265625, 2.47607421875, 2.9847412109375, 3.493408203125, 4.0020751953125, 4.5107421875, 5.0194091796875, 5.528076171875, 6.0367431640625, 6.54541015625, 7.0540771484375, 7.562744140625, 8.0714111328125, 8.580078125, 9.0887451171875, 9.597412109375, 10.1060791015625, 10.61474609375, 11.1234130859375, 11.632080078125, 12.1407470703125, 12.6494140625, 13.1580810546875, 13.666748046875, 14.1754150390625, 14.68408203125, 15.1927490234375, 15.701416015625, 16.2100830078125, 16.71875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 3.0, 4.0, 9.0, 16.0, 18.0, 39.0, 59.0, 83.0, 127.0, 193.0, 255.0, 454.0, 588.0, 949.0, 1514.0, 2411.0, 3890.0, 6290.0, 10617.0, 18325.0, 33722.0, 67519.0, 160691.0, 654445.0, 2364761.0, 577080.0, 149472.0, 63937.0, 32465.0, 17785.0, 10225.0, 6070.0, 3661.0, 2372.0, 1470.0, 949.0, 637.0, 374.0, 252.0, 187.0, 118.0, 89.0, 44.0, 40.0, 28.0, 13.0, 9.0, 10.0, 4.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-21.234375, -20.580322265625, -19.92626953125, -19.272216796875, -18.6181640625, -17.964111328125, -17.31005859375, -16.656005859375, -16.001953125, -15.347900390625, -14.69384765625, -14.039794921875, -13.3857421875, -12.731689453125, -12.07763671875, -11.423583984375, -10.76953125, -10.115478515625, -9.46142578125, -8.807373046875, -8.1533203125, -7.499267578125, -6.84521484375, -6.191162109375, -5.537109375, -4.883056640625, -4.22900390625, -3.574951171875, -2.9208984375, -2.266845703125, -1.61279296875, -0.958740234375, -0.3046875, 0.349365234375, 1.00341796875, 1.657470703125, 2.3115234375, 2.965576171875, 3.61962890625, 4.273681640625, 4.927734375, 5.581787109375, 6.23583984375, 6.889892578125, 7.5439453125, 8.197998046875, 8.85205078125, 9.506103515625, 10.16015625, 10.814208984375, 11.46826171875, 12.122314453125, 12.7763671875, 13.430419921875, 14.08447265625, 14.738525390625, 15.392578125, 16.046630859375, 16.70068359375, 17.354736328125, 18.0087890625, 18.662841796875, 19.31689453125, 19.970947265625, 20.625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 10.0, 20.0, 53.0, 103.0, 191.0, 242.0, 200.0, 111.0, 47.0, 22.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.7401351928711, -84.49911499023438, -77.25808715820312, -70.0170669555664, -62.77604293823242, -55.53501892089844, -48.29399871826172, -41.052974700927734, -33.81195068359375, -26.570926666259766, -19.329904556274414, -12.088882446289062, -4.847858428955078, 2.3931655883789062, 9.634185791015625, 16.87520980834961, 24.116233825683594, 31.357257843017578, 38.59828186035156, 45.83930206298828, 53.080326080322266, 60.32135009765625, 67.56237030029297, 74.80339050292969, 82.04441833496094, 89.28543853759766, 96.5264663696289, 103.76748657226562, 111.00851440429688, 118.2495346069336, 125.49055480957031, 132.73158264160156, 139.97259521484375, 147.213623046875, 154.4546356201172, 161.69566345214844, 168.9366912841797, 176.17770385742188, 183.41873168945312, 190.65975952148438, 197.90078735351562, 205.14181518554688, 212.38282775878906, 219.6238555908203, 226.86488342285156, 234.10589599609375, 241.346923828125, 248.58795166015625, 255.82896423339844, 263.0699768066406, 270.3110046386719, 277.5520324707031, 284.7930603027344, 292.0340881347656, 299.27508544921875, 306.51611328125, 313.75714111328125, 320.9981689453125, 328.23919677734375, 335.480224609375, 342.7212219238281, 349.9622497558594, 357.2032775878906, 364.4443054199219, 371.6853332519531]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 3.0, 11.0, 10.0, 18.0, 13.0, 17.0, 24.0, 15.0, 26.0, 29.0, 16.0, 50.0, 41.0, 37.0, 45.0, 35.0, 47.0, 40.0, 35.0, 39.0, 44.0, 47.0, 46.0, 40.0, 40.0, 31.0, 27.0, 32.0, 29.0, 17.0, 17.0, 12.0, 11.0, 14.0, 8.0, 13.0, 8.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-72.28639221191406, -70.28898620605469, -68.29158020019531, -66.29417419433594, -64.29676055908203, -62.299354553222656, -60.30194854736328, -58.304542541503906, -56.30713653564453, -54.309730529785156, -52.312320709228516, -50.31491470336914, -48.317508697509766, -46.320098876953125, -44.32269287109375, -42.325286865234375, -40.327877044677734, -38.33047103881836, -36.33306121826172, -34.335655212402344, -32.33824920654297, -30.34084129333496, -28.343433380126953, -26.346027374267578, -24.34861946105957, -22.351211547851562, -20.353805541992188, -18.35639762878418, -16.358989715576172, -14.361583709716797, -12.364175796508789, -10.366768836975098, -8.36935806274414, -6.371951103210449, -4.3745436668396, -2.37713623046875, -0.3797292709350586, 1.6176776885986328, 3.6150856018066406, 5.612492561340332, 7.609899520874023, 9.607306480407715, 11.604713439941406, 13.602121353149414, 15.599528312683105, 17.596935272216797, 19.594343185424805, 21.591751098632812, 23.589157104492188, 25.586565017700195, 27.58397102355957, 29.581378936767578, 31.578784942626953, 33.576194763183594, 35.57360076904297, 37.571006774902344, 39.56841278076172, 41.565818786621094, 43.563228607177734, 45.56063461303711, 47.558040618896484, 49.555450439453125, 51.5528564453125, 53.550262451171875, 55.547672271728516]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 9.0, 2.0, 11.0, 8.0, 9.0, 12.0, 19.0, 12.0, 19.0, 20.0, 23.0, 24.0, 24.0, 32.0, 29.0, 48.0, 42.0, 41.0, 45.0, 47.0, 47.0, 38.0, 35.0, 52.0, 36.0, 37.0, 39.0, 30.0, 32.0, 21.0, 28.0, 19.0, 22.0, 12.0, 16.0, 8.0, 13.0, 11.0, 2.0, 3.0, 8.0, 6.0, 4.0, 7.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.841796875, -3.703338623046875, -3.56488037109375, -3.426422119140625, -3.2879638671875, -3.149505615234375, -3.01104736328125, -2.872589111328125, -2.734130859375, -2.595672607421875, -2.45721435546875, -2.318756103515625, -2.1802978515625, -2.041839599609375, -1.90338134765625, -1.764923095703125, -1.62646484375, -1.488006591796875, -1.34954833984375, -1.211090087890625, -1.0726318359375, -0.934173583984375, -0.79571533203125, -0.657257080078125, -0.518798828125, -0.380340576171875, -0.24188232421875, -0.103424072265625, 0.0350341796875, 0.173492431640625, 0.31195068359375, 0.450408935546875, 0.5888671875, 0.727325439453125, 0.86578369140625, 1.004241943359375, 1.1427001953125, 1.281158447265625, 1.41961669921875, 1.558074951171875, 1.696533203125, 1.834991455078125, 1.97344970703125, 2.111907958984375, 2.2503662109375, 2.388824462890625, 2.52728271484375, 2.665740966796875, 2.80419921875, 2.942657470703125, 3.08111572265625, 3.219573974609375, 3.3580322265625, 3.496490478515625, 3.63494873046875, 3.773406982421875, 3.911865234375, 4.050323486328125, 4.18878173828125, 4.327239990234375, 4.4656982421875, 4.604156494140625, 4.74261474609375, 4.881072998046875, 5.01953125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 6.0, 4.0, 8.0, 9.0, 12.0, 30.0, 31.0, 35.0, 68.0, 70.0, 116.0, 192.0, 250.0, 378.0, 594.0, 799.0, 1284.0, 2009.0, 3024.0, 5229.0, 9143.0, 16587.0, 32516.0, 65838.0, 136480.0, 260354.0, 251377.0, 129554.0, 63126.0, 31180.0, 15944.0, 8584.0, 5037.0, 3104.0, 1851.0, 1256.0, 800.0, 524.0, 356.0, 256.0, 172.0, 105.0, 78.0, 56.0, 49.0, 33.0, 20.0, 8.0, 8.0, 9.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.68798828125, -0.6664657592773438, -0.6449432373046875, -0.6234207153320312, -0.601898193359375, -0.5803756713867188, -0.5588531494140625, -0.5373306274414062, -0.51580810546875, -0.49428558349609375, -0.4727630615234375, -0.45124053955078125, -0.429718017578125, -0.40819549560546875, -0.3866729736328125, -0.36515045166015625, -0.3436279296875, -0.32210540771484375, -0.3005828857421875, -0.27906036376953125, -0.257537841796875, -0.23601531982421875, -0.2144927978515625, -0.19297027587890625, -0.17144775390625, -0.14992523193359375, -0.1284027099609375, -0.10688018798828125, -0.085357666015625, -0.06383514404296875, -0.0423126220703125, -0.02079010009765625, 0.000732421875, 0.02225494384765625, 0.0437774658203125, 0.06529998779296875, 0.086822509765625, 0.10834503173828125, 0.1298675537109375, 0.15139007568359375, 0.17291259765625, 0.19443511962890625, 0.2159576416015625, 0.23748016357421875, 0.259002685546875, 0.28052520751953125, 0.3020477294921875, 0.32357025146484375, 0.3450927734375, 0.36661529541015625, 0.3881378173828125, 0.40966033935546875, 0.431182861328125, 0.45270538330078125, 0.4742279052734375, 0.49575042724609375, 0.51727294921875, 0.5387954711914062, 0.5603179931640625, 0.5818405151367188, 0.603363037109375, 0.6248855590820312, 0.6464080810546875, 0.6679306030273438, 0.689453125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 4.0, 4.0, 3.0, 10.0, 6.0, 8.0, 12.0, 20.0, 16.0, 17.0, 18.0, 25.0, 22.0, 25.0, 22.0, 31.0, 32.0, 43.0, 42.0, 42.0, 48.0, 37.0, 1063.0, 44.0, 36.0, 44.0, 35.0, 29.0, 31.0, 37.0, 30.0, 32.0, 27.0, 22.0, 26.0, 17.0, 8.0, 6.0, 13.0, 3.0, 6.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.681640625, -2.593505859375, -2.50537109375, -2.417236328125, -2.3291015625, -2.240966796875, -2.15283203125, -2.064697265625, -1.9765625, -1.888427734375, -1.80029296875, -1.712158203125, -1.6240234375, -1.535888671875, -1.44775390625, -1.359619140625, -1.271484375, -1.183349609375, -1.09521484375, -1.007080078125, -0.9189453125, -0.830810546875, -0.74267578125, -0.654541015625, -0.56640625, -0.478271484375, -0.39013671875, -0.302001953125, -0.2138671875, -0.125732421875, -0.03759765625, 0.050537109375, 0.138671875, 0.226806640625, 0.31494140625, 0.403076171875, 0.4912109375, 0.579345703125, 0.66748046875, 0.755615234375, 0.84375, 0.931884765625, 1.02001953125, 1.108154296875, 1.1962890625, 1.284423828125, 1.37255859375, 1.460693359375, 1.548828125, 1.636962890625, 1.72509765625, 1.813232421875, 1.9013671875, 1.989501953125, 2.07763671875, 2.165771484375, 2.25390625, 2.342041015625, 2.43017578125, 2.518310546875, 2.6064453125, 2.694580078125, 2.78271484375, 2.870849609375, 2.958984375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 8.0, 2.0, 7.0, 10.0, 11.0, 14.0, 35.0, 48.0, 65.0, 89.0, 116.0, 197.0, 350.0, 456.0, 645.0, 922.0, 1528.0, 2295.0, 3670.0, 5718.0, 8933.0, 13705.0, 21650.0, 34749.0, 56974.0, 96793.0, 167428.0, 1253053.0, 172313.0, 99390.0, 58106.0, 35678.0, 22527.0, 14081.0, 8906.0, 5788.0, 3751.0, 2459.0, 1570.0, 1060.0, 627.0, 476.0, 316.0, 189.0, 130.0, 97.0, 70.0, 52.0, 26.0, 20.0, 6.0, 15.0, 7.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.287841796875, -0.278411865234375, -0.26898193359375, -0.259552001953125, -0.2501220703125, -0.240692138671875, -0.23126220703125, -0.221832275390625, -0.21240234375, -0.202972412109375, -0.19354248046875, -0.184112548828125, -0.1746826171875, -0.165252685546875, -0.15582275390625, -0.146392822265625, -0.136962890625, -0.127532958984375, -0.11810302734375, -0.108673095703125, -0.0992431640625, -0.089813232421875, -0.08038330078125, -0.070953369140625, -0.0615234375, -0.052093505859375, -0.04266357421875, -0.033233642578125, -0.0238037109375, -0.014373779296875, -0.00494384765625, 0.004486083984375, 0.013916015625, 0.023345947265625, 0.03277587890625, 0.042205810546875, 0.0516357421875, 0.061065673828125, 0.07049560546875, 0.079925537109375, 0.08935546875, 0.098785400390625, 0.10821533203125, 0.117645263671875, 0.1270751953125, 0.136505126953125, 0.14593505859375, 0.155364990234375, 0.164794921875, 0.174224853515625, 0.18365478515625, 0.193084716796875, 0.2025146484375, 0.211944580078125, 0.22137451171875, 0.230804443359375, 0.240234375, 0.249664306640625, 0.25909423828125, 0.268524169921875, 0.2779541015625, 0.287384033203125, 0.29681396484375, 0.306243896484375, 0.315673828125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 7.0, 4.0, 3.0, 9.0, 11.0, 16.0, 30.0, 23.0, 28.0, 43.0, 52.0, 42.0, 95.0, 150.0, 125.0, 68.0, 48.0, 41.0, 27.0, 42.0, 22.0, 21.0, 16.0, 14.0, 14.0, 6.0, 5.0, 7.0, 4.0, 2.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0237884521484375, -0.0230405330657959, -0.022292613983154297, -0.021544694900512695, -0.020796775817871094, -0.020048856735229492, -0.01930093765258789, -0.01855301856994629, -0.017805099487304688, -0.017057180404663086, -0.016309261322021484, -0.015561342239379883, -0.014813423156738281, -0.01406550407409668, -0.013317584991455078, -0.012569665908813477, -0.011821746826171875, -0.011073827743530273, -0.010325908660888672, -0.00957798957824707, -0.008830070495605469, -0.008082151412963867, -0.007334232330322266, -0.006586313247680664, -0.0058383941650390625, -0.005090475082397461, -0.004342555999755859, -0.003594636917114258, -0.0028467178344726562, -0.0020987987518310547, -0.0013508796691894531, -0.0006029605865478516, 0.00014495849609375, 0.0008928775787353516, 0.0016407966613769531, 0.0023887157440185547, 0.0031366348266601562, 0.003884553909301758, 0.004632472991943359, 0.005380392074584961, 0.0061283111572265625, 0.006876230239868164, 0.007624149322509766, 0.008372068405151367, 0.009119987487792969, 0.00986790657043457, 0.010615825653076172, 0.011363744735717773, 0.012111663818359375, 0.012859582901000977, 0.013607501983642578, 0.01435542106628418, 0.015103340148925781, 0.015851259231567383, 0.016599178314208984, 0.017347097396850586, 0.018095016479492188, 0.01884293556213379, 0.01959085464477539, 0.020338773727416992, 0.021086692810058594, 0.021834611892700195, 0.022582530975341797, 0.0233304500579834, 0.024078369140625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 4.0, 4.0, 7.0, 3.0, 7.0, 21.0, 26.0, 23.0, 28.0, 34.0, 55.0, 75.0, 119.0, 180.0, 805.0, 18203.0, 1018891.0, 8977.0, 538.0, 166.0, 92.0, 74.0, 71.0, 41.0, 30.0, 15.0, 16.0, 12.0, 7.0, 3.0, 8.0, 0.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51123046875, -0.49442291259765625, -0.4776153564453125, -0.46080780029296875, -0.444000244140625, -0.42719268798828125, -0.4103851318359375, -0.39357757568359375, -0.37677001953125, -0.35996246337890625, -0.3431549072265625, -0.32634735107421875, -0.309539794921875, -0.29273223876953125, -0.2759246826171875, -0.25911712646484375, -0.2423095703125, -0.22550201416015625, -0.2086944580078125, -0.19188690185546875, -0.175079345703125, -0.15827178955078125, -0.1414642333984375, -0.12465667724609375, -0.10784912109375, -0.09104156494140625, -0.0742340087890625, -0.05742645263671875, -0.040618896484375, -0.02381134033203125, -0.0070037841796875, 0.00980377197265625, 0.026611328125, 0.04341888427734375, 0.0602264404296875, 0.07703399658203125, 0.093841552734375, 0.11064910888671875, 0.1274566650390625, 0.14426422119140625, 0.16107177734375, 0.17787933349609375, 0.1946868896484375, 0.21149444580078125, 0.228302001953125, 0.24510955810546875, 0.2619171142578125, 0.27872467041015625, 0.2955322265625, 0.31233978271484375, 0.3291473388671875, 0.34595489501953125, 0.362762451171875, 0.37957000732421875, 0.3963775634765625, 0.41318511962890625, 0.42999267578125, 0.44680023193359375, 0.4636077880859375, 0.48041534423828125, 0.497222900390625, 0.5140304565429688, 0.5308380126953125, 0.5476455688476562, 0.564453125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 22.0, 109.0, 556.0, 239.0, 58.0, 16.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04319857805967331, -0.03673320636153221, -0.030267834663391113, -0.023802461102604866, -0.017337089404463768, -0.01087171584367752, -0.004406344145536423, 0.0020590275526046753, 0.008524399250745773, 0.014989770948886871, 0.02145514264702797, 0.027920516207814217, 0.034385889768600464, 0.04085126146674156, 0.04731663316488266, 0.05378200486302376, 0.060247376561164856, 0.06671275198459625, 0.07317811995744705, 0.07964349538087845, 0.08610886335372925, 0.09257423877716064, 0.09903961420059204, 0.10550498217344284, 0.11197035014629364, 0.11843572556972504, 0.12490109354257584, 0.13136646151542664, 0.13783183693885803, 0.14429721236228943, 0.15076258778572083, 0.15722796320915222, 0.16369332373142242, 0.17015869915485382, 0.17662407457828522, 0.18308943510055542, 0.18955481052398682, 0.1960201859474182, 0.2024855613708496, 0.208950936794281, 0.2154162973165512, 0.2218816727399826, 0.228347048163414, 0.2348124086856842, 0.2412777841091156, 0.247743159532547, 0.2542085349559784, 0.2606739103794098, 0.2671392858028412, 0.2736046612262726, 0.280070036649704, 0.2865354120731354, 0.2930007874965668, 0.2994661331176758, 0.3059315085411072, 0.3123968839645386, 0.31886225938796997, 0.32532763481140137, 0.33179301023483276, 0.33825838565826416, 0.34472376108169556, 0.35118913650512695, 0.35765448212623596, 0.36411985754966736, 0.37058523297309875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 7.0, 3.0, 8.0, 5.0, 8.0, 10.0, 12.0, 11.0, 16.0, 18.0, 17.0, 23.0, 29.0, 33.0, 23.0, 23.0, 35.0, 37.0, 45.0, 33.0, 38.0, 40.0, 36.0, 42.0, 34.0, 40.0, 35.0, 38.0, 27.0, 28.0, 22.0, 34.0, 36.0, 29.0, 22.0, 20.0, 16.0, 18.0, 13.0, 9.0, 6.0, 11.0, 4.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.041758060455322266, -0.04040367901325226, -0.03904929757118225, -0.03769491985440254, -0.036340538412332535, -0.03498615697026253, -0.03363177925348282, -0.03227739781141281, -0.030923016369342804, -0.029568634927272797, -0.02821425534784794, -0.02685987576842308, -0.025505494326353073, -0.024151112884283066, -0.022796733304858208, -0.02144235372543335, -0.020087972283363342, -0.018733590841293335, -0.017379211261868477, -0.01602483168244362, -0.014670450240373611, -0.013316069729626179, -0.011961689218878746, -0.010607308708131313, -0.00925292819738388, -0.007898547686636448, -0.006544167175889015, -0.0051897866651415825, -0.0038354061543941498, -0.002481025643646717, -0.0011266451328992844, 0.00022773537784814835, 0.001582115888595581, 0.0029364963993430138, 0.0042908769100904465, 0.005645257420837879, 0.006999637931585312, 0.008354018442332745, 0.009708398953080177, 0.01106277946382761, 0.012417159974575043, 0.013771540485322475, 0.015125920996069908, 0.016480300575494766, 0.017834682017564774, 0.01918906345963478, 0.02054344303905964, 0.021897822618484497, 0.023252204060554504, 0.02460658550262451, 0.02596096508204937, 0.027315344661474228, 0.028669726103544235, 0.030024107545614243, 0.03137848526239395, 0.03273286670446396, 0.034087248146533966, 0.03544162958860397, 0.03679601103067398, 0.03815038874745369, 0.0395047701895237, 0.040859151631593704, 0.04221352934837341, 0.04356791079044342, 0.04492229223251343]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 9.0, 2.0, 11.0, 8.0, 9.0, 12.0, 19.0, 12.0, 19.0, 20.0, 24.0, 23.0, 24.0, 32.0, 29.0, 48.0, 41.0, 41.0, 46.0, 47.0, 47.0, 38.0, 35.0, 52.0, 36.0, 37.0, 39.0, 30.0, 32.0, 21.0, 28.0, 19.0, 22.0, 12.0, 16.0, 8.0, 13.0, 11.0, 2.0, 3.0, 8.0, 6.0, 4.0, 7.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.841796875, -3.703338623046875, -3.56488037109375, -3.426422119140625, -3.2879638671875, -3.149505615234375, -3.01104736328125, -2.872589111328125, -2.734130859375, -2.595672607421875, -2.45721435546875, -2.318756103515625, -2.1802978515625, -2.041839599609375, -1.90338134765625, -1.764923095703125, -1.62646484375, -1.488006591796875, -1.34954833984375, -1.211090087890625, -1.0726318359375, -0.934173583984375, -0.79571533203125, -0.657257080078125, -0.518798828125, -0.380340576171875, -0.24188232421875, -0.103424072265625, 0.0350341796875, 0.173492431640625, 0.31195068359375, 0.450408935546875, 0.5888671875, 0.727325439453125, 0.86578369140625, 1.004241943359375, 1.1427001953125, 1.281158447265625, 1.41961669921875, 1.558074951171875, 1.696533203125, 1.834991455078125, 1.97344970703125, 2.111907958984375, 2.2503662109375, 2.388824462890625, 2.52728271484375, 2.665740966796875, 2.80419921875, 2.942657470703125, 3.08111572265625, 3.219573974609375, 3.3580322265625, 3.496490478515625, 3.63494873046875, 3.773406982421875, 3.911865234375, 4.050323486328125, 4.18878173828125, 4.327239990234375, 4.4656982421875, 4.604156494140625, 4.74261474609375, 4.881072998046875, 5.01953125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 5.0, 10.0, 12.0, 12.0, 22.0, 18.0, 33.0, 77.0, 77.0, 99.0, 175.0, 220.0, 283.0, 428.0, 581.0, 905.0, 1397.0, 2037.0, 3464.0, 5797.0, 15716.0, 705206.0, 286365.0, 11304.0, 5283.0, 3187.0, 1912.0, 1274.0, 796.0, 541.0, 382.0, 249.0, 182.0, 146.0, 93.0, 67.0, 44.0, 46.0, 27.0, 20.0, 16.0, 11.0, 8.0, 9.0, 5.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.921875, -18.3466796875, -17.771484375, -17.1962890625, -16.62109375, -16.0458984375, -15.470703125, -14.8955078125, -14.3203125, -13.7451171875, -13.169921875, -12.5947265625, -12.01953125, -11.4443359375, -10.869140625, -10.2939453125, -9.71875, -9.1435546875, -8.568359375, -7.9931640625, -7.41796875, -6.8427734375, -6.267578125, -5.6923828125, -5.1171875, -4.5419921875, -3.966796875, -3.3916015625, -2.81640625, -2.2412109375, -1.666015625, -1.0908203125, -0.515625, 0.0595703125, 0.634765625, 1.2099609375, 1.78515625, 2.3603515625, 2.935546875, 3.5107421875, 4.0859375, 4.6611328125, 5.236328125, 5.8115234375, 6.38671875, 6.9619140625, 7.537109375, 8.1123046875, 8.6875, 9.2626953125, 9.837890625, 10.4130859375, 10.98828125, 11.5634765625, 12.138671875, 12.7138671875, 13.2890625, 13.8642578125, 14.439453125, 15.0146484375, 15.58984375, 16.1650390625, 16.740234375, 17.3154296875, 17.890625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 9.0, 15.0, 13.0, 10.0, 24.0, 15.0, 20.0, 31.0, 31.0, 29.0, 43.0, 45.0, 50.0, 60.0, 80.0, 147.0, 1782.0, 156.0, 60.0, 59.0, 53.0, 40.0, 34.0, 38.0, 26.0, 28.0, 18.0, 32.0, 10.0, 9.0, 13.0, 13.0, 7.0, 6.0, 6.0, 7.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5234375, -13.9757080078125, -13.427978515625, -12.8802490234375, -12.33251953125, -11.7847900390625, -11.237060546875, -10.6893310546875, -10.1416015625, -9.5938720703125, -9.046142578125, -8.4984130859375, -7.95068359375, -7.4029541015625, -6.855224609375, -6.3074951171875, -5.759765625, -5.2120361328125, -4.664306640625, -4.1165771484375, -3.56884765625, -3.0211181640625, -2.473388671875, -1.9256591796875, -1.3779296875, -0.8302001953125, -0.282470703125, 0.2652587890625, 0.81298828125, 1.3607177734375, 1.908447265625, 2.4561767578125, 3.00390625, 3.5516357421875, 4.099365234375, 4.6470947265625, 5.19482421875, 5.7425537109375, 6.290283203125, 6.8380126953125, 7.3857421875, 7.9334716796875, 8.481201171875, 9.0289306640625, 9.57666015625, 10.1243896484375, 10.672119140625, 11.2198486328125, 11.767578125, 12.3153076171875, 12.863037109375, 13.4107666015625, 13.95849609375, 14.5062255859375, 15.053955078125, 15.6016845703125, 16.1494140625, 16.6971435546875, 17.244873046875, 17.7926025390625, 18.34033203125, 18.8880615234375, 19.435791015625, 19.9835205078125, 20.53125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 8.0, 7.0, 4.0, 6.0, 10.0, 10.0, 9.0, 15.0, 12.0, 26.0, 27.0, 35.0, 71.0, 106.0, 227.0, 430.0, 926.0, 1949.0, 4255.0, 11340.0, 60176.0, 2969445.0, 75349.0, 12444.0, 4788.0, 2010.0, 1027.0, 445.0, 214.0, 108.0, 65.0, 39.0, 20.0, 23.0, 15.0, 15.0, 10.0, 14.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0], "bins": [-31.34375, -30.48583984375, -29.6279296875, -28.77001953125, -27.912109375, -27.05419921875, -26.1962890625, -25.33837890625, -24.48046875, -23.62255859375, -22.7646484375, -21.90673828125, -21.048828125, -20.19091796875, -19.3330078125, -18.47509765625, -17.6171875, -16.75927734375, -15.9013671875, -15.04345703125, -14.185546875, -13.32763671875, -12.4697265625, -11.61181640625, -10.75390625, -9.89599609375, -9.0380859375, -8.18017578125, -7.322265625, -6.46435546875, -5.6064453125, -4.74853515625, -3.890625, -3.03271484375, -2.1748046875, -1.31689453125, -0.458984375, 0.39892578125, 1.2568359375, 2.11474609375, 2.97265625, 3.83056640625, 4.6884765625, 5.54638671875, 6.404296875, 7.26220703125, 8.1201171875, 8.97802734375, 9.8359375, 10.69384765625, 11.5517578125, 12.40966796875, 13.267578125, 14.12548828125, 14.9833984375, 15.84130859375, 16.69921875, 17.55712890625, 18.4150390625, 19.27294921875, 20.130859375, 20.98876953125, 21.8466796875, 22.70458984375, 23.5625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 16.0, 68.0, 209.0, 394.0, 247.0, 64.0, 12.0, 7.0], "bins": [-183.8159942626953, -180.72845458984375, -177.6409149169922, -174.55337524414062, -171.46583557128906, -168.3782958984375, -165.29075622558594, -162.20321655273438, -159.1156768798828, -156.02813720703125, -152.9405975341797, -149.85305786132812, -146.76551818847656, -143.677978515625, -140.59043884277344, -137.50289916992188, -134.41537475585938, -131.3278350830078, -128.24029541015625, -125.15275573730469, -122.06521606445312, -118.97767639160156, -115.89013671875, -112.80260467529297, -109.71505737304688, -106.62751770019531, -103.53997802734375, -100.45243835449219, -97.36489868164062, -94.27735900878906, -91.1898193359375, -88.10228729248047, -85.01473999023438, -81.92720031738281, -78.83966064453125, -75.75212097167969, -72.66458129882812, -69.57704162597656, -66.489501953125, -63.40196990966797, -60.314430236816406, -57.226890563964844, -54.13935089111328, -51.05181121826172, -47.96427536010742, -44.87673568725586, -41.7891960144043, -38.70166015625, -35.61412048339844, -32.526580810546875, -29.439043045043945, -26.351503372192383, -23.263965606689453, -20.17642593383789, -17.088886260986328, -14.001348495483398, -10.913806915283203, -7.826268196105957, -4.738729000091553, -1.6511898040771484, 1.4363489151000977, 4.523887634277344, 7.611427307128906, 10.698965072631836, 13.786504745483398]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 4.0, 13.0, 9.0, 10.0, 12.0, 17.0, 21.0, 12.0, 25.0, 18.0, 22.0, 20.0, 35.0, 33.0, 30.0, 37.0, 39.0, 49.0, 42.0, 43.0, 37.0, 42.0, 36.0, 48.0, 33.0, 31.0, 28.0, 28.0, 24.0, 35.0, 26.0, 19.0, 19.0, 14.0, 15.0, 9.0, 12.0, 8.0, 13.0, 7.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-46.28564453125, -44.646331787109375, -43.00701904296875, -41.367706298828125, -39.7283935546875, -38.089080810546875, -36.449771881103516, -34.81045913696289, -33.171146392822266, -31.53183364868164, -29.892520904541016, -28.253210067749023, -26.6138973236084, -24.974584579467773, -23.33527374267578, -21.695960998535156, -20.05664825439453, -18.417335510253906, -16.77802276611328, -15.138711929321289, -13.499399185180664, -11.860086441040039, -10.22077465057373, -8.581462860107422, -6.942150115966797, -5.30283784866333, -3.6635255813598633, -2.0242133140563965, -0.3849010467529297, 1.2544116973876953, 2.893723487854004, 4.5330352783203125, 6.1723480224609375, 7.811660289764404, 9.450972557067871, 11.09028434753418, 12.729597091674805, 14.36890983581543, 16.008220672607422, 17.647533416748047, 19.286846160888672, 20.926158905029297, 22.565471649169922, 24.204782485961914, 25.84409523010254, 27.483407974243164, 29.122718811035156, 30.76203155517578, 32.401344299316406, 34.04065704345703, 35.679969787597656, 37.31928253173828, 38.958595275878906, 40.59790802001953, 42.23721694946289, 43.876529693603516, 45.51584243774414, 47.155155181884766, 48.79446792602539, 50.433780670166016, 52.073089599609375, 53.71240234375, 55.351715087890625, 56.99102783203125, 58.630340576171875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 3.0, 6.0, 8.0, 15.0, 3.0, 14.0, 15.0, 16.0, 27.0, 12.0, 17.0, 32.0, 32.0, 24.0, 35.0, 35.0, 45.0, 42.0, 41.0, 47.0, 47.0, 39.0, 46.0, 34.0, 36.0, 48.0, 33.0, 25.0, 26.0, 29.0, 27.0, 21.0, 19.0, 15.0, 13.0, 10.0, 13.0, 13.0, 4.0, 5.0, 5.0, 8.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.75, -3.6099853515625, -3.469970703125, -3.3299560546875, -3.18994140625, -3.0499267578125, -2.909912109375, -2.7698974609375, -2.6298828125, -2.4898681640625, -2.349853515625, -2.2098388671875, -2.06982421875, -1.9298095703125, -1.789794921875, -1.6497802734375, -1.509765625, -1.3697509765625, -1.229736328125, -1.0897216796875, -0.94970703125, -0.8096923828125, -0.669677734375, -0.5296630859375, -0.3896484375, -0.2496337890625, -0.109619140625, 0.0303955078125, 0.17041015625, 0.3104248046875, 0.450439453125, 0.5904541015625, 0.73046875, 0.8704833984375, 1.010498046875, 1.1505126953125, 1.29052734375, 1.4305419921875, 1.570556640625, 1.7105712890625, 1.8505859375, 1.9906005859375, 2.130615234375, 2.2706298828125, 2.41064453125, 2.5506591796875, 2.690673828125, 2.8306884765625, 2.970703125, 3.1107177734375, 3.250732421875, 3.3907470703125, 3.53076171875, 3.6707763671875, 3.810791015625, 3.9508056640625, 4.0908203125, 4.2308349609375, 4.370849609375, 4.5108642578125, 4.65087890625, 4.7908935546875, 4.930908203125, 5.0709228515625, 5.2109375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 4.0, 4.0, 7.0, 5.0, 2.0, 18.0, 19.0, 31.0, 46.0, 67.0, 105.0, 173.0, 345.0, 519.0, 939.0, 1637.0, 3260.0, 6545.0, 15112.0, 41213.0, 194738.0, 3323244.0, 507179.0, 62338.0, 20150.0, 8180.0, 3904.0, 1917.0, 1078.0, 594.0, 308.0, 201.0, 129.0, 84.0, 48.0, 29.0, 28.0, 24.0, 19.0, 11.0, 8.0, 10.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-24.765625, -23.9833984375, -23.201171875, -22.4189453125, -21.63671875, -20.8544921875, -20.072265625, -19.2900390625, -18.5078125, -17.7255859375, -16.943359375, -16.1611328125, -15.37890625, -14.5966796875, -13.814453125, -13.0322265625, -12.25, -11.4677734375, -10.685546875, -9.9033203125, -9.12109375, -8.3388671875, -7.556640625, -6.7744140625, -5.9921875, -5.2099609375, -4.427734375, -3.6455078125, -2.86328125, -2.0810546875, -1.298828125, -0.5166015625, 0.265625, 1.0478515625, 1.830078125, 2.6123046875, 3.39453125, 4.1767578125, 4.958984375, 5.7412109375, 6.5234375, 7.3056640625, 8.087890625, 8.8701171875, 9.65234375, 10.4345703125, 11.216796875, 11.9990234375, 12.78125, 13.5634765625, 14.345703125, 15.1279296875, 15.91015625, 16.6923828125, 17.474609375, 18.2568359375, 19.0390625, 19.8212890625, 20.603515625, 21.3857421875, 22.16796875, 22.9501953125, 23.732421875, 24.5146484375, 25.296875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 3.0, 5.0, 2.0, 6.0, 17.0, 22.0, 13.0, 30.0, 35.0, 42.0, 65.0, 59.0, 114.0, 165.0, 291.0, 506.0, 734.0, 691.0, 393.0, 272.0, 167.0, 104.0, 81.0, 79.0, 44.0, 31.0, 29.0, 13.0, 20.0, 13.0, 11.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.953125, -20.35302734375, -19.7529296875, -19.15283203125, -18.552734375, -17.95263671875, -17.3525390625, -16.75244140625, -16.15234375, -15.55224609375, -14.9521484375, -14.35205078125, -13.751953125, -13.15185546875, -12.5517578125, -11.95166015625, -11.3515625, -10.75146484375, -10.1513671875, -9.55126953125, -8.951171875, -8.35107421875, -7.7509765625, -7.15087890625, -6.55078125, -5.95068359375, -5.3505859375, -4.75048828125, -4.150390625, -3.55029296875, -2.9501953125, -2.35009765625, -1.75, -1.14990234375, -0.5498046875, 0.05029296875, 0.650390625, 1.25048828125, 1.8505859375, 2.45068359375, 3.05078125, 3.65087890625, 4.2509765625, 4.85107421875, 5.451171875, 6.05126953125, 6.6513671875, 7.25146484375, 7.8515625, 8.45166015625, 9.0517578125, 9.65185546875, 10.251953125, 10.85205078125, 11.4521484375, 12.05224609375, 12.65234375, 13.25244140625, 13.8525390625, 14.45263671875, 15.052734375, 15.65283203125, 16.2529296875, 16.85302734375, 17.453125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 7.0, 9.0, 16.0, 22.0, 38.0, 59.0, 85.0, 197.0, 331.0, 578.0, 1030.0, 1994.0, 3894.0, 7796.0, 17017.0, 42084.0, 128873.0, 830890.0, 2717785.0, 313031.0, 76043.0, 28278.0, 12161.0, 5726.0, 2911.0, 1501.0, 837.0, 484.0, 254.0, 145.0, 79.0, 49.0, 27.0, 23.0, 10.0, 9.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.125, -26.166015625, -25.20703125, -24.248046875, -23.2890625, -22.330078125, -21.37109375, -20.412109375, -19.453125, -18.494140625, -17.53515625, -16.576171875, -15.6171875, -14.658203125, -13.69921875, -12.740234375, -11.78125, -10.822265625, -9.86328125, -8.904296875, -7.9453125, -6.986328125, -6.02734375, -5.068359375, -4.109375, -3.150390625, -2.19140625, -1.232421875, -0.2734375, 0.685546875, 1.64453125, 2.603515625, 3.5625, 4.521484375, 5.48046875, 6.439453125, 7.3984375, 8.357421875, 9.31640625, 10.275390625, 11.234375, 12.193359375, 13.15234375, 14.111328125, 15.0703125, 16.029296875, 16.98828125, 17.947265625, 18.90625, 19.865234375, 20.82421875, 21.783203125, 22.7421875, 23.701171875, 24.66015625, 25.619140625, 26.578125, 27.537109375, 28.49609375, 29.455078125, 30.4140625, 31.373046875, 32.33203125, 33.291015625, 34.25]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 11.0, 20.0, 43.0, 43.0, 85.0, 143.0, 166.0, 165.0, 106.0, 90.0, 60.0, 30.0, 23.0, 13.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-208.4460906982422, -203.45620727539062, -198.46632385253906, -193.4764404296875, -188.48655700683594, -183.49667358398438, -178.5067901611328, -173.51690673828125, -168.52703857421875, -163.5371551513672, -158.54727172851562, -153.55738830566406, -148.5675048828125, -143.57762145996094, -138.58773803710938, -133.59786987304688, -128.60797119140625, -123.61808776855469, -118.62820434570312, -113.63832092285156, -108.6484375, -103.65855407714844, -98.6686782836914, -93.67879486083984, -88.68891143798828, -83.69902801513672, -78.70914459228516, -73.7192611694336, -68.72938537597656, -63.739498138427734, -58.74961853027344, -53.759735107421875, -48.76984405517578, -43.77996063232422, -38.790077209472656, -33.80019760131836, -28.810314178466797, -23.820430755615234, -18.830549240112305, -13.840667724609375, -8.850784301757812, -3.8609018325805664, 1.1289806365966797, 6.118863105773926, 11.108745574951172, 16.098628997802734, 21.088510513305664, 26.078392028808594, 31.068275451660156, 36.05815887451172, 41.04804229736328, 46.03792190551758, 51.02780532836914, 56.0176887512207, 61.007568359375, 65.99745178222656, 70.98733520507812, 75.97721862792969, 80.96710205078125, 85.95698547363281, 90.94686889648438, 95.93675231933594, 100.92662811279297, 105.91651153564453, 110.9063949584961]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 9.0, 10.0, 11.0, 13.0, 12.0, 16.0, 16.0, 19.0, 25.0, 21.0, 29.0, 38.0, 25.0, 33.0, 28.0, 40.0, 34.0, 40.0, 48.0, 43.0, 39.0, 25.0, 48.0, 42.0, 44.0, 40.0, 41.0, 28.0, 28.0, 24.0, 21.0, 23.0, 13.0, 16.0, 15.0, 9.0, 15.0, 6.0, 4.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-57.133670806884766, -55.37603759765625, -53.61840057373047, -51.86076354980469, -50.10313034057617, -48.345497131347656, -46.587860107421875, -44.830223083496094, -43.07258987426758, -41.31495666503906, -39.55731964111328, -37.7996826171875, -36.042049407958984, -34.28441619873047, -32.52677917480469, -30.76914405822754, -29.01150894165039, -27.253873825073242, -25.496238708496094, -23.738603591918945, -21.980968475341797, -20.22333335876465, -18.4656982421875, -16.70806312561035, -14.950428009033203, -13.192792892456055, -11.435157775878906, -9.677522659301758, -7.919887542724609, -6.162252426147461, -4.4046173095703125, -2.646982192993164, -0.8893470764160156, 0.8682880401611328, 2.6259231567382812, 4.38355827331543, 6.141193389892578, 7.898828506469727, 9.656463623046875, 11.414098739624023, 13.171733856201172, 14.92936897277832, 16.68700408935547, 18.444639205932617, 20.202274322509766, 21.959909439086914, 23.717544555664062, 25.47517967224121, 27.23281478881836, 28.990449905395508, 30.748085021972656, 32.50572204589844, 34.26335525512695, 36.02098846435547, 37.77862548828125, 39.53626251220703, 41.29389572143555, 43.05152893066406, 44.809165954589844, 46.566802978515625, 48.32443618774414, 50.082069396972656, 51.83970642089844, 53.59734344482422, 55.354976654052734]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 4.0, 5.0, 0.0, 3.0, 6.0, 9.0, 12.0, 11.0, 7.0, 17.0, 15.0, 17.0, 23.0, 24.0, 28.0, 21.0, 25.0, 26.0, 35.0, 33.0, 32.0, 34.0, 36.0, 48.0, 40.0, 39.0, 36.0, 25.0, 44.0, 33.0, 29.0, 39.0, 31.0, 27.0, 24.0, 17.0, 16.0, 25.0, 12.0, 10.0, 14.0, 14.0, 14.0, 7.0, 8.0, 6.0, 5.0, 11.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.05078125, -3.9110107421875, -3.771240234375, -3.6314697265625, -3.49169921875, -3.3519287109375, -3.212158203125, -3.0723876953125, -2.9326171875, -2.7928466796875, -2.653076171875, -2.5133056640625, -2.37353515625, -2.2337646484375, -2.093994140625, -1.9542236328125, -1.814453125, -1.6746826171875, -1.534912109375, -1.3951416015625, -1.25537109375, -1.1156005859375, -0.975830078125, -0.8360595703125, -0.6962890625, -0.5565185546875, -0.416748046875, -0.2769775390625, -0.13720703125, 0.0025634765625, 0.142333984375, 0.2821044921875, 0.421875, 0.5616455078125, 0.701416015625, 0.8411865234375, 0.98095703125, 1.1207275390625, 1.260498046875, 1.4002685546875, 1.5400390625, 1.6798095703125, 1.819580078125, 1.9593505859375, 2.09912109375, 2.2388916015625, 2.378662109375, 2.5184326171875, 2.658203125, 2.7979736328125, 2.937744140625, 3.0775146484375, 3.21728515625, 3.3570556640625, 3.496826171875, 3.6365966796875, 3.7763671875, 3.9161376953125, 4.055908203125, 4.1956787109375, 4.33544921875, 4.4752197265625, 4.614990234375, 4.7547607421875, 4.89453125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 14.0, 15.0, 22.0, 35.0, 52.0, 54.0, 107.0, 137.0, 234.0, 331.0, 553.0, 905.0, 1398.0, 2376.0, 3908.0, 6875.0, 12767.0, 24757.0, 49987.0, 108597.0, 229573.0, 293144.0, 162490.0, 74775.0, 34981.0, 17618.0, 9632.0, 5263.0, 3031.0, 1760.0, 1091.0, 749.0, 447.0, 286.0, 190.0, 123.0, 85.0, 62.0, 39.0, 28.0, 21.0, 8.0, 12.0, 7.0, 1.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.84521484375, -0.8198013305664062, -0.7943878173828125, -0.7689743041992188, -0.743560791015625, -0.7181472778320312, -0.6927337646484375, -0.6673202514648438, -0.64190673828125, -0.6164932250976562, -0.5910797119140625, -0.5656661987304688, -0.540252685546875, -0.5148391723632812, -0.4894256591796875, -0.46401214599609375, -0.4385986328125, -0.41318511962890625, -0.3877716064453125, -0.36235809326171875, -0.336944580078125, -0.31153106689453125, -0.2861175537109375, -0.26070404052734375, -0.23529052734375, -0.20987701416015625, -0.1844635009765625, -0.15904998779296875, -0.133636474609375, -0.10822296142578125, -0.0828094482421875, -0.05739593505859375, -0.031982421875, -0.00656890869140625, 0.0188446044921875, 0.04425811767578125, 0.069671630859375, 0.09508514404296875, 0.1204986572265625, 0.14591217041015625, 0.17132568359375, 0.19673919677734375, 0.2221527099609375, 0.24756622314453125, 0.272979736328125, 0.29839324951171875, 0.3238067626953125, 0.34922027587890625, 0.3746337890625, 0.40004730224609375, 0.4254608154296875, 0.45087432861328125, 0.476287841796875, 0.5017013549804688, 0.5271148681640625, 0.5525283813476562, 0.57794189453125, 0.6033554077148438, 0.6287689208984375, 0.6541824340820312, 0.679595947265625, 0.7050094604492188, 0.7304229736328125, 0.7558364868164062, 0.78125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 2.0, 1.0, 4.0, 3.0, 7.0, 9.0, 8.0, 17.0, 16.0, 18.0, 18.0, 21.0, 26.0, 28.0, 32.0, 21.0, 32.0, 35.0, 35.0, 43.0, 47.0, 31.0, 35.0, 1057.0, 50.0, 39.0, 44.0, 40.0, 27.0, 24.0, 27.0, 36.0, 31.0, 23.0, 19.0, 26.0, 20.0, 11.0, 12.0, 12.0, 5.0, 8.0, 13.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.228515625, -3.12896728515625, -3.0294189453125, -2.92987060546875, -2.830322265625, -2.73077392578125, -2.6312255859375, -2.53167724609375, -2.43212890625, -2.33258056640625, -2.2330322265625, -2.13348388671875, -2.033935546875, -1.93438720703125, -1.8348388671875, -1.73529052734375, -1.6357421875, -1.53619384765625, -1.4366455078125, -1.33709716796875, -1.237548828125, -1.13800048828125, -1.0384521484375, -0.93890380859375, -0.83935546875, -0.73980712890625, -0.6402587890625, -0.54071044921875, -0.441162109375, -0.34161376953125, -0.2420654296875, -0.14251708984375, -0.04296875, 0.05657958984375, 0.1561279296875, 0.25567626953125, 0.355224609375, 0.45477294921875, 0.5543212890625, 0.65386962890625, 0.75341796875, 0.85296630859375, 0.9525146484375, 1.05206298828125, 1.151611328125, 1.25115966796875, 1.3507080078125, 1.45025634765625, 1.5498046875, 1.64935302734375, 1.7489013671875, 1.84844970703125, 1.947998046875, 2.04754638671875, 2.1470947265625, 2.24664306640625, 2.34619140625, 2.44573974609375, 2.5452880859375, 2.64483642578125, 2.744384765625, 2.84393310546875, 2.9434814453125, 3.04302978515625, 3.142578125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 6.0, 9.0, 7.0, 10.0, 19.0, 26.0, 38.0, 50.0, 89.0, 123.0, 183.0, 285.0, 385.0, 641.0, 820.0, 1280.0, 1889.0, 2879.0, 4254.0, 6424.0, 9418.0, 14609.0, 22916.0, 35865.0, 57745.0, 95520.0, 155039.0, 1232956.0, 174828.0, 104010.0, 63610.0, 39045.0, 25054.0, 15914.0, 10328.0, 6958.0, 4477.0, 3065.0, 2037.0, 1396.0, 949.0, 629.0, 448.0, 271.0, 204.0, 150.0, 81.0, 70.0, 50.0, 27.0, 18.0, 13.0, 7.0, 10.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.279052734375, -0.2699317932128906, -0.26081085205078125, -0.2516899108886719, -0.2425689697265625, -0.23344802856445312, -0.22432708740234375, -0.21520614624023438, -0.206085205078125, -0.19696426391601562, -0.18784332275390625, -0.17872238159179688, -0.1696014404296875, -0.16048049926757812, -0.15135955810546875, -0.14223861694335938, -0.13311767578125, -0.12399673461914062, -0.11487579345703125, -0.10575485229492188, -0.0966339111328125, -0.08751296997070312, -0.07839202880859375, -0.06927108764648438, -0.060150146484375, -0.051029205322265625, -0.04190826416015625, -0.032787322998046875, -0.0236663818359375, -0.014545440673828125, -0.00542449951171875, 0.003696441650390625, 0.0128173828125, 0.021938323974609375, 0.03105926513671875, 0.040180206298828125, 0.0493011474609375, 0.058422088623046875, 0.06754302978515625, 0.07666397094726562, 0.085784912109375, 0.09490585327148438, 0.10402679443359375, 0.11314773559570312, 0.1222686767578125, 0.13138961791992188, 0.14051055908203125, 0.14963150024414062, 0.15875244140625, 0.16787338256835938, 0.17699432373046875, 0.18611526489257812, 0.1952362060546875, 0.20435714721679688, 0.21347808837890625, 0.22259902954101562, 0.231719970703125, 0.24084091186523438, 0.24996185302734375, 0.2590827941894531, 0.2682037353515625, 0.2773246765136719, 0.28644561767578125, 0.2955665588378906, 0.3046875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 8.0, 1.0, 1.0, 8.0, 2.0, 8.0, 11.0, 13.0, 16.0, 13.0, 21.0, 33.0, 29.0, 27.0, 46.0, 38.0, 41.0, 50.0, 119.0, 90.0, 67.0, 34.0, 33.0, 45.0, 28.0, 35.0, 19.0, 22.0, 17.0, 20.0, 15.0, 13.0, 9.0, 14.0, 10.0, 10.0, 5.0, 5.0, 4.0, 4.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0244598388671875, -0.023715496063232422, -0.022971153259277344, -0.022226810455322266, -0.021482467651367188, -0.02073812484741211, -0.01999378204345703, -0.019249439239501953, -0.018505096435546875, -0.017760753631591797, -0.01701641082763672, -0.01627206802368164, -0.015527725219726562, -0.014783382415771484, -0.014039039611816406, -0.013294696807861328, -0.01255035400390625, -0.011806011199951172, -0.011061668395996094, -0.010317325592041016, -0.009572982788085938, -0.00882863998413086, -0.008084297180175781, -0.007339954376220703, -0.006595611572265625, -0.005851268768310547, -0.005106925964355469, -0.004362583160400391, -0.0036182403564453125, -0.0028738975524902344, -0.0021295547485351562, -0.0013852119445800781, -0.000640869140625, 0.00010347366333007812, 0.0008478164672851562, 0.0015921592712402344, 0.0023365020751953125, 0.0030808448791503906, 0.0038251876831054688, 0.004569530487060547, 0.005313873291015625, 0.006058216094970703, 0.006802558898925781, 0.007546901702880859, 0.008291244506835938, 0.009035587310791016, 0.009779930114746094, 0.010524272918701172, 0.01126861572265625, 0.012012958526611328, 0.012757301330566406, 0.013501644134521484, 0.014245986938476562, 0.01499032974243164, 0.01573467254638672, 0.016479015350341797, 0.017223358154296875, 0.017967700958251953, 0.01871204376220703, 0.01945638656616211, 0.020200729370117188, 0.020945072174072266, 0.021689414978027344, 0.022433757781982422, 0.0231781005859375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 8.0, 5.0, 7.0, 7.0, 7.0, 15.0, 17.0, 15.0, 11.0, 27.0, 23.0, 35.0, 55.0, 79.0, 121.0, 217.0, 609.0, 43068.0, 1001662.0, 1706.0, 315.0, 203.0, 92.0, 81.0, 50.0, 29.0, 27.0, 17.0, 9.0, 5.0, 6.0, 6.0, 6.0, 2.0, 0.0, 7.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.61376953125, -0.5941085815429688, -0.5744476318359375, -0.5547866821289062, -0.535125732421875, -0.5154647827148438, -0.4958038330078125, -0.47614288330078125, -0.45648193359375, -0.43682098388671875, -0.4171600341796875, -0.39749908447265625, -0.377838134765625, -0.35817718505859375, -0.3385162353515625, -0.31885528564453125, -0.2991943359375, -0.27953338623046875, -0.2598724365234375, -0.24021148681640625, -0.220550537109375, -0.20088958740234375, -0.1812286376953125, -0.16156768798828125, -0.14190673828125, -0.12224578857421875, -0.1025848388671875, -0.08292388916015625, -0.063262939453125, -0.04360198974609375, -0.0239410400390625, -0.00428009033203125, 0.015380859375, 0.03504180908203125, 0.0547027587890625, 0.07436370849609375, 0.094024658203125, 0.11368560791015625, 0.1333465576171875, 0.15300750732421875, 0.17266845703125, 0.19232940673828125, 0.2119903564453125, 0.23165130615234375, 0.251312255859375, 0.27097320556640625, 0.2906341552734375, 0.31029510498046875, 0.3299560546875, 0.34961700439453125, 0.3692779541015625, 0.38893890380859375, 0.408599853515625, 0.42826080322265625, 0.4479217529296875, 0.46758270263671875, 0.48724365234375, 0.5069046020507812, 0.5265655517578125, 0.5462265014648438, 0.565887451171875, 0.5855484008789062, 0.6052093505859375, 0.6248703002929688, 0.64453125]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 7.0, 28.0, 76.0, 426.0, 331.0, 92.0, 30.0, 14.0, 8.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03435846418142319, -0.027344107627868652, -0.020329751074314117, -0.013315392658114433, -0.006301036104559898, 0.0007133223116397858, 0.007727678865194321, 0.014742035418748856, 0.02175639197230339, 0.028770748525857925, 0.03578510507941246, 0.042799465358257294, 0.04981382191181183, 0.056828178465366364, 0.0638425350189209, 0.07085689157247543, 0.07787124812602997, 0.0848856046795845, 0.09189996123313904, 0.09891431778669357, 0.10592867434024811, 0.11294303834438324, 0.11995738744735718, 0.1269717514514923, 0.13398610055446625, 0.14100046455860138, 0.14801481366157532, 0.15502917766571045, 0.1620435267686844, 0.16905789077281952, 0.17607223987579346, 0.1830866038799286, 0.19010095298290253, 0.19711531698703766, 0.2041296660900116, 0.21114403009414673, 0.21815837919712067, 0.2251727432012558, 0.23218709230422974, 0.23920145630836487, 0.2462158054113388, 0.25323015451431274, 0.2602445185184479, 0.267258882522583, 0.27427324652671814, 0.2812875807285309, 0.288301944732666, 0.29531630873680115, 0.3023306727409363, 0.3093450367450714, 0.31635940074920654, 0.3233737349510193, 0.3303880989551544, 0.33740246295928955, 0.3444168269634247, 0.3514311611652374, 0.35844552516937256, 0.3654598891735077, 0.3724742531776428, 0.37948858737945557, 0.3865029513835907, 0.39351731538772583, 0.40053167939186096, 0.4075460135936737, 0.41456037759780884]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 10.0, 7.0, 6.0, 10.0, 11.0, 11.0, 10.0, 9.0, 15.0, 17.0, 13.0, 21.0, 28.0, 40.0, 35.0, 27.0, 38.0, 34.0, 40.0, 36.0, 36.0, 45.0, 43.0, 37.0, 26.0, 42.0, 26.0, 24.0, 34.0, 35.0, 31.0, 24.0, 28.0, 26.0, 22.0, 21.0, 14.0, 13.0, 15.0, 13.0, 6.0, 8.0, 4.0, 5.0, 7.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0731077790260315, -0.0709151029586792, -0.0687224268913269, -0.06652975082397461, -0.06433707475662231, -0.06214439496397972, -0.05995171517133713, -0.05775903910398483, -0.05556636303663254, -0.05337368696928024, -0.05118101090192795, -0.048988331109285355, -0.04679565504193306, -0.044602978974580765, -0.04241029918193817, -0.040217623114585876, -0.03802494704723358, -0.03583227097988129, -0.03363959491252899, -0.0314469151198864, -0.029254239052534103, -0.02706156298518181, -0.024868885055184364, -0.02267620712518692, -0.020483531057834625, -0.01829085499048233, -0.016098177060484886, -0.013905500061810017, -0.011712823063135147, -0.009520146064460278, -0.007327469065785408, -0.0051347920671105385, -0.002942115068435669, -0.0007494380697607994, 0.0014432389289140701, 0.0036359159275889397, 0.005828592926263809, 0.008021269924938679, 0.010213946923613548, 0.012406623922288418, 0.014599300920963287, 0.016791976988315582, 0.018984654918313026, 0.02117733284831047, 0.023370008915662766, 0.02556268498301506, 0.027755362913012505, 0.02994804084300995, 0.032140716910362244, 0.03433339297771454, 0.036526069045066833, 0.03871874883770943, 0.04091142490506172, 0.04310410097241402, 0.04529678076505661, 0.047489456832408905, 0.0496821328997612, 0.051874808967113495, 0.05406748503446579, 0.05626016482710838, 0.05845284089446068, 0.06064551696181297, 0.06283819675445557, 0.06503087282180786, 0.06722354888916016]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 4.0, 5.0, 0.0, 3.0, 6.0, 9.0, 12.0, 11.0, 7.0, 17.0, 15.0, 17.0, 23.0, 24.0, 27.0, 23.0, 24.0, 26.0, 35.0, 33.0, 32.0, 34.0, 36.0, 48.0, 40.0, 39.0, 35.0, 26.0, 44.0, 33.0, 29.0, 40.0, 30.0, 26.0, 25.0, 17.0, 16.0, 26.0, 11.0, 10.0, 14.0, 15.0, 13.0, 7.0, 8.0, 6.0, 5.0, 11.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.05078125, -3.9110107421875, -3.771240234375, -3.6314697265625, -3.49169921875, -3.3519287109375, -3.212158203125, -3.0723876953125, -2.9326171875, -2.7928466796875, -2.653076171875, -2.5133056640625, -2.37353515625, -2.2337646484375, -2.093994140625, -1.9542236328125, -1.814453125, -1.6746826171875, -1.534912109375, -1.3951416015625, -1.25537109375, -1.1156005859375, -0.975830078125, -0.8360595703125, -0.6962890625, -0.5565185546875, -0.416748046875, -0.2769775390625, -0.13720703125, 0.0025634765625, 0.142333984375, 0.2821044921875, 0.421875, 0.5616455078125, 0.701416015625, 0.8411865234375, 0.98095703125, 1.1207275390625, 1.260498046875, 1.4002685546875, 1.5400390625, 1.6798095703125, 1.819580078125, 1.9593505859375, 2.09912109375, 2.2388916015625, 2.378662109375, 2.5184326171875, 2.658203125, 2.7979736328125, 2.937744140625, 3.0775146484375, 3.21728515625, 3.3570556640625, 3.496826171875, 3.6365966796875, 3.7763671875, 3.9161376953125, 4.055908203125, 4.1956787109375, 4.33544921875, 4.4752197265625, 4.614990234375, 4.7547607421875, 4.89453125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 4.0, 6.0, 4.0, 2.0, 4.0, 6.0, 12.0, 13.0, 22.0, 42.0, 52.0, 76.0, 90.0, 143.0, 223.0, 367.0, 547.0, 957.0, 1596.0, 2927.0, 5560.0, 12551.0, 32508.0, 105519.0, 428770.0, 328548.0, 79910.0, 26492.0, 10486.0, 4868.0, 2463.0, 1441.0, 817.0, 495.0, 340.0, 219.0, 134.0, 99.0, 79.0, 48.0, 34.0, 22.0, 18.0, 16.0, 10.0, 4.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 3.0, 2.0], "bins": [-5.1796875, -5.03125, -4.8828125, -4.734375, -4.5859375, -4.4375, -4.2890625, -4.140625, -3.9921875, -3.84375, -3.6953125, -3.546875, -3.3984375, -3.25, -3.1015625, -2.953125, -2.8046875, -2.65625, -2.5078125, -2.359375, -2.2109375, -2.0625, -1.9140625, -1.765625, -1.6171875, -1.46875, -1.3203125, -1.171875, -1.0234375, -0.875, -0.7265625, -0.578125, -0.4296875, -0.28125, -0.1328125, 0.015625, 0.1640625, 0.3125, 0.4609375, 0.609375, 0.7578125, 0.90625, 1.0546875, 1.203125, 1.3515625, 1.5, 1.6484375, 1.796875, 1.9453125, 2.09375, 2.2421875, 2.390625, 2.5390625, 2.6875, 2.8359375, 2.984375, 3.1328125, 3.28125, 3.4296875, 3.578125, 3.7265625, 3.875, 4.0234375, 4.171875, 4.3203125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 6.0, 8.0, 8.0, 7.0, 11.0, 7.0, 16.0, 25.0, 19.0, 19.0, 20.0, 27.0, 32.0, 32.0, 39.0, 42.0, 36.0, 62.0, 127.0, 1555.0, 410.0, 92.0, 48.0, 50.0, 41.0, 41.0, 33.0, 38.0, 23.0, 33.0, 27.0, 16.0, 20.0, 16.0, 13.0, 14.0, 10.0, 13.0, 6.0, 0.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.78125, -17.224853515625, -16.66845703125, -16.112060546875, -15.5556640625, -14.999267578125, -14.44287109375, -13.886474609375, -13.330078125, -12.773681640625, -12.21728515625, -11.660888671875, -11.1044921875, -10.548095703125, -9.99169921875, -9.435302734375, -8.87890625, -8.322509765625, -7.76611328125, -7.209716796875, -6.6533203125, -6.096923828125, -5.54052734375, -4.984130859375, -4.427734375, -3.871337890625, -3.31494140625, -2.758544921875, -2.2021484375, -1.645751953125, -1.08935546875, -0.532958984375, 0.0234375, 0.579833984375, 1.13623046875, 1.692626953125, 2.2490234375, 2.805419921875, 3.36181640625, 3.918212890625, 4.474609375, 5.031005859375, 5.58740234375, 6.143798828125, 6.7001953125, 7.256591796875, 7.81298828125, 8.369384765625, 8.92578125, 9.482177734375, 10.03857421875, 10.594970703125, 11.1513671875, 11.707763671875, 12.26416015625, 12.820556640625, 13.376953125, 13.933349609375, 14.48974609375, 15.046142578125, 15.6025390625, 16.158935546875, 16.71533203125, 17.271728515625, 17.828125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 8.0, 2.0, 0.0, 7.0, 8.0, 11.0, 14.0, 14.0, 15.0, 18.0, 20.0, 30.0, 32.0, 52.0, 62.0, 106.0, 151.0, 221.0, 436.0, 1092.0, 7709.0, 993215.0, 2130679.0, 9375.0, 1259.0, 425.0, 237.0, 158.0, 100.0, 49.0, 47.0, 30.0, 25.0, 23.0, 15.0, 16.0, 12.0, 14.0, 8.0, 3.0, 4.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.015625, -27.14111328125, -26.2666015625, -25.39208984375, -24.517578125, -23.64306640625, -22.7685546875, -21.89404296875, -21.01953125, -20.14501953125, -19.2705078125, -18.39599609375, -17.521484375, -16.64697265625, -15.7724609375, -14.89794921875, -14.0234375, -13.14892578125, -12.2744140625, -11.39990234375, -10.525390625, -9.65087890625, -8.7763671875, -7.90185546875, -7.02734375, -6.15283203125, -5.2783203125, -4.40380859375, -3.529296875, -2.65478515625, -1.7802734375, -0.90576171875, -0.03125, 0.84326171875, 1.7177734375, 2.59228515625, 3.466796875, 4.34130859375, 5.2158203125, 6.09033203125, 6.96484375, 7.83935546875, 8.7138671875, 9.58837890625, 10.462890625, 11.33740234375, 12.2119140625, 13.08642578125, 13.9609375, 14.83544921875, 15.7099609375, 16.58447265625, 17.458984375, 18.33349609375, 19.2080078125, 20.08251953125, 20.95703125, 21.83154296875, 22.7060546875, 23.58056640625, 24.455078125, 25.32958984375, 26.2041015625, 27.07861328125, 27.953125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 204.0, 730.0, 79.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.94773864746094, -59.170570373535156, -54.39340591430664, -49.616241455078125, -44.839073181152344, -40.06190490722656, -35.28474044799805, -30.50757598876953, -25.73040771484375, -20.9532413482666, -16.176074981689453, -11.398908615112305, -6.621742248535156, -1.8445758819580078, 2.9325904846191406, 7.709754943847656, 12.486923217773438, 17.264089584350586, 22.041255950927734, 26.818422317504883, 31.59558868408203, 36.37275695800781, 41.14992141723633, 45.927085876464844, 50.704254150390625, 55.481422424316406, 60.25858688354492, 65.03575134277344, 69.81291961669922, 74.590087890625, 79.36724853515625, 84.14441680908203, 88.92160034179688, 93.69876861572266, 98.47593688964844, 103.25309753417969, 108.03026580810547, 112.80743408203125, 117.5845947265625, 122.36176300048828, 127.13893127441406, 131.9160919189453, 136.69326782226562, 141.47042846679688, 146.24758911132812, 151.02476501464844, 155.8019256591797, 160.5791015625, 165.35626220703125, 170.1334228515625, 174.9105987548828, 179.68775939941406, 184.46493530273438, 189.24209594726562, 194.01925659179688, 198.79641723632812, 203.57359313964844, 208.3507537841797, 213.1279296875, 217.90509033203125, 222.6822509765625, 227.4594268798828, 232.23658752441406, 237.01376342773438, 241.79092407226562]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 9.0, 7.0, 8.0, 10.0, 14.0, 11.0, 15.0, 14.0, 23.0, 25.0, 29.0, 39.0, 29.0, 42.0, 40.0, 48.0, 43.0, 40.0, 43.0, 45.0, 42.0, 70.0, 43.0, 39.0, 34.0, 40.0, 31.0, 22.0, 31.0, 22.0, 14.0, 16.0, 16.0, 14.0, 11.0, 6.0, 9.0, 6.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.020755767822266, -57.145050048828125, -55.26934051513672, -53.39363479614258, -51.51792526245117, -49.64221954345703, -47.766510009765625, -45.890804290771484, -44.015098571777344, -42.1393928527832, -40.2636833190918, -38.387977600097656, -36.51226806640625, -34.63656234741211, -32.76085662841797, -30.885147094726562, -29.009437561035156, -27.133729934692383, -25.25802230834961, -23.38231658935547, -21.506607055664062, -19.630901336669922, -17.75519371032715, -15.879486083984375, -14.003778457641602, -12.128070831298828, -10.252363204956055, -8.376656532287598, -6.500948905944824, -4.625241279602051, -2.7495346069335938, -0.8738269805908203, 1.0018844604492188, 2.877591848373413, 4.753299236297607, 6.629006385803223, 8.504714012145996, 10.38042163848877, 12.256128311157227, 14.1318359375, 16.007543563842773, 17.883251190185547, 19.75895881652832, 21.634666442871094, 23.510372161865234, 25.38608169555664, 27.26178741455078, 29.137495040893555, 31.013202667236328, 32.88890838623047, 34.764617919921875, 36.640323638916016, 38.51603317260742, 40.39173889160156, 42.26744842529297, 44.14315414428711, 46.01885986328125, 47.89456558227539, 49.7702751159668, 51.64598083496094, 53.521690368652344, 55.397396087646484, 57.273101806640625, 59.14881134033203, 61.02452087402344]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 11.0, 3.0, 10.0, 14.0, 13.0, 13.0, 16.0, 25.0, 21.0, 23.0, 30.0, 26.0, 21.0, 22.0, 40.0, 36.0, 41.0, 29.0, 45.0, 35.0, 49.0, 34.0, 36.0, 37.0, 42.0, 27.0, 38.0, 33.0, 29.0, 20.0, 20.0, 23.0, 20.0, 11.0, 13.0, 12.0, 13.0, 15.0, 12.0, 6.0, 7.0, 6.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.140625, -3.9949951171875, -3.849365234375, -3.7037353515625, -3.55810546875, -3.4124755859375, -3.266845703125, -3.1212158203125, -2.9755859375, -2.8299560546875, -2.684326171875, -2.5386962890625, -2.39306640625, -2.2474365234375, -2.101806640625, -1.9561767578125, -1.810546875, -1.6649169921875, -1.519287109375, -1.3736572265625, -1.22802734375, -1.0823974609375, -0.936767578125, -0.7911376953125, -0.6455078125, -0.4998779296875, -0.354248046875, -0.2086181640625, -0.06298828125, 0.0826416015625, 0.228271484375, 0.3739013671875, 0.51953125, 0.6651611328125, 0.810791015625, 0.9564208984375, 1.10205078125, 1.2476806640625, 1.393310546875, 1.5389404296875, 1.6845703125, 1.8302001953125, 1.975830078125, 2.1214599609375, 2.26708984375, 2.4127197265625, 2.558349609375, 2.7039794921875, 2.849609375, 2.9952392578125, 3.140869140625, 3.2864990234375, 3.43212890625, 3.5777587890625, 3.723388671875, 3.8690185546875, 4.0146484375, 4.1602783203125, 4.305908203125, 4.4515380859375, 4.59716796875, 4.7427978515625, 4.888427734375, 5.0340576171875, 5.1796875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 10.0, 23.0, 23.0, 32.0, 38.0, 57.0, 66.0, 91.0, 152.0, 242.0, 312.0, 458.0, 635.0, 972.0, 1421.0, 2167.0, 3338.0, 5403.0, 9163.0, 16504.0, 32474.0, 81077.0, 457554.0, 2830380.0, 582573.0, 89945.0, 35924.0, 17555.0, 9766.0, 5680.0, 3473.0, 2226.0, 1389.0, 951.0, 656.0, 440.0, 316.0, 222.0, 167.0, 119.0, 68.0, 46.0, 44.0, 34.0, 22.0, 20.0, 13.0, 7.0, 6.0, 6.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-15.5390625, -15.0303955078125, -14.521728515625, -14.0130615234375, -13.50439453125, -12.9957275390625, -12.487060546875, -11.9783935546875, -11.4697265625, -10.9610595703125, -10.452392578125, -9.9437255859375, -9.43505859375, -8.9263916015625, -8.417724609375, -7.9090576171875, -7.400390625, -6.8917236328125, -6.383056640625, -5.8743896484375, -5.36572265625, -4.8570556640625, -4.348388671875, -3.8397216796875, -3.3310546875, -2.8223876953125, -2.313720703125, -1.8050537109375, -1.29638671875, -0.7877197265625, -0.279052734375, 0.2296142578125, 0.73828125, 1.2469482421875, 1.755615234375, 2.2642822265625, 2.77294921875, 3.2816162109375, 3.790283203125, 4.2989501953125, 4.8076171875, 5.3162841796875, 5.824951171875, 6.3336181640625, 6.84228515625, 7.3509521484375, 7.859619140625, 8.3682861328125, 8.876953125, 9.3856201171875, 9.894287109375, 10.4029541015625, 10.91162109375, 11.4202880859375, 11.928955078125, 12.4376220703125, 12.9462890625, 13.4549560546875, 13.963623046875, 14.4722900390625, 14.98095703125, 15.4896240234375, 15.998291015625, 16.5069580078125, 17.015625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 6.0, 4.0, 5.0, 9.0, 17.0, 9.0, 19.0, 26.0, 27.0, 47.0, 50.0, 73.0, 93.0, 114.0, 194.0, 264.0, 404.0, 599.0, 610.0, 461.0, 297.0, 222.0, 144.0, 74.0, 77.0, 36.0, 46.0, 27.0, 28.0, 22.0, 24.0, 8.0, 8.0, 8.0, 8.0, 2.0, 4.0, 0.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-16.765625, -16.243896484375, -15.72216796875, -15.200439453125, -14.6787109375, -14.156982421875, -13.63525390625, -13.113525390625, -12.591796875, -12.070068359375, -11.54833984375, -11.026611328125, -10.5048828125, -9.983154296875, -9.46142578125, -8.939697265625, -8.41796875, -7.896240234375, -7.37451171875, -6.852783203125, -6.3310546875, -5.809326171875, -5.28759765625, -4.765869140625, -4.244140625, -3.722412109375, -3.20068359375, -2.678955078125, -2.1572265625, -1.635498046875, -1.11376953125, -0.592041015625, -0.0703125, 0.451416015625, 0.97314453125, 1.494873046875, 2.0166015625, 2.538330078125, 3.06005859375, 3.581787109375, 4.103515625, 4.625244140625, 5.14697265625, 5.668701171875, 6.1904296875, 6.712158203125, 7.23388671875, 7.755615234375, 8.27734375, 8.799072265625, 9.32080078125, 9.842529296875, 10.3642578125, 10.885986328125, 11.40771484375, 11.929443359375, 12.451171875, 12.972900390625, 13.49462890625, 14.016357421875, 14.5380859375, 15.059814453125, 15.58154296875, 16.103271484375, 16.625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 6.0, 2.0, 8.0, 9.0, 16.0, 26.0, 24.0, 42.0, 70.0, 85.0, 143.0, 196.0, 336.0, 595.0, 883.0, 1552.0, 2710.0, 4933.0, 9124.0, 18150.0, 37651.0, 89544.0, 312551.0, 2141917.0, 1245384.0, 199040.0, 67555.0, 29747.0, 14388.0, 7714.0, 4084.0, 2435.0, 1332.0, 743.0, 492.0, 278.0, 176.0, 134.0, 65.0, 51.0, 35.0, 20.0, 15.0, 6.0, 4.0, 11.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.203125, -23.46630859375, -22.7294921875, -21.99267578125, -21.255859375, -20.51904296875, -19.7822265625, -19.04541015625, -18.30859375, -17.57177734375, -16.8349609375, -16.09814453125, -15.361328125, -14.62451171875, -13.8876953125, -13.15087890625, -12.4140625, -11.67724609375, -10.9404296875, -10.20361328125, -9.466796875, -8.72998046875, -7.9931640625, -7.25634765625, -6.51953125, -5.78271484375, -5.0458984375, -4.30908203125, -3.572265625, -2.83544921875, -2.0986328125, -1.36181640625, -0.625, 0.11181640625, 0.8486328125, 1.58544921875, 2.322265625, 3.05908203125, 3.7958984375, 4.53271484375, 5.26953125, 6.00634765625, 6.7431640625, 7.47998046875, 8.216796875, 8.95361328125, 9.6904296875, 10.42724609375, 11.1640625, 11.90087890625, 12.6376953125, 13.37451171875, 14.111328125, 14.84814453125, 15.5849609375, 16.32177734375, 17.05859375, 17.79541015625, 18.5322265625, 19.26904296875, 20.005859375, 20.74267578125, 21.4794921875, 22.21630859375, 22.953125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 9.0, 13.0, 24.0, 32.0, 54.0, 91.0, 107.0, 123.0, 135.0, 138.0, 86.0, 71.0, 43.0, 32.0, 17.0, 11.0, 4.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.44300842285156, -163.2902374267578, -159.13746643066406, -154.9846954345703, -150.8319091796875, -146.67913818359375, -142.5263671875, -138.37359619140625, -134.2208251953125, -130.06805419921875, -125.915283203125, -121.76250457763672, -117.60973358154297, -113.45696258544922, -109.30418395996094, -105.15141296386719, -100.99864196777344, -96.84587097167969, -92.69309997558594, -88.54032135009766, -84.3875503540039, -80.23477935791016, -76.08200073242188, -71.92922973632812, -67.77645874023438, -63.623687744140625, -59.47091293334961, -55.318138122558594, -51.165367126464844, -47.012596130371094, -42.85982131958008, -38.70704650878906, -34.55426025390625, -30.401487350463867, -26.248714447021484, -22.0959415435791, -17.94316864013672, -13.790395736694336, -9.637622833251953, -5.48484992980957, -1.3320770263671875, 2.8206958770751953, 6.973468780517578, 11.126241683959961, 15.279014587402344, 19.431787490844727, 23.58456039428711, 27.737333297729492, 31.890106201171875, 36.042877197265625, 40.19565200805664, 44.348426818847656, 48.501197814941406, 52.653968811035156, 56.80674362182617, 60.95951843261719, 65.11228942871094, 69.26506042480469, 73.41783142089844, 77.57061004638672, 81.72338104248047, 85.87615203857422, 90.0289306640625, 94.18170166015625, 98.33447265625]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 7.0, 9.0, 7.0, 9.0, 11.0, 15.0, 15.0, 17.0, 17.0, 26.0, 29.0, 29.0, 29.0, 38.0, 33.0, 30.0, 27.0, 29.0, 41.0, 37.0, 35.0, 48.0, 50.0, 50.0, 29.0, 45.0, 31.0, 32.0, 32.0, 28.0, 26.0, 26.0, 13.0, 22.0, 22.0, 12.0, 8.0, 12.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-56.74903106689453, -55.08230209350586, -53.41557312011719, -51.748844146728516, -50.082115173339844, -48.41539001464844, -46.7486572265625, -45.081932067871094, -43.41520309448242, -41.74847412109375, -40.08174514770508, -38.415016174316406, -36.748287200927734, -35.08155822753906, -33.414833068847656, -31.748104095458984, -30.08137321472168, -28.414644241333008, -26.747915267944336, -25.081188201904297, -23.414459228515625, -21.747730255126953, -20.08100128173828, -18.41427230834961, -16.747543334960938, -15.080814361572266, -13.41408634185791, -11.747357368469238, -10.080629348754883, -8.413900375366211, -6.747171401977539, -5.080443382263184, -3.413715362548828, -1.746986746788025, -0.08025813102722168, 1.586470603942871, 3.2531991004943848, 4.919927597045898, 6.58665657043457, 8.253384590148926, 9.920113563537598, 11.58684253692627, 13.253570556640625, 14.920299530029297, 16.58702850341797, 18.25375747680664, 19.920486450195312, 21.58721351623535, 23.253942489624023, 24.920671463012695, 26.587400436401367, 28.254127502441406, 29.920856475830078, 31.58758544921875, 33.25431442260742, 34.921043395996094, 36.587772369384766, 38.25450134277344, 39.92123031616211, 41.58795928955078, 43.25468826293945, 44.921417236328125, 46.58814239501953, 48.2548713684082, 49.921600341796875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 5.0, 9.0, 5.0, 8.0, 14.0, 13.0, 17.0, 18.0, 19.0, 29.0, 19.0, 27.0, 31.0, 31.0, 31.0, 24.0, 32.0, 47.0, 40.0, 35.0, 40.0, 40.0, 40.0, 37.0, 26.0, 38.0, 26.0, 27.0, 31.0, 30.0, 28.0, 29.0, 20.0, 13.0, 18.0, 19.0, 10.0, 11.0, 12.0, 9.0, 12.0, 8.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 3.0, 4.0], "bins": [-5.515625, -5.358154296875, -5.20068359375, -5.043212890625, -4.8857421875, -4.728271484375, -4.57080078125, -4.413330078125, -4.255859375, -4.098388671875, -3.94091796875, -3.783447265625, -3.6259765625, -3.468505859375, -3.31103515625, -3.153564453125, -2.99609375, -2.838623046875, -2.68115234375, -2.523681640625, -2.3662109375, -2.208740234375, -2.05126953125, -1.893798828125, -1.736328125, -1.578857421875, -1.42138671875, -1.263916015625, -1.1064453125, -0.948974609375, -0.79150390625, -0.634033203125, -0.4765625, -0.319091796875, -0.16162109375, -0.004150390625, 0.1533203125, 0.310791015625, 0.46826171875, 0.625732421875, 0.783203125, 0.940673828125, 1.09814453125, 1.255615234375, 1.4130859375, 1.570556640625, 1.72802734375, 1.885498046875, 2.04296875, 2.200439453125, 2.35791015625, 2.515380859375, 2.6728515625, 2.830322265625, 2.98779296875, 3.145263671875, 3.302734375, 3.460205078125, 3.61767578125, 3.775146484375, 3.9326171875, 4.090087890625, 4.24755859375, 4.405029296875, 4.5625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 4.0, 10.0, 10.0, 9.0, 19.0, 26.0, 33.0, 61.0, 90.0, 140.0, 196.0, 304.0, 505.0, 836.0, 1280.0, 2097.0, 3407.0, 5577.0, 9655.0, 17543.0, 33118.0, 67051.0, 141722.0, 269894.0, 245062.0, 123937.0, 58703.0, 29514.0, 15700.0, 8674.0, 4999.0, 3157.0, 1881.0, 1239.0, 787.0, 431.0, 309.0, 200.0, 128.0, 78.0, 55.0, 40.0, 22.0, 18.0, 10.0, 6.0, 5.0, 11.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.91015625, -0.8824996948242188, -0.8548431396484375, -0.8271865844726562, -0.799530029296875, -0.7718734741210938, -0.7442169189453125, -0.7165603637695312, -0.68890380859375, -0.6612472534179688, -0.6335906982421875, -0.6059341430664062, -0.578277587890625, -0.5506210327148438, -0.5229644775390625, -0.49530792236328125, -0.4676513671875, -0.43999481201171875, -0.4123382568359375, -0.38468170166015625, -0.357025146484375, -0.32936859130859375, -0.3017120361328125, -0.27405548095703125, -0.24639892578125, -0.21874237060546875, -0.1910858154296875, -0.16342926025390625, -0.135772705078125, -0.10811614990234375, -0.0804595947265625, -0.05280303955078125, -0.025146484375, 0.00251007080078125, 0.0301666259765625, 0.05782318115234375, 0.085479736328125, 0.11313629150390625, 0.1407928466796875, 0.16844940185546875, 0.19610595703125, 0.22376251220703125, 0.2514190673828125, 0.27907562255859375, 0.306732177734375, 0.33438873291015625, 0.3620452880859375, 0.38970184326171875, 0.4173583984375, 0.44501495361328125, 0.4726715087890625, 0.5003280639648438, 0.527984619140625, 0.5556411743164062, 0.5832977294921875, 0.6109542846679688, 0.63861083984375, 0.6662673950195312, 0.6939239501953125, 0.7215805053710938, 0.749237060546875, 0.7768936157226562, 0.8045501708984375, 0.8322067260742188, 0.85986328125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 1.0, 6.0, 5.0, 10.0, 6.0, 8.0, 10.0, 13.0, 16.0, 20.0, 21.0, 25.0, 25.0, 26.0, 31.0, 32.0, 37.0, 36.0, 34.0, 37.0, 46.0, 44.0, 1057.0, 27.0, 44.0, 38.0, 35.0, 37.0, 31.0, 24.0, 34.0, 34.0, 25.0, 30.0, 28.0, 17.0, 9.0, 13.0, 13.0, 11.0, 5.0, 6.0, 7.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.73828125, -3.625732421875, -3.51318359375, -3.400634765625, -3.2880859375, -3.175537109375, -3.06298828125, -2.950439453125, -2.837890625, -2.725341796875, -2.61279296875, -2.500244140625, -2.3876953125, -2.275146484375, -2.16259765625, -2.050048828125, -1.9375, -1.824951171875, -1.71240234375, -1.599853515625, -1.4873046875, -1.374755859375, -1.26220703125, -1.149658203125, -1.037109375, -0.924560546875, -0.81201171875, -0.699462890625, -0.5869140625, -0.474365234375, -0.36181640625, -0.249267578125, -0.13671875, -0.024169921875, 0.08837890625, 0.200927734375, 0.3134765625, 0.426025390625, 0.53857421875, 0.651123046875, 0.763671875, 0.876220703125, 0.98876953125, 1.101318359375, 1.2138671875, 1.326416015625, 1.43896484375, 1.551513671875, 1.6640625, 1.776611328125, 1.88916015625, 2.001708984375, 2.1142578125, 2.226806640625, 2.33935546875, 2.451904296875, 2.564453125, 2.677001953125, 2.78955078125, 2.902099609375, 3.0146484375, 3.127197265625, 3.23974609375, 3.352294921875, 3.46484375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 3.0, 13.0, 18.0, 20.0, 21.0, 27.0, 57.0, 88.0, 111.0, 172.0, 273.0, 349.0, 560.0, 809.0, 1215.0, 1893.0, 2874.0, 4459.0, 6824.0, 11009.0, 17227.0, 27598.0, 44284.0, 74657.0, 126857.0, 407228.0, 1023594.0, 136106.0, 80281.0, 47795.0, 29500.0, 18603.0, 11454.0, 7348.0, 4719.0, 3055.0, 2015.0, 1292.0, 915.0, 587.0, 397.0, 248.0, 179.0, 128.0, 95.0, 63.0, 29.0, 23.0, 24.0, 12.0, 10.0, 6.0, 5.0, 2.0, 4.0, 2.0], "bins": [-0.345458984375, -0.33531951904296875, -0.3251800537109375, -0.31504058837890625, -0.304901123046875, -0.29476165771484375, -0.2846221923828125, -0.27448272705078125, -0.26434326171875, -0.25420379638671875, -0.2440643310546875, -0.23392486572265625, -0.223785400390625, -0.21364593505859375, -0.2035064697265625, -0.19336700439453125, -0.1832275390625, -0.17308807373046875, -0.1629486083984375, -0.15280914306640625, -0.142669677734375, -0.13253021240234375, -0.1223907470703125, -0.11225128173828125, -0.10211181640625, -0.09197235107421875, -0.0818328857421875, -0.07169342041015625, -0.061553955078125, -0.05141448974609375, -0.0412750244140625, -0.03113555908203125, -0.02099609375, -0.01085662841796875, -0.0007171630859375, 0.00942230224609375, 0.019561767578125, 0.02970123291015625, 0.0398406982421875, 0.04998016357421875, 0.06011962890625, 0.07025909423828125, 0.0803985595703125, 0.09053802490234375, 0.100677490234375, 0.11081695556640625, 0.1209564208984375, 0.13109588623046875, 0.1412353515625, 0.15137481689453125, 0.1615142822265625, 0.17165374755859375, 0.181793212890625, 0.19193267822265625, 0.2020721435546875, 0.21221160888671875, 0.22235107421875, 0.23249053955078125, 0.2426300048828125, 0.25276947021484375, 0.262908935546875, 0.27304840087890625, 0.2831878662109375, 0.29332733154296875, 0.303466796875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 3.0, 5.0, 3.0, 5.0, 7.0, 7.0, 8.0, 13.0, 14.0, 24.0, 20.0, 17.0, 20.0, 29.0, 23.0, 45.0, 51.0, 60.0, 50.0, 43.0, 54.0, 57.0, 66.0, 47.0, 39.0, 43.0, 31.0, 32.0, 33.0, 31.0, 19.0, 13.0, 11.0, 12.0, 12.0, 9.0, 3.0, 6.0, 2.0, 4.0, 2.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.038238525390625, -0.03709220886230469, -0.035945892333984375, -0.03479957580566406, -0.03365325927734375, -0.03250694274902344, -0.031360626220703125, -0.030214309692382812, -0.0290679931640625, -0.027921676635742188, -0.026775360107421875, -0.025629043579101562, -0.02448272705078125, -0.023336410522460938, -0.022190093994140625, -0.021043777465820312, -0.0198974609375, -0.018751144409179688, -0.017604827880859375, -0.016458511352539062, -0.01531219482421875, -0.014165878295898438, -0.013019561767578125, -0.011873245239257812, -0.0107269287109375, -0.009580612182617188, -0.008434295654296875, -0.0072879791259765625, -0.00614166259765625, -0.0049953460693359375, -0.003849029541015625, -0.0027027130126953125, -0.001556396484375, -0.0004100799560546875, 0.000736236572265625, 0.0018825531005859375, 0.00302886962890625, 0.0041751861572265625, 0.005321502685546875, 0.0064678192138671875, 0.0076141357421875, 0.008760452270507812, 0.009906768798828125, 0.011053085327148438, 0.01219940185546875, 0.013345718383789062, 0.014492034912109375, 0.015638351440429688, 0.01678466796875, 0.017930984497070312, 0.019077301025390625, 0.020223617553710938, 0.02136993408203125, 0.022516250610351562, 0.023662567138671875, 0.024808883666992188, 0.0259552001953125, 0.027101516723632812, 0.028247833251953125, 0.029394149780273438, 0.03054046630859375, 0.03168678283691406, 0.032833099365234375, 0.03397941589355469, 0.035125732421875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 8.0, 2.0, 2.0, 6.0, 2.0, 5.0, 5.0, 5.0, 10.0, 11.0, 15.0, 17.0, 20.0, 37.0, 34.0, 49.0, 62.0, 73.0, 100.0, 157.0, 230.0, 445.0, 2312.0, 828703.0, 213469.0, 1545.0, 437.0, 255.0, 151.0, 84.0, 64.0, 53.0, 32.0, 30.0, 36.0, 23.0, 11.0, 10.0, 7.0, 5.0, 8.0, 2.0, 2.0, 3.0, 9.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.7080078125, -0.6858291625976562, -0.6636505126953125, -0.6414718627929688, -0.619293212890625, -0.5971145629882812, -0.5749359130859375, -0.5527572631835938, -0.53057861328125, -0.5083999633789062, -0.4862213134765625, -0.46404266357421875, -0.441864013671875, -0.41968536376953125, -0.3975067138671875, -0.37532806396484375, -0.3531494140625, -0.33097076416015625, -0.3087921142578125, -0.28661346435546875, -0.264434814453125, -0.24225616455078125, -0.2200775146484375, -0.19789886474609375, -0.17572021484375, -0.15354156494140625, -0.1313629150390625, -0.10918426513671875, -0.087005615234375, -0.06482696533203125, -0.0426483154296875, -0.02046966552734375, 0.001708984375, 0.02388763427734375, 0.0460662841796875, 0.06824493408203125, 0.090423583984375, 0.11260223388671875, 0.1347808837890625, 0.15695953369140625, 0.17913818359375, 0.20131683349609375, 0.2234954833984375, 0.24567413330078125, 0.267852783203125, 0.29003143310546875, 0.3122100830078125, 0.33438873291015625, 0.3565673828125, 0.37874603271484375, 0.4009246826171875, 0.42310333251953125, 0.445281982421875, 0.46746063232421875, 0.4896392822265625, 0.5118179321289062, 0.53399658203125, 0.5561752319335938, 0.5783538818359375, 0.6005325317382812, 0.622711181640625, 0.6448898315429688, 0.6670684814453125, 0.6892471313476562, 0.71142578125]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 5.0, 6.0, 14.0, 72.0, 225.0, 464.0, 148.0, 37.0, 24.0, 11.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059545211493968964, -0.04999332129955292, -0.04044143110513687, -0.030889540910720825, -0.02133765071630478, -0.011785760521888733, -0.0022338703274726868, 0.007318019866943359, 0.016869910061359406, 0.02642180025577545, 0.0359736904501915, 0.045525580644607544, 0.05507747083902359, 0.06462936103343964, 0.07418125122785568, 0.08373314142227173, 0.09328503161668777, 0.10283692181110382, 0.11238881200551987, 0.12194070219993591, 0.13149258494377136, 0.141044482588768, 0.15059638023376465, 0.1601482629776001, 0.16970014572143555, 0.179252028465271, 0.18880392611026764, 0.19835582375526428, 0.20790770649909973, 0.21745958924293518, 0.22701148688793182, 0.23656338453292847, 0.24611526727676392, 0.25566715002059937, 0.2652190327644348, 0.27477094531059265, 0.2843228280544281, 0.29387471079826355, 0.3034266233444214, 0.31297850608825684, 0.3225303888320923, 0.33208227157592773, 0.3416341543197632, 0.351186066865921, 0.36073794960975647, 0.3702898323535919, 0.37984174489974976, 0.3893936276435852, 0.39894551038742065, 0.4084973931312561, 0.41804927587509155, 0.4276011884212494, 0.43715307116508484, 0.4467049539089203, 0.4562568664550781, 0.4658087491989136, 0.475360631942749, 0.4849125146865845, 0.4944643974304199, 0.5040162801742554, 0.5135681629180908, 0.523120105266571, 0.5326719880104065, 0.5422238707542419, 0.5517757534980774]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 5.0, 5.0, 4.0, 8.0, 7.0, 11.0, 11.0, 10.0, 8.0, 14.0, 16.0, 11.0, 19.0, 23.0, 25.0, 34.0, 29.0, 32.0, 22.0, 42.0, 27.0, 34.0, 38.0, 44.0, 33.0, 30.0, 51.0, 31.0, 26.0, 35.0, 33.0, 33.0, 33.0, 23.0, 19.0, 30.0, 22.0, 18.0, 18.0, 15.0, 12.0, 11.0, 7.0, 14.0, 5.0, 6.0, 5.0, 5.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11718302965164185, -0.1135890930891037, -0.10999515652656555, -0.106401227414608, -0.10280729085206985, -0.09921335428953171, -0.09561942517757416, -0.09202548861503601, -0.08843155205249786, -0.08483761548995972, -0.08124367892742157, -0.07764974981546402, -0.07405581325292587, -0.07046187669038773, -0.06686794757843018, -0.06327401101589203, -0.05968007445335388, -0.056086137890815735, -0.052492205053567886, -0.04889827221632004, -0.04530433565378189, -0.041710399091243744, -0.038116466253995895, -0.03452253341674805, -0.0309285968542099, -0.027334662154316902, -0.023740727454423904, -0.020146792754530907, -0.01655285805463791, -0.012958923354744911, -0.009364988654851913, -0.005771053954958916, -0.002177119255065918, 0.0014168154448270798, 0.0050107501447200775, 0.008604684844613075, 0.012198619544506073, 0.01579255424439907, 0.01938648894429207, 0.022980423644185066, 0.026574358344078064, 0.03016829304397106, 0.03376222774386406, 0.03735616058111191, 0.040950097143650055, 0.0445440337061882, 0.04813796654343605, 0.0517318993806839, 0.055325835943222046, 0.05891977250576019, 0.06251370906829834, 0.06610763818025589, 0.06970157474279404, 0.07329551130533218, 0.07688944041728973, 0.08048337697982788, 0.08407731354236603, 0.08767125010490417, 0.09126518666744232, 0.09485911577939987, 0.09845305234193802, 0.10204698890447617, 0.10564091801643372, 0.10923485457897186, 0.11282879114151001]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 10.0, 5.0, 8.0, 14.0, 13.0, 17.0, 17.0, 20.0, 29.0, 19.0, 27.0, 31.0, 29.0, 31.0, 24.0, 33.0, 47.0, 40.0, 35.0, 41.0, 38.0, 41.0, 38.0, 27.0, 36.0, 27.0, 25.0, 33.0, 30.0, 28.0, 28.0, 20.0, 14.0, 18.0, 19.0, 9.0, 12.0, 11.0, 10.0, 12.0, 8.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 3.0, 4.0], "bins": [-5.51953125, -5.362060546875, -5.20458984375, -5.047119140625, -4.8896484375, -4.732177734375, -4.57470703125, -4.417236328125, -4.259765625, -4.102294921875, -3.94482421875, -3.787353515625, -3.6298828125, -3.472412109375, -3.31494140625, -3.157470703125, -3.0, -2.842529296875, -2.68505859375, -2.527587890625, -2.3701171875, -2.212646484375, -2.05517578125, -1.897705078125, -1.740234375, -1.582763671875, -1.42529296875, -1.267822265625, -1.1103515625, -0.952880859375, -0.79541015625, -0.637939453125, -0.48046875, -0.322998046875, -0.16552734375, -0.008056640625, 0.1494140625, 0.306884765625, 0.46435546875, 0.621826171875, 0.779296875, 0.936767578125, 1.09423828125, 1.251708984375, 1.4091796875, 1.566650390625, 1.72412109375, 1.881591796875, 2.0390625, 2.196533203125, 2.35400390625, 2.511474609375, 2.6689453125, 2.826416015625, 2.98388671875, 3.141357421875, 3.298828125, 3.456298828125, 3.61376953125, 3.771240234375, 3.9287109375, 4.086181640625, 4.24365234375, 4.401123046875, 4.55859375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 3.0, 10.0, 16.0, 18.0, 18.0, 34.0, 45.0, 59.0, 84.0, 88.0, 158.0, 179.0, 271.0, 344.0, 456.0, 585.0, 819.0, 1135.0, 1458.0, 2140.0, 3242.0, 5139.0, 9829.0, 32298.0, 399085.0, 522380.0, 40596.0, 11029.0, 5455.0, 3306.0, 2237.0, 1594.0, 1120.0, 847.0, 622.0, 475.0, 328.0, 268.0, 187.0, 163.0, 115.0, 83.0, 66.0, 49.0, 34.0, 37.0, 15.0, 4.0, 8.0, 7.0, 9.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-12.5859375, -12.193359375, -11.80078125, -11.408203125, -11.015625, -10.623046875, -10.23046875, -9.837890625, -9.4453125, -9.052734375, -8.66015625, -8.267578125, -7.875, -7.482421875, -7.08984375, -6.697265625, -6.3046875, -5.912109375, -5.51953125, -5.126953125, -4.734375, -4.341796875, -3.94921875, -3.556640625, -3.1640625, -2.771484375, -2.37890625, -1.986328125, -1.59375, -1.201171875, -0.80859375, -0.416015625, -0.0234375, 0.369140625, 0.76171875, 1.154296875, 1.546875, 1.939453125, 2.33203125, 2.724609375, 3.1171875, 3.509765625, 3.90234375, 4.294921875, 4.6875, 5.080078125, 5.47265625, 5.865234375, 6.2578125, 6.650390625, 7.04296875, 7.435546875, 7.828125, 8.220703125, 8.61328125, 9.005859375, 9.3984375, 9.791015625, 10.18359375, 10.576171875, 10.96875, 11.361328125, 11.75390625, 12.146484375, 12.5390625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 14.0, 13.0, 14.0, 20.0, 19.0, 36.0, 27.0, 35.0, 32.0, 44.0, 46.0, 56.0, 61.0, 77.0, 150.0, 1620.0, 228.0, 82.0, 70.0, 50.0, 45.0, 46.0, 44.0, 39.0, 36.0, 26.0, 22.0, 27.0, 11.0, 16.0, 11.0, 12.0, 7.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.15625, -21.498779296875, -20.84130859375, -20.183837890625, -19.5263671875, -18.868896484375, -18.21142578125, -17.553955078125, -16.896484375, -16.239013671875, -15.58154296875, -14.924072265625, -14.2666015625, -13.609130859375, -12.95166015625, -12.294189453125, -11.63671875, -10.979248046875, -10.32177734375, -9.664306640625, -9.0068359375, -8.349365234375, -7.69189453125, -7.034423828125, -6.376953125, -5.719482421875, -5.06201171875, -4.404541015625, -3.7470703125, -3.089599609375, -2.43212890625, -1.774658203125, -1.1171875, -0.459716796875, 0.19775390625, 0.855224609375, 1.5126953125, 2.170166015625, 2.82763671875, 3.485107421875, 4.142578125, 4.800048828125, 5.45751953125, 6.114990234375, 6.7724609375, 7.429931640625, 8.08740234375, 8.744873046875, 9.40234375, 10.059814453125, 10.71728515625, 11.374755859375, 12.0322265625, 12.689697265625, 13.34716796875, 14.004638671875, 14.662109375, 15.319580078125, 15.97705078125, 16.634521484375, 17.2919921875, 17.949462890625, 18.60693359375, 19.264404296875, 19.921875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 8.0, 10.0, 14.0, 21.0, 26.0, 26.0, 42.0, 51.0, 101.0, 149.0, 253.0, 392.0, 854.0, 1488.0, 3040.0, 6595.0, 16415.0, 75739.0, 2829682.0, 172010.0, 22698.0, 8318.0, 3706.0, 1820.0, 972.0, 509.0, 272.0, 181.0, 92.0, 79.0, 36.0, 30.0, 24.0, 19.0, 9.0, 10.0, 5.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.859375, -28.91552734375, -27.9716796875, -27.02783203125, -26.083984375, -25.14013671875, -24.1962890625, -23.25244140625, -22.30859375, -21.36474609375, -20.4208984375, -19.47705078125, -18.533203125, -17.58935546875, -16.6455078125, -15.70166015625, -14.7578125, -13.81396484375, -12.8701171875, -11.92626953125, -10.982421875, -10.03857421875, -9.0947265625, -8.15087890625, -7.20703125, -6.26318359375, -5.3193359375, -4.37548828125, -3.431640625, -2.48779296875, -1.5439453125, -0.60009765625, 0.34375, 1.28759765625, 2.2314453125, 3.17529296875, 4.119140625, 5.06298828125, 6.0068359375, 6.95068359375, 7.89453125, 8.83837890625, 9.7822265625, 10.72607421875, 11.669921875, 12.61376953125, 13.5576171875, 14.50146484375, 15.4453125, 16.38916015625, 17.3330078125, 18.27685546875, 19.220703125, 20.16455078125, 21.1083984375, 22.05224609375, 22.99609375, 23.93994140625, 24.8837890625, 25.82763671875, 26.771484375, 27.71533203125, 28.6591796875, 29.60302734375, 30.546875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [23.0, 838.0, 155.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.15609359741211, -12.435873031616211, 5.2843475341796875, 23.004566192626953, 40.724788665771484, 58.445011138916016, 76.16522216796875, 93.88545227050781, 111.60566711425781, 129.3258819580078, 147.04611206054688, 164.76632690429688, 182.48654174804688, 200.20677185058594, 217.92698669433594, 235.647216796875, 253.367431640625, 271.087646484375, 288.807861328125, 306.528076171875, 324.2483215332031, 341.9685363769531, 359.6887512207031, 377.4089660644531, 395.12921142578125, 412.84942626953125, 430.56964111328125, 448.28985595703125, 466.0101013183594, 483.7303161621094, 501.4505310058594, 519.1707763671875, 536.8909301757812, 554.6111450195312, 572.3313598632812, 590.0515747070312, 607.7717895507812, 625.4920654296875, 643.2122802734375, 660.9324951171875, 678.6527099609375, 696.3729248046875, 714.0931396484375, 731.8133544921875, 749.5335693359375, 767.2537841796875, 784.9739990234375, 802.6942749023438, 820.4144287109375, 838.1346435546875, 855.8548583984375, 873.5750732421875, 891.2952880859375, 909.0155029296875, 926.7357177734375, 944.4559936523438, 962.1762084960938, 979.8964233398438, 997.6166381835938, 1015.3368530273438, 1033.05712890625, 1050.77734375, 1068.49755859375, 1086.2177734375, 1103.93798828125]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 5.0, 3.0, 5.0, 6.0, 11.0, 11.0, 10.0, 21.0, 11.0, 24.0, 20.0, 19.0, 27.0, 21.0, 31.0, 40.0, 30.0, 45.0, 40.0, 37.0, 39.0, 43.0, 37.0, 37.0, 37.0, 31.0, 36.0, 39.0, 26.0, 31.0, 25.0, 19.0, 26.0, 29.0, 25.0, 19.0, 17.0, 11.0, 13.0, 8.0, 8.0, 5.0, 6.0, 6.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.10598373413086, -56.234596252441406, -54.36320877075195, -52.4918212890625, -50.62043380737305, -48.749046325683594, -46.877655029296875, -45.00627136230469, -43.13488006591797, -41.263492584228516, -39.39210510253906, -37.52071762084961, -35.649330139160156, -33.7779426574707, -31.906553268432617, -30.035165786743164, -28.163780212402344, -26.29239273071289, -24.421005249023438, -22.549617767333984, -20.67823028564453, -18.806842803955078, -16.935453414916992, -15.064065933227539, -13.192678451538086, -11.321290969848633, -9.44990348815918, -7.57851505279541, -5.707127571105957, -3.835740089416504, -1.9643516540527344, -0.09296417236328125, 1.7784271240234375, 3.6498148441314697, 5.521202564239502, 7.392590522766113, 9.263978004455566, 11.13536548614502, 13.006753921508789, 14.878141403198242, 16.749528884887695, 18.62091636657715, 20.4923038482666, 22.363693237304688, 24.23508071899414, 26.106468200683594, 27.977855682373047, 29.8492431640625, 31.720630645751953, 33.592018127441406, 35.46340560913086, 37.33479309082031, 39.206180572509766, 41.07756805419922, 42.94895935058594, 44.820343017578125, 46.691734313964844, 48.5631217956543, 50.43450927734375, 52.3058967590332, 54.177284240722656, 56.04867172241211, 57.92005920410156, 59.79145050048828, 61.66283416748047]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 2.0, 11.0, 10.0, 8.0, 15.0, 13.0, 24.0, 19.0, 22.0, 28.0, 21.0, 27.0, 32.0, 33.0, 38.0, 39.0, 37.0, 36.0, 48.0, 44.0, 35.0, 45.0, 43.0, 30.0, 32.0, 32.0, 26.0, 29.0, 31.0, 24.0, 19.0, 20.0, 23.0, 18.0, 14.0, 10.0, 15.0, 10.0, 6.0, 9.0, 9.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.34588623046875, -5.1722412109375, -4.99859619140625, -4.824951171875, -4.65130615234375, -4.4776611328125, -4.30401611328125, -4.13037109375, -3.95672607421875, -3.7830810546875, -3.60943603515625, -3.435791015625, -3.26214599609375, -3.0885009765625, -2.91485595703125, -2.7412109375, -2.56756591796875, -2.3939208984375, -2.22027587890625, -2.046630859375, -1.87298583984375, -1.6993408203125, -1.52569580078125, -1.35205078125, -1.17840576171875, -1.0047607421875, -0.83111572265625, -0.657470703125, -0.48382568359375, -0.3101806640625, -0.13653564453125, 0.037109375, 0.21075439453125, 0.3843994140625, 0.55804443359375, 0.731689453125, 0.90533447265625, 1.0789794921875, 1.25262451171875, 1.42626953125, 1.59991455078125, 1.7735595703125, 1.94720458984375, 2.120849609375, 2.29449462890625, 2.4681396484375, 2.64178466796875, 2.8154296875, 2.98907470703125, 3.1627197265625, 3.33636474609375, 3.510009765625, 3.68365478515625, 3.8572998046875, 4.03094482421875, 4.20458984375, 4.37823486328125, 4.5518798828125, 4.72552490234375, 4.899169921875, 5.07281494140625, 5.2464599609375, 5.42010498046875, 5.59375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 11.0, 7.0, 9.0, 13.0, 20.0, 29.0, 52.0, 102.0, 144.0, 282.0, 539.0, 988.0, 2013.0, 4226.0, 10143.0, 26452.0, 97427.0, 1805913.0, 2092925.0, 105909.0, 28042.0, 10394.0, 4472.0, 1920.0, 1054.0, 507.0, 269.0, 153.0, 75.0, 59.0, 35.0, 32.0, 20.0, 15.0, 8.0, 3.0, 8.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.671875, -22.8271484375, -21.982421875, -21.1376953125, -20.29296875, -19.4482421875, -18.603515625, -17.7587890625, -16.9140625, -16.0693359375, -15.224609375, -14.3798828125, -13.53515625, -12.6904296875, -11.845703125, -11.0009765625, -10.15625, -9.3115234375, -8.466796875, -7.6220703125, -6.77734375, -5.9326171875, -5.087890625, -4.2431640625, -3.3984375, -2.5537109375, -1.708984375, -0.8642578125, -0.01953125, 0.8251953125, 1.669921875, 2.5146484375, 3.359375, 4.2041015625, 5.048828125, 5.8935546875, 6.73828125, 7.5830078125, 8.427734375, 9.2724609375, 10.1171875, 10.9619140625, 11.806640625, 12.6513671875, 13.49609375, 14.3408203125, 15.185546875, 16.0302734375, 16.875, 17.7197265625, 18.564453125, 19.4091796875, 20.25390625, 21.0986328125, 21.943359375, 22.7880859375, 23.6328125, 24.4775390625, 25.322265625, 26.1669921875, 27.01171875, 27.8564453125, 28.701171875, 29.5458984375, 30.390625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 11.0, 12.0, 10.0, 28.0, 26.0, 47.0, 65.0, 95.0, 122.0, 228.0, 348.0, 595.0, 783.0, 603.0, 400.0, 240.0, 147.0, 95.0, 47.0, 46.0, 35.0, 18.0, 26.0, 16.0, 6.0, 4.0, 10.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.328125, -15.63427734375, -14.9404296875, -14.24658203125, -13.552734375, -12.85888671875, -12.1650390625, -11.47119140625, -10.77734375, -10.08349609375, -9.3896484375, -8.69580078125, -8.001953125, -7.30810546875, -6.6142578125, -5.92041015625, -5.2265625, -4.53271484375, -3.8388671875, -3.14501953125, -2.451171875, -1.75732421875, -1.0634765625, -0.36962890625, 0.32421875, 1.01806640625, 1.7119140625, 2.40576171875, 3.099609375, 3.79345703125, 4.4873046875, 5.18115234375, 5.875, 6.56884765625, 7.2626953125, 7.95654296875, 8.650390625, 9.34423828125, 10.0380859375, 10.73193359375, 11.42578125, 12.11962890625, 12.8134765625, 13.50732421875, 14.201171875, 14.89501953125, 15.5888671875, 16.28271484375, 16.9765625, 17.67041015625, 18.3642578125, 19.05810546875, 19.751953125, 20.44580078125, 21.1396484375, 21.83349609375, 22.52734375, 23.22119140625, 23.9150390625, 24.60888671875, 25.302734375, 25.99658203125, 26.6904296875, 27.38427734375, 28.078125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 6.0, 12.0, 10.0, 11.0, 15.0, 31.0, 50.0, 67.0, 107.0, 202.0, 386.0, 757.0, 1468.0, 3340.0, 7570.0, 19028.0, 51094.0, 172584.0, 1372794.0, 2210842.0, 247825.0, 65421.0, 23484.0, 9376.0, 4040.0, 1832.0, 904.0, 411.0, 248.0, 145.0, 67.0, 50.0, 38.0, 22.0, 14.0, 8.0, 9.0, 8.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-34.875, -33.9599609375, -33.044921875, -32.1298828125, -31.21484375, -30.2998046875, -29.384765625, -28.4697265625, -27.5546875, -26.6396484375, -25.724609375, -24.8095703125, -23.89453125, -22.9794921875, -22.064453125, -21.1494140625, -20.234375, -19.3193359375, -18.404296875, -17.4892578125, -16.57421875, -15.6591796875, -14.744140625, -13.8291015625, -12.9140625, -11.9990234375, -11.083984375, -10.1689453125, -9.25390625, -8.3388671875, -7.423828125, -6.5087890625, -5.59375, -4.6787109375, -3.763671875, -2.8486328125, -1.93359375, -1.0185546875, -0.103515625, 0.8115234375, 1.7265625, 2.6416015625, 3.556640625, 4.4716796875, 5.38671875, 6.3017578125, 7.216796875, 8.1318359375, 9.046875, 9.9619140625, 10.876953125, 11.7919921875, 12.70703125, 13.6220703125, 14.537109375, 15.4521484375, 16.3671875, 17.2822265625, 18.197265625, 19.1123046875, 20.02734375, 20.9423828125, 21.857421875, 22.7724609375, 23.6875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 26.0, 28.0, 95.0, 112.0, 154.0, 197.0, 167.0, 104.0, 63.0, 25.0, 18.0, 10.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.56088256835938, -109.8447494506836, -104.12861633300781, -98.4124755859375, -92.69634246826172, -86.98020935058594, -81.26406860351562, -75.54793548583984, -69.83180236816406, -64.11566925048828, -58.399532318115234, -52.68339538574219, -46.967262268066406, -41.251129150390625, -35.53499221801758, -29.81885528564453, -24.10272216796875, -18.386587142944336, -12.670452117919922, -6.954317092895508, -1.2381820678710938, 4.47795295715332, 10.194087982177734, 15.910224914550781, 21.626358032226562, 27.342493057250977, 33.05862808227539, 38.77476501464844, 44.49089813232422, 50.20703125, 55.92316818237305, 61.639305114746094, 67.35545349121094, 73.07158660888672, 78.7877197265625, 84.50386047363281, 90.2199935913086, 95.93612670898438, 101.65226745605469, 107.36840057373047, 113.08453369140625, 118.80066680908203, 124.51679992675781, 130.23294067382812, 135.94906616210938, 141.6652069091797, 147.38134765625, 153.09747314453125, 158.81361389160156, 164.52975463867188, 170.24588012695312, 175.96202087402344, 181.67816162109375, 187.394287109375, 193.1104278564453, 198.82656860351562, 204.54269409179688, 210.2588348388672, 215.97496032714844, 221.69110107421875, 227.4072265625, 233.1233673095703, 238.83950805664062, 244.55563354492188, 250.2717742919922]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 10.0, 16.0, 19.0, 13.0, 15.0, 19.0, 34.0, 30.0, 25.0, 42.0, 36.0, 37.0, 36.0, 39.0, 44.0, 38.0, 53.0, 37.0, 55.0, 44.0, 35.0, 40.0, 38.0, 35.0, 17.0, 19.0, 20.0, 17.0, 25.0, 22.0, 10.0, 18.0, 7.0, 9.0, 5.0, 10.0, 4.0, 6.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.1502685546875, -53.32899475097656, -51.50772476196289, -49.68645095825195, -47.86518096923828, -46.043907165527344, -44.222633361816406, -42.40135955810547, -40.5800895690918, -38.75881576538086, -36.93754577636719, -35.11627197265625, -33.29499816894531, -31.47372817993164, -29.652454376220703, -27.8311824798584, -26.009910583496094, -24.18863868713379, -22.367366790771484, -20.546092987060547, -18.724821090698242, -16.903549194335938, -15.082276344299316, -13.261003494262695, -11.43973159790039, -9.618459701538086, -7.797186851501465, -5.975914478302002, -4.154642105102539, -2.3333702087402344, -0.5120973587036133, 1.3091754913330078, 3.1304473876953125, 4.951719760894775, 6.772992134094238, 8.59426498413086, 10.415536880493164, 12.236808776855469, 14.05808162689209, 15.879354476928711, 17.700626373291016, 19.52189826965332, 21.343170166015625, 23.164443969726562, 24.985715866088867, 26.806987762451172, 28.62826156616211, 30.449533462524414, 32.27080535888672, 34.092079162597656, 35.91334915161133, 37.734622955322266, 39.55589294433594, 41.377166748046875, 43.19844055175781, 45.01971435546875, 46.84098434448242, 48.66225814819336, 50.48352813720703, 52.30480194091797, 54.126075744628906, 55.94734573364258, 57.768619537353516, 59.58988952636719, 61.411163330078125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 8.0, 2.0, 2.0, 7.0, 8.0, 12.0, 16.0, 17.0, 17.0, 28.0, 27.0, 27.0, 24.0, 33.0, 34.0, 34.0, 42.0, 49.0, 39.0, 49.0, 36.0, 52.0, 40.0, 35.0, 37.0, 35.0, 40.0, 32.0, 27.0, 25.0, 24.0, 27.0, 12.0, 26.0, 17.0, 14.0, 9.0, 4.0, 6.0, 8.0, 8.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.6015625, -6.40594482421875, -6.2103271484375, -6.01470947265625, -5.819091796875, -5.62347412109375, -5.4278564453125, -5.23223876953125, -5.03662109375, -4.84100341796875, -4.6453857421875, -4.44976806640625, -4.254150390625, -4.05853271484375, -3.8629150390625, -3.66729736328125, -3.4716796875, -3.27606201171875, -3.0804443359375, -2.88482666015625, -2.689208984375, -2.49359130859375, -2.2979736328125, -2.10235595703125, -1.90673828125, -1.71112060546875, -1.5155029296875, -1.31988525390625, -1.124267578125, -0.92864990234375, -0.7330322265625, -0.53741455078125, -0.341796875, -0.14617919921875, 0.0494384765625, 0.24505615234375, 0.440673828125, 0.63629150390625, 0.8319091796875, 1.02752685546875, 1.22314453125, 1.41876220703125, 1.6143798828125, 1.80999755859375, 2.005615234375, 2.20123291015625, 2.3968505859375, 2.59246826171875, 2.7880859375, 2.98370361328125, 3.1793212890625, 3.37493896484375, 3.570556640625, 3.76617431640625, 3.9617919921875, 4.15740966796875, 4.35302734375, 4.54864501953125, 4.7442626953125, 4.93988037109375, 5.135498046875, 5.33111572265625, 5.5267333984375, 5.72235107421875, 5.91796875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 9.0, 21.0, 29.0, 46.0, 66.0, 96.0, 156.0, 262.0, 410.0, 667.0, 1117.0, 1983.0, 3221.0, 5633.0, 10150.0, 18607.0, 35083.0, 70112.0, 142614.0, 265691.0, 239743.0, 123494.0, 60715.0, 31063.0, 16100.0, 9126.0, 5044.0, 2913.0, 1675.0, 1085.0, 624.0, 336.0, 256.0, 148.0, 92.0, 55.0, 40.0, 17.0, 12.0, 19.0, 9.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.072265625, -1.0396728515625, -1.007080078125, -0.9744873046875, -0.94189453125, -0.9093017578125, -0.876708984375, -0.8441162109375, -0.8115234375, -0.7789306640625, -0.746337890625, -0.7137451171875, -0.68115234375, -0.6485595703125, -0.615966796875, -0.5833740234375, -0.55078125, -0.5181884765625, -0.485595703125, -0.4530029296875, -0.42041015625, -0.3878173828125, -0.355224609375, -0.3226318359375, -0.2900390625, -0.2574462890625, -0.224853515625, -0.1922607421875, -0.15966796875, -0.1270751953125, -0.094482421875, -0.0618896484375, -0.029296875, 0.0032958984375, 0.035888671875, 0.0684814453125, 0.10107421875, 0.1336669921875, 0.166259765625, 0.1988525390625, 0.2314453125, 0.2640380859375, 0.296630859375, 0.3292236328125, 0.36181640625, 0.3944091796875, 0.427001953125, 0.4595947265625, 0.4921875, 0.5247802734375, 0.557373046875, 0.5899658203125, 0.62255859375, 0.6551513671875, 0.687744140625, 0.7203369140625, 0.7529296875, 0.7855224609375, 0.818115234375, 0.8507080078125, 0.88330078125, 0.9158935546875, 0.948486328125, 0.9810791015625, 1.013671875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 4.0, 7.0, 4.0, 10.0, 4.0, 8.0, 11.0, 16.0, 8.0, 17.0, 19.0, 22.0, 22.0, 24.0, 33.0, 43.0, 35.0, 37.0, 33.0, 34.0, 40.0, 34.0, 1062.0, 57.0, 31.0, 41.0, 30.0, 47.0, 38.0, 34.0, 33.0, 27.0, 20.0, 24.0, 24.0, 11.0, 15.0, 14.0, 16.0, 8.0, 7.0, 4.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.12109375, -3.99267578125, -3.8642578125, -3.73583984375, -3.607421875, -3.47900390625, -3.3505859375, -3.22216796875, -3.09375, -2.96533203125, -2.8369140625, -2.70849609375, -2.580078125, -2.45166015625, -2.3232421875, -2.19482421875, -2.06640625, -1.93798828125, -1.8095703125, -1.68115234375, -1.552734375, -1.42431640625, -1.2958984375, -1.16748046875, -1.0390625, -0.91064453125, -0.7822265625, -0.65380859375, -0.525390625, -0.39697265625, -0.2685546875, -0.14013671875, -0.01171875, 0.11669921875, 0.2451171875, 0.37353515625, 0.501953125, 0.63037109375, 0.7587890625, 0.88720703125, 1.015625, 1.14404296875, 1.2724609375, 1.40087890625, 1.529296875, 1.65771484375, 1.7861328125, 1.91455078125, 2.04296875, 2.17138671875, 2.2998046875, 2.42822265625, 2.556640625, 2.68505859375, 2.8134765625, 2.94189453125, 3.0703125, 3.19873046875, 3.3271484375, 3.45556640625, 3.583984375, 3.71240234375, 3.8408203125, 3.96923828125, 4.09765625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 19.0, 39.0, 46.0, 69.0, 93.0, 144.0, 256.0, 408.0, 650.0, 888.0, 1467.0, 2379.0, 3718.0, 5644.0, 9121.0, 14783.0, 24456.0, 39420.0, 68037.0, 120006.0, 318229.0, 1120238.0, 156727.0, 83833.0, 49084.0, 29167.0, 17876.0, 11330.0, 6892.0, 4430.0, 2691.0, 1819.0, 1153.0, 722.0, 481.0, 299.0, 189.0, 112.0, 71.0, 55.0, 30.0, 23.0, 14.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.342041015625, -0.3303260803222656, -0.31861114501953125, -0.3068962097167969, -0.2951812744140625, -0.2834663391113281, -0.27175140380859375, -0.2600364685058594, -0.248321533203125, -0.23660659790039062, -0.22489166259765625, -0.21317672729492188, -0.2014617919921875, -0.18974685668945312, -0.17803192138671875, -0.16631698608398438, -0.15460205078125, -0.14288711547851562, -0.13117218017578125, -0.11945724487304688, -0.1077423095703125, -0.09602737426757812, -0.08431243896484375, -0.07259750366210938, -0.060882568359375, -0.049167633056640625, -0.03745269775390625, -0.025737762451171875, -0.0140228271484375, -0.002307891845703125, 0.00940704345703125, 0.021121978759765625, 0.0328369140625, 0.044551849365234375, 0.05626678466796875, 0.06798171997070312, 0.0796966552734375, 0.09141159057617188, 0.10312652587890625, 0.11484146118164062, 0.126556396484375, 0.13827133178710938, 0.14998626708984375, 0.16170120239257812, 0.1734161376953125, 0.18513107299804688, 0.19684600830078125, 0.20856094360351562, 0.22027587890625, 0.23199081420898438, 0.24370574951171875, 0.2554206848144531, 0.2671356201171875, 0.2788505554199219, 0.29056549072265625, 0.3022804260253906, 0.313995361328125, 0.3257102966308594, 0.33742523193359375, 0.3491401672363281, 0.3608551025390625, 0.3725700378417969, 0.38428497314453125, 0.3959999084472656, 0.40771484375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 6.0, 8.0, 13.0, 14.0, 14.0, 21.0, 33.0, 45.0, 37.0, 68.0, 78.0, 64.0, 78.0, 79.0, 88.0, 64.0, 57.0, 59.0, 33.0, 24.0, 16.0, 22.0, 11.0, 8.0, 11.0, 3.0, 4.0, 7.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0], "bins": [-0.1048583984375, -0.1016702651977539, -0.09848213195800781, -0.09529399871826172, -0.09210586547851562, -0.08891773223876953, -0.08572959899902344, -0.08254146575927734, -0.07935333251953125, -0.07616519927978516, -0.07297706604003906, -0.06978893280029297, -0.06660079956054688, -0.06341266632080078, -0.06022453308105469, -0.057036399841308594, -0.0538482666015625, -0.050660133361816406, -0.04747200012207031, -0.04428386688232422, -0.041095733642578125, -0.03790760040283203, -0.03471946716308594, -0.031531333923339844, -0.02834320068359375, -0.025155067443847656, -0.021966934204101562, -0.01877880096435547, -0.015590667724609375, -0.012402534484863281, -0.009214401245117188, -0.006026268005371094, -0.002838134765625, 0.00034999847412109375, 0.0035381317138671875, 0.006726264953613281, 0.009914398193359375, 0.013102531433105469, 0.016290664672851562, 0.019478797912597656, 0.02266693115234375, 0.025855064392089844, 0.029043197631835938, 0.03223133087158203, 0.035419464111328125, 0.03860759735107422, 0.04179573059082031, 0.044983863830566406, 0.0481719970703125, 0.051360130310058594, 0.05454826354980469, 0.05773639678955078, 0.060924530029296875, 0.06411266326904297, 0.06730079650878906, 0.07048892974853516, 0.07367706298828125, 0.07686519622802734, 0.08005332946777344, 0.08324146270751953, 0.08642959594726562, 0.08961772918701172, 0.09280586242675781, 0.0959939956665039, 0.09918212890625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 4.0, 5.0, 4.0, 8.0, 3.0, 15.0, 11.0, 17.0, 31.0, 32.0, 46.0, 82.0, 126.0, 196.0, 562.0, 5405.0, 993088.0, 46770.0, 1365.0, 289.0, 169.0, 96.0, 57.0, 47.0, 36.0, 15.0, 14.0, 11.0, 11.0, 7.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.0703125, -2.005096435546875, -1.93988037109375, -1.874664306640625, -1.8094482421875, -1.744232177734375, -1.67901611328125, -1.613800048828125, -1.548583984375, -1.483367919921875, -1.41815185546875, -1.352935791015625, -1.2877197265625, -1.222503662109375, -1.15728759765625, -1.092071533203125, -1.02685546875, -0.961639404296875, -0.89642333984375, -0.831207275390625, -0.7659912109375, -0.700775146484375, -0.63555908203125, -0.570343017578125, -0.505126953125, -0.439910888671875, -0.37469482421875, -0.309478759765625, -0.2442626953125, -0.179046630859375, -0.11383056640625, -0.048614501953125, 0.0166015625, 0.081817626953125, 0.14703369140625, 0.212249755859375, 0.2774658203125, 0.342681884765625, 0.40789794921875, 0.473114013671875, 0.538330078125, 0.603546142578125, 0.66876220703125, 0.733978271484375, 0.7991943359375, 0.864410400390625, 0.92962646484375, 0.994842529296875, 1.06005859375, 1.125274658203125, 1.19049072265625, 1.255706787109375, 1.3209228515625, 1.386138916015625, 1.45135498046875, 1.516571044921875, 1.581787109375, 1.647003173828125, 1.71221923828125, 1.777435302734375, 1.8426513671875, 1.907867431640625, 1.97308349609375, 2.038299560546875, 2.103515625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 15.0, 17.0, 29.0, 43.0, 64.0, 112.0, 278.0, 185.0, 102.0, 56.0, 33.0, 16.0, 16.0, 6.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19301098585128784, -0.1807277500629425, -0.16844452917575836, -0.15616129338741302, -0.14387807250022888, -0.13159483671188354, -0.11931160092353821, -0.10702837258577347, -0.09474514424800873, -0.08246191591024399, -0.07017868757247925, -0.05789545178413391, -0.04561222344636917, -0.03332899510860443, -0.021045759320259094, -0.008762530982494354, 0.0035206973552703857, 0.015803927555680275, 0.028087157756090164, 0.0403703898191452, 0.05265361815690994, 0.06493684649467468, 0.07722008228302002, 0.08950331062078476, 0.1017865389585495, 0.11406976729631424, 0.12635299563407898, 0.13863623142242432, 0.15091946721076965, 0.1632026880979538, 0.17548592388629913, 0.18776914477348328, 0.2000523805618286, 0.21233561635017395, 0.2246188372373581, 0.23690207302570343, 0.24918529391288757, 0.2614685297012329, 0.27375176548957825, 0.2860350012779236, 0.29831820726394653, 0.31060144305229187, 0.3228846788406372, 0.33516788482666016, 0.3474511206150055, 0.35973435640335083, 0.37201759219169617, 0.3843008279800415, 0.39658406376838684, 0.4088672995567322, 0.4211505353450775, 0.43343377113342285, 0.4457169771194458, 0.45800021290779114, 0.4702834486961365, 0.4825666844844818, 0.49484992027282715, 0.5071331262588501, 0.5194163918495178, 0.5316995978355408, 0.5439828634262085, 0.5562660694122314, 0.5685492753982544, 0.5808325409889221, 0.5931157469749451]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 5.0, 6.0, 5.0, 12.0, 12.0, 9.0, 14.0, 11.0, 16.0, 19.0, 14.0, 20.0, 25.0, 23.0, 29.0, 41.0, 31.0, 39.0, 28.0, 46.0, 42.0, 42.0, 30.0, 34.0, 31.0, 37.0, 26.0, 35.0, 23.0, 43.0, 22.0, 29.0, 23.0, 23.0, 20.0, 22.0, 15.0, 15.0, 20.0, 12.0, 6.0, 10.0, 4.0, 8.0, 7.0, 1.0, 2.0, 5.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.2616593837738037, -0.2540225386619568, -0.24638566374778748, -0.23874881863594055, -0.23111195862293243, -0.22347509860992432, -0.2158382534980774, -0.20820139348506927, -0.20056453347206116, -0.19292767345905304, -0.18529081344604492, -0.177653968334198, -0.17001710832118988, -0.16238024830818176, -0.15474340319633484, -0.14710654318332672, -0.1394696831703186, -0.13183282315731049, -0.12419597059488297, -0.11655911803245544, -0.10892225801944733, -0.10128539800643921, -0.09364854544401169, -0.08601169288158417, -0.07837483286857605, -0.07073797285556793, -0.06310112029314041, -0.05546426400542259, -0.04782740771770477, -0.040190551429986954, -0.032553695142269135, -0.024916838854551315, -0.017279982566833496, -0.009643126279115677, -0.0020062699913978577, 0.0056305862963199615, 0.01326744258403778, 0.0209042988717556, 0.02854115515947342, 0.03617801144719124, 0.04381486773490906, 0.05145172402262688, 0.059088580310344696, 0.06672543287277222, 0.07436229288578033, 0.08199915289878845, 0.08963600546121597, 0.0972728580236435, 0.10490971803665161, 0.11254657804965973, 0.12018343061208725, 0.12782028317451477, 0.1354571431875229, 0.143094003200531, 0.15073084831237793, 0.15836770832538605, 0.16600456833839417, 0.17364142835140228, 0.1812782883644104, 0.18891513347625732, 0.19655199348926544, 0.20418885350227356, 0.21182569861412048, 0.2194625586271286, 0.22709941864013672]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 7.0, 3.0, 2.0, 7.0, 7.0, 12.0, 17.0, 17.0, 15.0, 29.0, 27.0, 27.0, 24.0, 30.0, 38.0, 34.0, 38.0, 52.0, 37.0, 50.0, 36.0, 53.0, 40.0, 35.0, 35.0, 38.0, 40.0, 32.0, 27.0, 24.0, 24.0, 27.0, 13.0, 26.0, 16.0, 15.0, 8.0, 5.0, 6.0, 8.0, 7.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.61328125, -6.41754150390625, -6.2218017578125, -6.02606201171875, -5.830322265625, -5.63458251953125, -5.4388427734375, -5.24310302734375, -5.04736328125, -4.85162353515625, -4.6558837890625, -4.46014404296875, -4.264404296875, -4.06866455078125, -3.8729248046875, -3.67718505859375, -3.4814453125, -3.28570556640625, -3.0899658203125, -2.89422607421875, -2.698486328125, -2.50274658203125, -2.3070068359375, -2.11126708984375, -1.91552734375, -1.71978759765625, -1.5240478515625, -1.32830810546875, -1.132568359375, -0.93682861328125, -0.7410888671875, -0.54534912109375, -0.349609375, -0.15386962890625, 0.0418701171875, 0.23760986328125, 0.433349609375, 0.62908935546875, 0.8248291015625, 1.02056884765625, 1.21630859375, 1.41204833984375, 1.6077880859375, 1.80352783203125, 1.999267578125, 2.19500732421875, 2.3907470703125, 2.58648681640625, 2.7822265625, 2.97796630859375, 3.1737060546875, 3.36944580078125, 3.565185546875, 3.76092529296875, 3.9566650390625, 4.15240478515625, 4.34814453125, 4.54388427734375, 4.7396240234375, 4.93536376953125, 5.131103515625, 5.32684326171875, 5.5225830078125, 5.71832275390625, 5.9140625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 1.0, 11.0, 19.0, 24.0, 28.0, 45.0, 59.0, 92.0, 163.0, 211.0, 334.0, 491.0, 676.0, 1008.0, 1475.0, 2145.0, 3230.0, 5312.0, 11837.0, 54249.0, 624269.0, 291217.0, 29684.0, 8605.0, 4458.0, 2890.0, 1896.0, 1265.0, 940.0, 594.0, 456.0, 277.0, 183.0, 138.0, 81.0, 52.0, 54.0, 32.0, 13.0, 15.0, 12.0, 8.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.9375, -14.453125, -13.96875, -13.484375, -13.0, -12.515625, -12.03125, -11.546875, -11.0625, -10.578125, -10.09375, -9.609375, -9.125, -8.640625, -8.15625, -7.671875, -7.1875, -6.703125, -6.21875, -5.734375, -5.25, -4.765625, -4.28125, -3.796875, -3.3125, -2.828125, -2.34375, -1.859375, -1.375, -0.890625, -0.40625, 0.078125, 0.5625, 1.046875, 1.53125, 2.015625, 2.5, 2.984375, 3.46875, 3.953125, 4.4375, 4.921875, 5.40625, 5.890625, 6.375, 6.859375, 7.34375, 7.828125, 8.3125, 8.796875, 9.28125, 9.765625, 10.25, 10.734375, 11.21875, 11.703125, 12.1875, 12.671875, 13.15625, 13.640625, 14.125, 14.609375, 15.09375, 15.578125, 16.0625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 1.0, 3.0, 5.0, 9.0, 6.0, 6.0, 6.0, 11.0, 10.0, 16.0, 14.0, 17.0, 23.0, 19.0, 23.0, 17.0, 32.0, 34.0, 30.0, 49.0, 40.0, 53.0, 97.0, 189.0, 1487.0, 283.0, 108.0, 69.0, 52.0, 44.0, 45.0, 25.0, 34.0, 27.0, 26.0, 24.0, 18.0, 17.0, 12.0, 11.0, 22.0, 5.0, 9.0, 6.0, 5.0, 3.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0], "bins": [-21.46875, -20.866943359375, -20.26513671875, -19.663330078125, -19.0615234375, -18.459716796875, -17.85791015625, -17.256103515625, -16.654296875, -16.052490234375, -15.45068359375, -14.848876953125, -14.2470703125, -13.645263671875, -13.04345703125, -12.441650390625, -11.83984375, -11.238037109375, -10.63623046875, -10.034423828125, -9.4326171875, -8.830810546875, -8.22900390625, -7.627197265625, -7.025390625, -6.423583984375, -5.82177734375, -5.219970703125, -4.6181640625, -4.016357421875, -3.41455078125, -2.812744140625, -2.2109375, -1.609130859375, -1.00732421875, -0.405517578125, 0.1962890625, 0.798095703125, 1.39990234375, 2.001708984375, 2.603515625, 3.205322265625, 3.80712890625, 4.408935546875, 5.0107421875, 5.612548828125, 6.21435546875, 6.816162109375, 7.41796875, 8.019775390625, 8.62158203125, 9.223388671875, 9.8251953125, 10.427001953125, 11.02880859375, 11.630615234375, 12.232421875, 12.834228515625, 13.43603515625, 14.037841796875, 14.6396484375, 15.241455078125, 15.84326171875, 16.445068359375, 17.046875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 4.0, 6.0, 9.0, 10.0, 11.0, 19.0, 10.0, 12.0, 28.0, 39.0, 49.0, 70.0, 91.0, 156.0, 253.0, 506.0, 1023.0, 2720.0, 8317.0, 43147.0, 2194949.0, 854143.0, 29294.0, 6442.0, 2293.0, 907.0, 447.0, 240.0, 130.0, 96.0, 56.0, 43.0, 41.0, 30.0, 19.0, 20.0, 14.0, 15.0, 5.0, 7.0, 5.0, 9.0, 7.0, 5.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.40625, -26.42431640625, -25.4423828125, -24.46044921875, -23.478515625, -22.49658203125, -21.5146484375, -20.53271484375, -19.55078125, -18.56884765625, -17.5869140625, -16.60498046875, -15.623046875, -14.64111328125, -13.6591796875, -12.67724609375, -11.6953125, -10.71337890625, -9.7314453125, -8.74951171875, -7.767578125, -6.78564453125, -5.8037109375, -4.82177734375, -3.83984375, -2.85791015625, -1.8759765625, -0.89404296875, 0.087890625, 1.06982421875, 2.0517578125, 3.03369140625, 4.015625, 4.99755859375, 5.9794921875, 6.96142578125, 7.943359375, 8.92529296875, 9.9072265625, 10.88916015625, 11.87109375, 12.85302734375, 13.8349609375, 14.81689453125, 15.798828125, 16.78076171875, 17.7626953125, 18.74462890625, 19.7265625, 20.70849609375, 21.6904296875, 22.67236328125, 23.654296875, 24.63623046875, 25.6181640625, 26.60009765625, 27.58203125, 28.56396484375, 29.5458984375, 30.52783203125, 31.509765625, 32.49169921875, 33.4736328125, 34.45556640625, 35.4375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 10.0, 11.0, 29.0, 29.0, 46.0, 73.0, 117.0, 129.0, 115.0, 115.0, 97.0, 80.0, 59.0, 48.0, 22.0, 8.0, 9.0, 6.0, 1.0, 3.0, 0.0, 1.0], "bins": [-71.45100402832031, -70.0322494506836, -68.6135025024414, -67.19474792480469, -65.7760009765625, -64.35724639892578, -62.938499450683594, -61.51974868774414, -60.10099792480469, -58.682247161865234, -57.26349639892578, -55.84474563598633, -54.425994873046875, -53.00724411010742, -51.58849334716797, -50.169742584228516, -48.75099182128906, -47.33224105834961, -45.913490295410156, -44.4947395324707, -43.07598876953125, -41.6572380065918, -40.238487243652344, -38.81973648071289, -37.40098190307617, -35.98223114013672, -34.563480377197266, -33.14472961425781, -31.72597885131836, -30.307228088378906, -28.888477325439453, -27.4697265625, -26.05097770690918, -24.632226943969727, -23.213476181030273, -21.79472541809082, -20.375974655151367, -18.957223892211914, -17.538471221923828, -16.119720458984375, -14.700970649719238, -13.282219886779785, -11.863469123840332, -10.444717407226562, -9.02596664428711, -7.6072163581848145, -6.188465118408203, -4.76971435546875, -3.350963592529297, -1.9322127103805542, -0.5134618282318115, 0.9052891731262207, 2.324039936065674, 3.742790699005127, 5.161541938781738, 6.580292701721191, 7.9990434646606445, 9.417794227600098, 10.83654499053955, 12.25529670715332, 13.674047470092773, 15.092798233032227, 16.51154899597168, 17.930299758911133, 19.349050521850586]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 7.0, 6.0, 16.0, 10.0, 17.0, 18.0, 18.0, 17.0, 21.0, 26.0, 30.0, 23.0, 34.0, 34.0, 32.0, 40.0, 28.0, 34.0, 36.0, 36.0, 35.0, 47.0, 36.0, 40.0, 40.0, 35.0, 36.0, 31.0, 34.0, 31.0, 20.0, 25.0, 16.0, 16.0, 9.0, 12.0, 7.0, 7.0, 5.0, 7.0, 6.0, 5.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-57.27606201171875, -55.533939361572266, -53.79182052612305, -52.04969787597656, -50.307579040527344, -48.56545639038086, -46.823333740234375, -45.081214904785156, -43.33909225463867, -41.59696960449219, -39.85485076904297, -38.112728118896484, -36.37060546875, -34.62848663330078, -32.8863639831543, -31.144243240356445, -29.402122497558594, -27.660001754760742, -25.91788101196289, -24.175758361816406, -22.433637619018555, -20.691516876220703, -18.94939422607422, -17.207273483276367, -15.465152740478516, -13.723031997680664, -11.980910301208496, -10.238788604736328, -8.496667861938477, -6.754547119140625, -5.012425422668457, -3.270303726196289, -1.5281829833984375, 0.21393823623657227, 1.956059455871582, 3.698180675506592, 5.440301895141602, 7.182422637939453, 8.924544334411621, 10.666666030883789, 12.40878677368164, 14.150907516479492, 15.89302921295166, 17.635150909423828, 19.37727165222168, 21.11939239501953, 22.861515045166016, 24.603635787963867, 26.34575653076172, 28.08787727355957, 29.829998016357422, 31.572120666503906, 33.314239501953125, 35.05636215209961, 36.798484802246094, 38.54060363769531, 40.2827262878418, 42.02484893798828, 43.7669677734375, 45.509090423583984, 47.25121307373047, 48.99333190917969, 50.73545455932617, 52.477577209472656, 54.219696044921875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 4.0, 5.0, 2.0, 9.0, 9.0, 12.0, 14.0, 19.0, 28.0, 20.0, 26.0, 31.0, 23.0, 25.0, 36.0, 40.0, 34.0, 50.0, 41.0, 59.0, 43.0, 42.0, 36.0, 37.0, 34.0, 32.0, 40.0, 33.0, 26.0, 24.0, 25.0, 24.0, 26.0, 18.0, 16.0, 12.0, 6.0, 6.0, 4.0, 5.0, 8.0, 8.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.03515625, -6.8370361328125, -6.638916015625, -6.4407958984375, -6.24267578125, -6.0445556640625, -5.846435546875, -5.6483154296875, -5.4501953125, -5.2520751953125, -5.053955078125, -4.8558349609375, -4.65771484375, -4.4595947265625, -4.261474609375, -4.0633544921875, -3.865234375, -3.6671142578125, -3.468994140625, -3.2708740234375, -3.07275390625, -2.8746337890625, -2.676513671875, -2.4783935546875, -2.2802734375, -2.0821533203125, -1.884033203125, -1.6859130859375, -1.48779296875, -1.2896728515625, -1.091552734375, -0.8934326171875, -0.6953125, -0.4971923828125, -0.299072265625, -0.1009521484375, 0.09716796875, 0.2952880859375, 0.493408203125, 0.6915283203125, 0.8896484375, 1.0877685546875, 1.285888671875, 1.4840087890625, 1.68212890625, 1.8802490234375, 2.078369140625, 2.2764892578125, 2.474609375, 2.6727294921875, 2.870849609375, 3.0689697265625, 3.26708984375, 3.4652099609375, 3.663330078125, 3.8614501953125, 4.0595703125, 4.2576904296875, 4.455810546875, 4.6539306640625, 4.85205078125, 5.0501708984375, 5.248291015625, 5.4464111328125, 5.64453125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 8.0, 13.0, 18.0, 24.0, 34.0, 42.0, 62.0, 97.0, 159.0, 211.0, 365.0, 533.0, 866.0, 1494.0, 2693.0, 4783.0, 9357.0, 20046.0, 49415.0, 206343.0, 2092413.0, 1571433.0, 154918.0, 42346.0, 17741.0, 8435.0, 4417.0, 2365.0, 1331.0, 846.0, 527.0, 335.0, 180.0, 137.0, 87.0, 67.0, 38.0, 36.0, 16.0, 11.0, 14.0, 9.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.125, -16.552734375, -15.98046875, -15.408203125, -14.8359375, -14.263671875, -13.69140625, -13.119140625, -12.546875, -11.974609375, -11.40234375, -10.830078125, -10.2578125, -9.685546875, -9.11328125, -8.541015625, -7.96875, -7.396484375, -6.82421875, -6.251953125, -5.6796875, -5.107421875, -4.53515625, -3.962890625, -3.390625, -2.818359375, -2.24609375, -1.673828125, -1.1015625, -0.529296875, 0.04296875, 0.615234375, 1.1875, 1.759765625, 2.33203125, 2.904296875, 3.4765625, 4.048828125, 4.62109375, 5.193359375, 5.765625, 6.337890625, 6.91015625, 7.482421875, 8.0546875, 8.626953125, 9.19921875, 9.771484375, 10.34375, 10.916015625, 11.48828125, 12.060546875, 12.6328125, 13.205078125, 13.77734375, 14.349609375, 14.921875, 15.494140625, 16.06640625, 16.638671875, 17.2109375, 17.783203125, 18.35546875, 18.927734375, 19.5]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 1.0, 5.0, 4.0, 10.0, 11.0, 13.0, 14.0, 17.0, 36.0, 45.0, 45.0, 65.0, 95.0, 128.0, 181.0, 276.0, 419.0, 558.0, 613.0, 457.0, 336.0, 196.0, 151.0, 98.0, 82.0, 50.0, 44.0, 28.0, 26.0, 13.0, 20.0, 13.0, 4.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.265625, -16.712158203125, -16.15869140625, -15.605224609375, -15.0517578125, -14.498291015625, -13.94482421875, -13.391357421875, -12.837890625, -12.284423828125, -11.73095703125, -11.177490234375, -10.6240234375, -10.070556640625, -9.51708984375, -8.963623046875, -8.41015625, -7.856689453125, -7.30322265625, -6.749755859375, -6.1962890625, -5.642822265625, -5.08935546875, -4.535888671875, -3.982421875, -3.428955078125, -2.87548828125, -2.322021484375, -1.7685546875, -1.215087890625, -0.66162109375, -0.108154296875, 0.4453125, 0.998779296875, 1.55224609375, 2.105712890625, 2.6591796875, 3.212646484375, 3.76611328125, 4.319580078125, 4.873046875, 5.426513671875, 5.97998046875, 6.533447265625, 7.0869140625, 7.640380859375, 8.19384765625, 8.747314453125, 9.30078125, 9.854248046875, 10.40771484375, 10.961181640625, 11.5146484375, 12.068115234375, 12.62158203125, 13.175048828125, 13.728515625, 14.281982421875, 14.83544921875, 15.388916015625, 15.9423828125, 16.495849609375, 17.04931640625, 17.602783203125, 18.15625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 8.0, 25.0, 24.0, 44.0, 69.0, 99.0, 174.0, 252.0, 498.0, 813.0, 1450.0, 2621.0, 4954.0, 9908.0, 20682.0, 47786.0, 134025.0, 644431.0, 2510797.0, 599983.0, 129101.0, 46126.0, 20149.0, 9595.0, 4754.0, 2493.0, 1413.0, 788.0, 453.0, 296.0, 159.0, 117.0, 68.0, 46.0, 23.0, 24.0, 8.0, 7.0, 3.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.953125, -25.2216796875, -24.490234375, -23.7587890625, -23.02734375, -22.2958984375, -21.564453125, -20.8330078125, -20.1015625, -19.3701171875, -18.638671875, -17.9072265625, -17.17578125, -16.4443359375, -15.712890625, -14.9814453125, -14.25, -13.5185546875, -12.787109375, -12.0556640625, -11.32421875, -10.5927734375, -9.861328125, -9.1298828125, -8.3984375, -7.6669921875, -6.935546875, -6.2041015625, -5.47265625, -4.7412109375, -4.009765625, -3.2783203125, -2.546875, -1.8154296875, -1.083984375, -0.3525390625, 0.37890625, 1.1103515625, 1.841796875, 2.5732421875, 3.3046875, 4.0361328125, 4.767578125, 5.4990234375, 6.23046875, 6.9619140625, 7.693359375, 8.4248046875, 9.15625, 9.8876953125, 10.619140625, 11.3505859375, 12.08203125, 12.8134765625, 13.544921875, 14.2763671875, 15.0078125, 15.7392578125, 16.470703125, 17.2021484375, 17.93359375, 18.6650390625, 19.396484375, 20.1279296875, 20.859375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 6.0, 9.0, 11.0, 17.0, 22.0, 31.0, 40.0, 59.0, 58.0, 82.0, 93.0, 99.0, 87.0, 89.0, 81.0, 56.0, 53.0, 25.0, 21.0, 18.0, 14.0, 7.0, 7.0, 5.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.526580810546875, -48.63359451293945, -45.74060821533203, -42.84762191772461, -39.95463562011719, -37.061649322509766, -34.168663024902344, -31.275676727294922, -28.3826904296875, -25.489704132080078, -22.596717834472656, -19.703731536865234, -16.810745239257812, -13.91775894165039, -11.024772644042969, -8.131786346435547, -5.238800048828125, -2.345813751220703, 0.5471725463867188, 3.4401588439941406, 6.3331451416015625, 9.226131439208984, 12.119117736816406, 15.012104034423828, 17.90509033203125, 20.798076629638672, 23.691062927246094, 26.584049224853516, 29.477035522460938, 32.37002182006836, 35.26300811767578, 38.1559944152832, 41.048980712890625, 43.94196701049805, 46.83495330810547, 49.72793960571289, 52.62092590332031, 55.513912200927734, 58.406898498535156, 61.29988479614258, 64.19287109375, 67.08586120605469, 69.97884368896484, 72.871826171875, 75.76481628417969, 78.65780639648438, 81.55078887939453, 84.44377136230469, 87.33676147460938, 90.22975158691406, 93.12273406982422, 96.01571655273438, 98.90870666503906, 101.80169677734375, 104.6946792602539, 107.58766174316406, 110.48065185546875, 113.37364196777344, 116.2666244506836, 119.15960693359375, 122.05259704589844, 124.94558715820312, 127.83856964111328, 130.73155212402344, 133.62454223632812]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 6.0, 5.0, 11.0, 9.0, 6.0, 15.0, 20.0, 18.0, 24.0, 29.0, 31.0, 34.0, 40.0, 36.0, 53.0, 39.0, 54.0, 55.0, 57.0, 52.0, 45.0, 44.0, 43.0, 42.0, 40.0, 31.0, 21.0, 31.0, 28.0, 23.0, 16.0, 9.0, 8.0, 4.0, 7.0, 5.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.716678619384766, -57.68655014038086, -55.65642166137695, -53.62629318237305, -51.59616470336914, -49.566036224365234, -47.535911560058594, -45.50578308105469, -43.47565460205078, -41.445526123046875, -39.41539764404297, -37.38526916503906, -35.355140686035156, -33.32501220703125, -31.294885635375977, -29.26475715637207, -27.23462677001953, -25.204498291015625, -23.17436981201172, -21.144241333007812, -19.114112854003906, -17.083984375, -15.053857803344727, -13.02372932434082, -10.993600845336914, -8.963472366333008, -6.93334436416626, -4.903216361999512, -2.8730878829956055, -0.8429594039916992, 1.1871681213378906, 3.217296600341797, 5.247428894042969, 7.277557373046875, 9.307685852050781, 11.337813377380371, 13.367941856384277, 15.398070335388184, 17.428197860717773, 19.45832633972168, 21.488454818725586, 23.518583297729492, 25.5487117767334, 27.578838348388672, 29.608966827392578, 31.639095306396484, 33.66922378540039, 35.6993522644043, 37.7294807434082, 39.75960922241211, 41.789737701416016, 43.81986618041992, 45.84999465942383, 47.880123138427734, 49.910247802734375, 51.94037628173828, 53.97050476074219, 56.000633239746094, 58.03076171875, 60.060890197753906, 62.09101867675781, 64.12114715576172, 66.15127563476562, 68.18140411376953, 70.21153259277344]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 4.0, 10.0, 10.0, 7.0, 11.0, 13.0, 12.0, 12.0, 18.0, 22.0, 29.0, 38.0, 33.0, 28.0, 39.0, 34.0, 39.0, 52.0, 48.0, 44.0, 47.0, 41.0, 40.0, 34.0, 37.0, 31.0, 33.0, 36.0, 32.0, 18.0, 25.0, 20.0, 15.0, 17.0, 12.0, 13.0, 6.0, 7.0, 6.0, 6.0, 4.0, 4.0, 6.0, 2.0, 1.0, 0.0, 5.0], "bins": [-7.48046875, -7.2774658203125, -7.074462890625, -6.8714599609375, -6.66845703125, -6.4654541015625, -6.262451171875, -6.0594482421875, -5.8564453125, -5.6534423828125, -5.450439453125, -5.2474365234375, -5.04443359375, -4.8414306640625, -4.638427734375, -4.4354248046875, -4.232421875, -4.0294189453125, -3.826416015625, -3.6234130859375, -3.42041015625, -3.2174072265625, -3.014404296875, -2.8114013671875, -2.6083984375, -2.4053955078125, -2.202392578125, -1.9993896484375, -1.79638671875, -1.5933837890625, -1.390380859375, -1.1873779296875, -0.984375, -0.7813720703125, -0.578369140625, -0.3753662109375, -0.17236328125, 0.0306396484375, 0.233642578125, 0.4366455078125, 0.6396484375, 0.8426513671875, 1.045654296875, 1.2486572265625, 1.45166015625, 1.6546630859375, 1.857666015625, 2.0606689453125, 2.263671875, 2.4666748046875, 2.669677734375, 2.8726806640625, 3.07568359375, 3.2786865234375, 3.481689453125, 3.6846923828125, 3.8876953125, 4.0906982421875, 4.293701171875, 4.4967041015625, 4.69970703125, 4.9027099609375, 5.105712890625, 5.3087158203125, 5.51171875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 2.0, 6.0, 6.0, 25.0, 24.0, 33.0, 65.0, 62.0, 119.0, 186.0, 246.0, 371.0, 635.0, 848.0, 1303.0, 2130.0, 3310.0, 5220.0, 8614.0, 14124.0, 24186.0, 42488.0, 77162.0, 140210.0, 232712.0, 213107.0, 122195.0, 67094.0, 37190.0, 21456.0, 12674.0, 7682.0, 4643.0, 2939.0, 1820.0, 1265.0, 819.0, 507.0, 349.0, 220.0, 160.0, 113.0, 80.0, 52.0, 37.0, 29.0, 7.0, 10.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.150390625, -1.1131439208984375, -1.075897216796875, -1.0386505126953125, -1.00140380859375, -0.9641571044921875, -0.926910400390625, -0.8896636962890625, -0.8524169921875, -0.8151702880859375, -0.777923583984375, -0.7406768798828125, -0.70343017578125, -0.6661834716796875, -0.628936767578125, -0.5916900634765625, -0.554443359375, -0.5171966552734375, -0.479949951171875, -0.4427032470703125, -0.40545654296875, -0.3682098388671875, -0.330963134765625, -0.2937164306640625, -0.2564697265625, -0.2192230224609375, -0.181976318359375, -0.1447296142578125, -0.10748291015625, -0.0702362060546875, -0.032989501953125, 0.0042572021484375, 0.04150390625, 0.0787506103515625, 0.115997314453125, 0.1532440185546875, 0.19049072265625, 0.2277374267578125, 0.264984130859375, 0.3022308349609375, 0.3394775390625, 0.3767242431640625, 0.413970947265625, 0.4512176513671875, 0.48846435546875, 0.5257110595703125, 0.562957763671875, 0.6002044677734375, 0.637451171875, 0.6746978759765625, 0.711944580078125, 0.7491912841796875, 0.78643798828125, 0.8236846923828125, 0.860931396484375, 0.8981781005859375, 0.9354248046875, 0.9726715087890625, 1.009918212890625, 1.0471649169921875, 1.08441162109375, 1.1216583251953125, 1.158905029296875, 1.1961517333984375, 1.2333984375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 2.0, 7.0, 3.0, 5.0, 5.0, 10.0, 9.0, 16.0, 14.0, 16.0, 13.0, 19.0, 26.0, 24.0, 20.0, 30.0, 31.0, 29.0, 35.0, 26.0, 32.0, 39.0, 39.0, 34.0, 1057.0, 37.0, 40.0, 40.0, 32.0, 27.0, 30.0, 34.0, 25.0, 18.0, 21.0, 24.0, 22.0, 19.0, 23.0, 20.0, 18.0, 12.0, 11.0, 4.0, 4.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.626953125, -3.506256103515625, -3.38555908203125, -3.264862060546875, -3.1441650390625, -3.023468017578125, -2.90277099609375, -2.782073974609375, -2.661376953125, -2.540679931640625, -2.41998291015625, -2.299285888671875, -2.1785888671875, -2.057891845703125, -1.93719482421875, -1.816497802734375, -1.69580078125, -1.575103759765625, -1.45440673828125, -1.333709716796875, -1.2130126953125, -1.092315673828125, -0.97161865234375, -0.850921630859375, -0.730224609375, -0.609527587890625, -0.48883056640625, -0.368133544921875, -0.2474365234375, -0.126739501953125, -0.00604248046875, 0.114654541015625, 0.2353515625, 0.356048583984375, 0.47674560546875, 0.597442626953125, 0.7181396484375, 0.838836669921875, 0.95953369140625, 1.080230712890625, 1.200927734375, 1.321624755859375, 1.44232177734375, 1.563018798828125, 1.6837158203125, 1.804412841796875, 1.92510986328125, 2.045806884765625, 2.16650390625, 2.287200927734375, 2.40789794921875, 2.528594970703125, 2.6492919921875, 2.769989013671875, 2.89068603515625, 3.011383056640625, 3.132080078125, 3.252777099609375, 3.37347412109375, 3.494171142578125, 3.6148681640625, 3.735565185546875, 3.85626220703125, 3.976959228515625, 4.09765625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 8.0, 11.0, 11.0, 20.0, 27.0, 34.0, 56.0, 76.0, 101.0, 204.0, 271.0, 455.0, 733.0, 1111.0, 1890.0, 3352.0, 6129.0, 10973.0, 20779.0, 39234.0, 79302.0, 176744.0, 1143632.0, 360488.0, 126102.0, 58994.0, 30294.0, 15891.0, 8599.0, 4880.0, 2747.0, 1465.0, 935.0, 539.0, 353.0, 219.0, 129.0, 116.0, 63.0, 35.0, 32.0, 25.0, 20.0, 12.0, 6.0, 12.0, 6.0, 5.0, 7.0, 1.0, 0.0, 2.0], "bins": [-0.65234375, -0.6335983276367188, -0.6148529052734375, -0.5961074829101562, -0.577362060546875, -0.5586166381835938, -0.5398712158203125, -0.5211257934570312, -0.50238037109375, -0.48363494873046875, -0.4648895263671875, -0.44614410400390625, -0.427398681640625, -0.40865325927734375, -0.3899078369140625, -0.37116241455078125, -0.3524169921875, -0.33367156982421875, -0.3149261474609375, -0.29618072509765625, -0.277435302734375, -0.25868988037109375, -0.2399444580078125, -0.22119903564453125, -0.20245361328125, -0.18370819091796875, -0.1649627685546875, -0.14621734619140625, -0.127471923828125, -0.10872650146484375, -0.0899810791015625, -0.07123565673828125, -0.052490234375, -0.03374481201171875, -0.0149993896484375, 0.00374603271484375, 0.022491455078125, 0.04123687744140625, 0.0599822998046875, 0.07872772216796875, 0.09747314453125, 0.11621856689453125, 0.1349639892578125, 0.15370941162109375, 0.172454833984375, 0.19120025634765625, 0.2099456787109375, 0.22869110107421875, 0.2474365234375, 0.26618194580078125, 0.2849273681640625, 0.30367279052734375, 0.322418212890625, 0.34116363525390625, 0.3599090576171875, 0.37865447998046875, 0.39739990234375, 0.41614532470703125, 0.4348907470703125, 0.45363616943359375, 0.472381591796875, 0.49112701416015625, 0.5098724365234375, 0.5286178588867188, 0.54736328125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 5.0, 3.0, 13.0, 6.0, 15.0, 4.0, 16.0, 15.0, 16.0, 26.0, 24.0, 46.0, 50.0, 80.0, 138.0, 170.0, 80.0, 63.0, 48.0, 25.0, 26.0, 18.0, 19.0, 14.0, 14.0, 14.0, 4.0, 3.0, 9.0, 5.0, 3.0, 3.0, 1.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.267822265625, -0.2599773406982422, -0.2521324157714844, -0.24428749084472656, -0.23644256591796875, -0.22859764099121094, -0.22075271606445312, -0.2129077911376953, -0.2050628662109375, -0.1972179412841797, -0.18937301635742188, -0.18152809143066406, -0.17368316650390625, -0.16583824157714844, -0.15799331665039062, -0.1501483917236328, -0.142303466796875, -0.1344585418701172, -0.12661361694335938, -0.11876869201660156, -0.11092376708984375, -0.10307884216308594, -0.09523391723632812, -0.08738899230957031, -0.0795440673828125, -0.07169914245605469, -0.06385421752929688, -0.05600929260253906, -0.04816436767578125, -0.04031944274902344, -0.032474517822265625, -0.024629592895507812, -0.01678466796875, -0.008939743041992188, -0.001094818115234375, 0.0067501068115234375, 0.01459503173828125, 0.022439956665039062, 0.030284881591796875, 0.03812980651855469, 0.0459747314453125, 0.05381965637207031, 0.061664581298828125, 0.06950950622558594, 0.07735443115234375, 0.08519935607910156, 0.09304428100585938, 0.10088920593261719, 0.108734130859375, 0.11657905578613281, 0.12442398071289062, 0.13226890563964844, 0.14011383056640625, 0.14795875549316406, 0.15580368041992188, 0.1636486053466797, 0.1714935302734375, 0.1793384552001953, 0.18718338012695312, 0.19502830505371094, 0.20287322998046875, 0.21071815490722656, 0.21856307983398438, 0.2264080047607422, 0.2342529296875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 2.0, 4.0, 7.0, 9.0, 7.0, 5.0, 17.0, 27.0, 31.0, 36.0, 52.0, 81.0, 94.0, 194.0, 425.0, 3604.0, 948206.0, 93417.0, 1493.0, 319.0, 177.0, 99.0, 64.0, 36.0, 34.0, 26.0, 10.0, 17.0, 10.0, 12.0, 4.0, 6.0, 3.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.4765625, -4.32659912109375, -4.1766357421875, -4.02667236328125, -3.876708984375, -3.72674560546875, -3.5767822265625, -3.42681884765625, -3.27685546875, -3.12689208984375, -2.9769287109375, -2.82696533203125, -2.677001953125, -2.52703857421875, -2.3770751953125, -2.22711181640625, -2.0771484375, -1.92718505859375, -1.7772216796875, -1.62725830078125, -1.477294921875, -1.32733154296875, -1.1773681640625, -1.02740478515625, -0.87744140625, -0.72747802734375, -0.5775146484375, -0.42755126953125, -0.277587890625, -0.12762451171875, 0.0223388671875, 0.17230224609375, 0.322265625, 0.47222900390625, 0.6221923828125, 0.77215576171875, 0.922119140625, 1.07208251953125, 1.2220458984375, 1.37200927734375, 1.52197265625, 1.67193603515625, 1.8218994140625, 1.97186279296875, 2.121826171875, 2.27178955078125, 2.4217529296875, 2.57171630859375, 2.7216796875, 2.87164306640625, 3.0216064453125, 3.17156982421875, 3.321533203125, 3.47149658203125, 3.6214599609375, 3.77142333984375, 3.92138671875, 4.07135009765625, 4.2213134765625, 4.37127685546875, 4.521240234375, 4.67120361328125, 4.8211669921875, 4.97113037109375, 5.12109375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 7.0, 8.0, 19.0, 26.0, 59.0, 90.0, 237.0, 310.0, 116.0, 60.0, 32.0, 20.0, 9.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3423917293548584, -1.3018056154251099, -1.2612195014953613, -1.2206332683563232, -1.1800471544265747, -1.1394610404968262, -1.0988749265670776, -1.058288812637329, -1.017702579498291, -0.9771164655685425, -0.9365302920341492, -0.8959441781044006, -0.8553580045700073, -0.8147718906402588, -0.7741857767105103, -0.7335996627807617, -0.6930135488510132, -0.6524274349212646, -0.6118412613868713, -0.5712551474571228, -0.5306689739227295, -0.49008285999298096, -0.4494967460632324, -0.4089106023311615, -0.3683244585990906, -0.32773831486701965, -0.28715217113494873, -0.2465660572052002, -0.20597991347312927, -0.16539376974105835, -0.12480764091014862, -0.08422151207923889, -0.04363536834716797, -0.003049232065677643, 0.03753690421581268, 0.07812304049730301, 0.11870917677879333, 0.15929532051086426, 0.199881449341774, 0.24046757817268372, 0.28105372190475464, 0.32163986563682556, 0.3622260093688965, 0.402812123298645, 0.44339826703071594, 0.48398441076278687, 0.5245705246925354, 0.5651566982269287, 0.6057428121566772, 0.6463289260864258, 0.6869150996208191, 0.7275012135505676, 0.7680873870849609, 0.8086735010147095, 0.849259614944458, 0.8898457288742065, 0.9304319024085999, 0.9710180163383484, 1.0116041898727417, 1.0521903038024902, 1.0927764177322388, 1.1333625316619873, 1.1739487648010254, 1.214534878730774, 1.2551209926605225]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 8.0, 7.0, 1.0, 4.0, 3.0, 3.0, 11.0, 9.0, 20.0, 19.0, 19.0, 22.0, 10.0, 22.0, 28.0, 20.0, 27.0, 44.0, 27.0, 35.0, 38.0, 50.0, 48.0, 48.0, 31.0, 40.0, 33.0, 49.0, 38.0, 31.0, 45.0, 20.0, 27.0, 16.0, 21.0, 23.0, 23.0, 20.0, 13.0, 11.0, 10.0, 7.0, 5.0, 8.0, 5.0, 5.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0], "bins": [-0.7208524346351624, -0.7001281976699829, -0.6794039607048035, -0.658679723739624, -0.6379554867744446, -0.6172312498092651, -0.5965070128440857, -0.5757827758789062, -0.5550585389137268, -0.5343343019485474, -0.5136100649833679, -0.4928858280181885, -0.47216159105300903, -0.4514373540878296, -0.43071311712265015, -0.4099888801574707, -0.38926464319229126, -0.3685404062271118, -0.3478161692619324, -0.32709193229675293, -0.3063676953315735, -0.28564345836639404, -0.2649192214012146, -0.24419498443603516, -0.2234707474708557, -0.20274651050567627, -0.18202227354049683, -0.16129803657531738, -0.14057379961013794, -0.1198495626449585, -0.09912532567977905, -0.07840108871459961, -0.057676851749420166, -0.03695261478424072, -0.01622837781906128, 0.004495859146118164, 0.025220096111297607, 0.04594433307647705, 0.0666685700416565, 0.08739280700683594, 0.10811704397201538, 0.12884128093719482, 0.14956551790237427, 0.1702897548675537, 0.19101399183273315, 0.2117382287979126, 0.23246246576309204, 0.2531867027282715, 0.2739109396934509, 0.29463517665863037, 0.3153594136238098, 0.33608365058898926, 0.3568078875541687, 0.37753212451934814, 0.3982563614845276, 0.41898059844970703, 0.4397048354148865, 0.4604290723800659, 0.48115330934524536, 0.5018775463104248, 0.5226017832756042, 0.5433260202407837, 0.5640502572059631, 0.5847744941711426, 0.605498731136322]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 10.0, 7.0, 10.0, 13.0, 11.0, 10.0, 13.0, 18.0, 22.0, 29.0, 37.0, 34.0, 30.0, 35.0, 35.0, 41.0, 55.0, 45.0, 44.0, 47.0, 41.0, 40.0, 35.0, 39.0, 28.0, 35.0, 35.0, 33.0, 17.0, 27.0, 17.0, 16.0, 17.0, 10.0, 14.0, 7.0, 6.0, 7.0, 5.0, 4.0, 4.0, 7.0, 1.0, 1.0, 1.0, 4.0], "bins": [-7.50390625, -7.30023193359375, -7.0965576171875, -6.89288330078125, -6.689208984375, -6.48553466796875, -6.2818603515625, -6.07818603515625, -5.87451171875, -5.67083740234375, -5.4671630859375, -5.26348876953125, -5.059814453125, -4.85614013671875, -4.6524658203125, -4.44879150390625, -4.2451171875, -4.04144287109375, -3.8377685546875, -3.63409423828125, -3.430419921875, -3.22674560546875, -3.0230712890625, -2.81939697265625, -2.61572265625, -2.41204833984375, -2.2083740234375, -2.00469970703125, -1.801025390625, -1.59735107421875, -1.3936767578125, -1.19000244140625, -0.986328125, -0.78265380859375, -0.5789794921875, -0.37530517578125, -0.171630859375, 0.03204345703125, 0.2357177734375, 0.43939208984375, 0.64306640625, 0.84674072265625, 1.0504150390625, 1.25408935546875, 1.457763671875, 1.66143798828125, 1.8651123046875, 2.06878662109375, 2.2724609375, 2.47613525390625, 2.6798095703125, 2.88348388671875, 3.087158203125, 3.29083251953125, 3.4945068359375, 3.69818115234375, 3.90185546875, 4.10552978515625, 4.3092041015625, 4.51287841796875, 4.716552734375, 4.92022705078125, 5.1239013671875, 5.32757568359375, 5.53125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 12.0, 9.0, 10.0, 19.0, 16.0, 21.0, 40.0, 56.0, 66.0, 98.0, 148.0, 191.0, 258.0, 352.0, 500.0, 627.0, 924.0, 1297.0, 1945.0, 2902.0, 4716.0, 7849.0, 16736.0, 49871.0, 231793.0, 527118.0, 135576.0, 33800.0, 12692.0, 6528.0, 3917.0, 2574.0, 1710.0, 1185.0, 823.0, 614.0, 396.0, 312.0, 256.0, 143.0, 115.0, 75.0, 65.0, 47.0, 41.0, 30.0, 26.0, 16.0, 18.0, 11.0, 6.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-8.5234375, -8.25146484375, -7.9794921875, -7.70751953125, -7.435546875, -7.16357421875, -6.8916015625, -6.61962890625, -6.34765625, -6.07568359375, -5.8037109375, -5.53173828125, -5.259765625, -4.98779296875, -4.7158203125, -4.44384765625, -4.171875, -3.89990234375, -3.6279296875, -3.35595703125, -3.083984375, -2.81201171875, -2.5400390625, -2.26806640625, -1.99609375, -1.72412109375, -1.4521484375, -1.18017578125, -0.908203125, -0.63623046875, -0.3642578125, -0.09228515625, 0.1796875, 0.45166015625, 0.7236328125, 0.99560546875, 1.267578125, 1.53955078125, 1.8115234375, 2.08349609375, 2.35546875, 2.62744140625, 2.8994140625, 3.17138671875, 3.443359375, 3.71533203125, 3.9873046875, 4.25927734375, 4.53125, 4.80322265625, 5.0751953125, 5.34716796875, 5.619140625, 5.89111328125, 6.1630859375, 6.43505859375, 6.70703125, 6.97900390625, 7.2509765625, 7.52294921875, 7.794921875, 8.06689453125, 8.3388671875, 8.61083984375, 8.8828125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 0.0, 5.0, 5.0, 2.0, 12.0, 11.0, 7.0, 10.0, 15.0, 14.0, 24.0, 13.0, 22.0, 24.0, 30.0, 30.0, 36.0, 35.0, 37.0, 47.0, 45.0, 87.0, 225.0, 1492.0, 271.0, 91.0, 48.0, 51.0, 37.0, 32.0, 39.0, 34.0, 37.0, 22.0, 19.0, 15.0, 24.0, 15.0, 15.0, 10.0, 12.0, 11.0, 15.0, 5.0, 8.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.9375, -17.331298828125, -16.72509765625, -16.118896484375, -15.5126953125, -14.906494140625, -14.30029296875, -13.694091796875, -13.087890625, -12.481689453125, -11.87548828125, -11.269287109375, -10.6630859375, -10.056884765625, -9.45068359375, -8.844482421875, -8.23828125, -7.632080078125, -7.02587890625, -6.419677734375, -5.8134765625, -5.207275390625, -4.60107421875, -3.994873046875, -3.388671875, -2.782470703125, -2.17626953125, -1.570068359375, -0.9638671875, -0.357666015625, 0.24853515625, 0.854736328125, 1.4609375, 2.067138671875, 2.67333984375, 3.279541015625, 3.8857421875, 4.491943359375, 5.09814453125, 5.704345703125, 6.310546875, 6.916748046875, 7.52294921875, 8.129150390625, 8.7353515625, 9.341552734375, 9.94775390625, 10.553955078125, 11.16015625, 11.766357421875, 12.37255859375, 12.978759765625, 13.5849609375, 14.191162109375, 14.79736328125, 15.403564453125, 16.009765625, 16.615966796875, 17.22216796875, 17.828369140625, 18.4345703125, 19.040771484375, 19.64697265625, 20.253173828125, 20.859375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 4.0, 4.0, 5.0, 6.0, 4.0, 13.0, 11.0, 14.0, 10.0, 15.0, 21.0, 19.0, 25.0, 33.0, 41.0, 59.0, 103.0, 115.0, 185.0, 288.0, 517.0, 1079.0, 3037.0, 14597.0, 434921.0, 2652179.0, 30305.0, 4885.0, 1446.0, 681.0, 368.0, 208.0, 110.0, 102.0, 56.0, 59.0, 34.0, 30.0, 30.0, 18.0, 16.0, 7.0, 8.0, 10.0, 14.0, 3.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-39.34375, -38.1923828125, -37.041015625, -35.8896484375, -34.73828125, -33.5869140625, -32.435546875, -31.2841796875, -30.1328125, -28.9814453125, -27.830078125, -26.6787109375, -25.52734375, -24.3759765625, -23.224609375, -22.0732421875, -20.921875, -19.7705078125, -18.619140625, -17.4677734375, -16.31640625, -15.1650390625, -14.013671875, -12.8623046875, -11.7109375, -10.5595703125, -9.408203125, -8.2568359375, -7.10546875, -5.9541015625, -4.802734375, -3.6513671875, -2.5, -1.3486328125, -0.197265625, 0.9541015625, 2.10546875, 3.2568359375, 4.408203125, 5.5595703125, 6.7109375, 7.8623046875, 9.013671875, 10.1650390625, 11.31640625, 12.4677734375, 13.619140625, 14.7705078125, 15.921875, 17.0732421875, 18.224609375, 19.3759765625, 20.52734375, 21.6787109375, 22.830078125, 23.9814453125, 25.1328125, 26.2841796875, 27.435546875, 28.5869140625, 29.73828125, 30.8896484375, 32.041015625, 33.1923828125, 34.34375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 793.0, 217.0, 2.0], "bins": [-854.281005859375, -840.447265625, -826.6135864257812, -812.7798461914062, -798.9461669921875, -785.1124267578125, -771.2787475585938, -757.4450073242188, -743.611328125, -729.777587890625, -715.9439086914062, -702.1101684570312, -688.2764892578125, -674.4427490234375, -660.6090698242188, -646.7753295898438, -632.9415893554688, -619.1078491210938, -605.274169921875, -591.4404296875, -577.6067504882812, -563.7730102539062, -549.9393310546875, -536.1055908203125, -522.2718505859375, -508.4381408691406, -494.60443115234375, -480.7707214355469, -466.93701171875, -453.103271484375, -439.2695617675781, -425.43585205078125, -411.6021423339844, -397.7684326171875, -383.9347229003906, -370.10101318359375, -356.26727294921875, -342.43359375, -328.599853515625, -314.7661437988281, -300.93243408203125, -287.0987243652344, -273.2650146484375, -259.4313049316406, -245.5975799560547, -231.7638702392578, -217.93014526367188, -204.096435546875, -190.2627410888672, -176.4290313720703, -162.59530639648438, -148.7615966796875, -134.92788696289062, -121.09417724609375, -107.26045989990234, -93.42674255371094, -79.59302520751953, -65.75930786132812, -51.92559814453125, -38.09188461303711, -24.25817108154297, -10.424461364746094, 3.4092559814453125, 17.24297332763672, 31.07668113708496]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 8.0, 3.0, 9.0, 8.0, 14.0, 19.0, 15.0, 15.0, 17.0, 17.0, 28.0, 19.0, 26.0, 40.0, 33.0, 37.0, 33.0, 42.0, 47.0, 47.0, 31.0, 45.0, 24.0, 19.0, 42.0, 25.0, 38.0, 34.0, 28.0, 30.0, 26.0, 20.0, 25.0, 14.0, 23.0, 13.0, 9.0, 10.0, 6.0, 11.0, 14.0, 8.0, 4.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-47.142913818359375, -45.61171340942383, -44.08051300048828, -42.549312591552734, -41.01811218261719, -39.48691177368164, -37.955711364746094, -36.42450714111328, -34.893310546875, -33.36211013793945, -31.830909729003906, -30.29970932006836, -28.768508911132812, -27.237308502197266, -25.706106185913086, -24.17490577697754, -22.64370346069336, -21.112503051757812, -19.581302642822266, -18.05010223388672, -16.518901824951172, -14.987700462341309, -13.456499099731445, -11.925298690795898, -10.394098281860352, -8.862897872924805, -7.3316969871521, -5.8004961013793945, -4.269295692443848, -2.738095283508301, -1.2068939208984375, 0.3243064880371094, 1.8555068969726562, 3.3867075443267822, 4.917908191680908, 6.449109077453613, 7.98030948638916, 9.511509895324707, 11.04271125793457, 12.573911666870117, 14.105112075805664, 15.636312484741211, 17.167512893676758, 18.698715209960938, 20.229915618896484, 21.76111602783203, 23.292316436767578, 24.823516845703125, 26.354717254638672, 27.88591766357422, 29.417118072509766, 30.948318481445312, 32.47951889038086, 34.010719299316406, 35.54192352294922, 37.0731201171875, 38.60432434082031, 40.13552474975586, 41.666725158691406, 43.19792556762695, 44.7291259765625, 46.26032638549805, 47.791526794433594, 49.322731018066406, 50.85392761230469]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 2.0, 4.0, 15.0, 8.0, 10.0, 6.0, 10.0, 12.0, 10.0, 20.0, 29.0, 25.0, 30.0, 36.0, 32.0, 27.0, 37.0, 37.0, 37.0, 65.0, 54.0, 63.0, 30.0, 43.0, 33.0, 34.0, 40.0, 34.0, 35.0, 20.0, 29.0, 26.0, 13.0, 14.0, 15.0, 15.0, 11.0, 7.0, 8.0, 5.0, 4.0, 8.0, 1.0, 6.0, 2.0, 0.0, 1.0, 2.0], "bins": [-7.80859375, -7.5965576171875, -7.384521484375, -7.1724853515625, -6.96044921875, -6.7484130859375, -6.536376953125, -6.3243408203125, -6.1123046875, -5.9002685546875, -5.688232421875, -5.4761962890625, -5.26416015625, -5.0521240234375, -4.840087890625, -4.6280517578125, -4.416015625, -4.2039794921875, -3.991943359375, -3.7799072265625, -3.56787109375, -3.3558349609375, -3.143798828125, -2.9317626953125, -2.7197265625, -2.5076904296875, -2.295654296875, -2.0836181640625, -1.87158203125, -1.6595458984375, -1.447509765625, -1.2354736328125, -1.0234375, -0.8114013671875, -0.599365234375, -0.3873291015625, -0.17529296875, 0.0367431640625, 0.248779296875, 0.4608154296875, 0.6728515625, 0.8848876953125, 1.096923828125, 1.3089599609375, 1.52099609375, 1.7330322265625, 1.945068359375, 2.1571044921875, 2.369140625, 2.5811767578125, 2.793212890625, 3.0052490234375, 3.21728515625, 3.4293212890625, 3.641357421875, 3.8533935546875, 4.0654296875, 4.2774658203125, 4.489501953125, 4.7015380859375, 4.91357421875, 5.1256103515625, 5.337646484375, 5.5496826171875, 5.76171875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 8.0, 5.0, 14.0, 12.0, 26.0, 44.0, 47.0, 85.0, 114.0, 189.0, 276.0, 559.0, 970.0, 1831.0, 3765.0, 8287.0, 20583.0, 64948.0, 556522.0, 3144163.0, 311988.0, 49479.0, 16786.0, 6747.0, 3196.0, 1577.0, 837.0, 474.0, 267.0, 161.0, 105.0, 57.0, 53.0, 29.0, 22.0, 16.0, 12.0, 6.0, 7.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.890625, -25.115478515625, -24.34033203125, -23.565185546875, -22.7900390625, -22.014892578125, -21.23974609375, -20.464599609375, -19.689453125, -18.914306640625, -18.13916015625, -17.364013671875, -16.5888671875, -15.813720703125, -15.03857421875, -14.263427734375, -13.48828125, -12.713134765625, -11.93798828125, -11.162841796875, -10.3876953125, -9.612548828125, -8.83740234375, -8.062255859375, -7.287109375, -6.511962890625, -5.73681640625, -4.961669921875, -4.1865234375, -3.411376953125, -2.63623046875, -1.861083984375, -1.0859375, -0.310791015625, 0.46435546875, 1.239501953125, 2.0146484375, 2.789794921875, 3.56494140625, 4.340087890625, 5.115234375, 5.890380859375, 6.66552734375, 7.440673828125, 8.2158203125, 8.990966796875, 9.76611328125, 10.541259765625, 11.31640625, 12.091552734375, 12.86669921875, 13.641845703125, 14.4169921875, 15.192138671875, 15.96728515625, 16.742431640625, 17.517578125, 18.292724609375, 19.06787109375, 19.843017578125, 20.6181640625, 21.393310546875, 22.16845703125, 22.943603515625, 23.71875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 1.0, 3.0, 13.0, 8.0, 19.0, 26.0, 38.0, 73.0, 79.0, 140.0, 240.0, 426.0, 718.0, 856.0, 604.0, 322.0, 198.0, 126.0, 56.0, 42.0, 29.0, 19.0, 12.0, 12.0, 5.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.234375, -20.426025390625, -19.61767578125, -18.809326171875, -18.0009765625, -17.192626953125, -16.38427734375, -15.575927734375, -14.767578125, -13.959228515625, -13.15087890625, -12.342529296875, -11.5341796875, -10.725830078125, -9.91748046875, -9.109130859375, -8.30078125, -7.492431640625, -6.68408203125, -5.875732421875, -5.0673828125, -4.259033203125, -3.45068359375, -2.642333984375, -1.833984375, -1.025634765625, -0.21728515625, 0.591064453125, 1.3994140625, 2.207763671875, 3.01611328125, 3.824462890625, 4.6328125, 5.441162109375, 6.24951171875, 7.057861328125, 7.8662109375, 8.674560546875, 9.48291015625, 10.291259765625, 11.099609375, 11.907958984375, 12.71630859375, 13.524658203125, 14.3330078125, 15.141357421875, 15.94970703125, 16.758056640625, 17.56640625, 18.374755859375, 19.18310546875, 19.991455078125, 20.7998046875, 21.608154296875, 22.41650390625, 23.224853515625, 24.033203125, 24.841552734375, 25.64990234375, 26.458251953125, 27.2666015625, 28.074951171875, 28.88330078125, 29.691650390625, 30.5]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 7.0, 16.0, 17.0, 36.0, 54.0, 114.0, 168.0, 381.0, 981.0, 2916.0, 11145.0, 60151.0, 947518.0, 3013689.0, 130292.0, 19545.0, 4642.0, 1500.0, 534.0, 237.0, 140.0, 63.0, 55.0, 23.0, 21.0, 10.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.625, -55.06005859375, -53.4951171875, -51.93017578125, -50.365234375, -48.80029296875, -47.2353515625, -45.67041015625, -44.10546875, -42.54052734375, -40.9755859375, -39.41064453125, -37.845703125, -36.28076171875, -34.7158203125, -33.15087890625, -31.5859375, -30.02099609375, -28.4560546875, -26.89111328125, -25.326171875, -23.76123046875, -22.1962890625, -20.63134765625, -19.06640625, -17.50146484375, -15.9365234375, -14.37158203125, -12.806640625, -11.24169921875, -9.6767578125, -8.11181640625, -6.546875, -4.98193359375, -3.4169921875, -1.85205078125, -0.287109375, 1.27783203125, 2.8427734375, 4.40771484375, 5.97265625, 7.53759765625, 9.1025390625, 10.66748046875, 12.232421875, 13.79736328125, 15.3623046875, 16.92724609375, 18.4921875, 20.05712890625, 21.6220703125, 23.18701171875, 24.751953125, 26.31689453125, 27.8818359375, 29.44677734375, 31.01171875, 32.57666015625, 34.1416015625, 35.70654296875, 37.271484375, 38.83642578125, 40.4013671875, 41.96630859375, 43.53125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 5.0, 7.0, 13.0, 13.0, 19.0, 21.0, 33.0, 39.0, 57.0, 61.0, 61.0, 85.0, 83.0, 77.0, 88.0, 64.0, 79.0, 45.0, 38.0, 33.0, 16.0, 26.0, 16.0, 10.0, 7.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-98.3864974975586, -95.80854797363281, -93.23059844970703, -90.65264892578125, -88.07469940185547, -85.49674987792969, -82.9188003540039, -80.34085083007812, -77.76290130615234, -75.18495178222656, -72.60700225830078, -70.029052734375, -67.45110321044922, -64.87315368652344, -62.295204162597656, -59.717254638671875, -57.139305114746094, -54.56135559082031, -51.98340606689453, -49.40545654296875, -46.82750701904297, -44.24955749511719, -41.671607971191406, -39.093658447265625, -36.515708923339844, -33.93775939941406, -31.35980987548828, -28.7818603515625, -26.20391082763672, -23.625961303710938, -21.048011779785156, -18.470062255859375, -15.892112731933594, -13.314163208007812, -10.736213684082031, -8.15826416015625, -5.580314636230469, -3.0023651123046875, -0.42441558837890625, 2.153533935546875, 4.731483459472656, 7.3094329833984375, 9.887382507324219, 12.46533203125, 15.043281555175781, 17.621231079101562, 20.199180603027344, 22.777130126953125, 25.355079650878906, 27.933029174804688, 30.51097869873047, 33.08892822265625, 35.66687774658203, 38.24482727050781, 40.822776794433594, 43.400726318359375, 45.978675842285156, 48.55662536621094, 51.13457489013672, 53.7125244140625, 56.29047393798828, 58.86842346191406, 61.446372985839844, 64.02432250976562, 66.6022720336914]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 8.0, 3.0, 7.0, 10.0, 13.0, 9.0, 11.0, 10.0, 14.0, 11.0, 20.0, 19.0, 22.0, 33.0, 31.0, 30.0, 37.0, 37.0, 37.0, 29.0, 41.0, 47.0, 38.0, 45.0, 34.0, 27.0, 34.0, 36.0, 42.0, 21.0, 33.0, 26.0, 23.0, 20.0, 24.0, 15.0, 20.0, 19.0, 12.0, 9.0, 14.0, 12.0, 7.0, 4.0, 1.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.45613098144531, -48.80888366699219, -47.16163635253906, -45.51438903808594, -43.86714172363281, -42.21989440917969, -40.57264709472656, -38.92539978027344, -37.27815246582031, -35.63090515136719, -33.98365783691406, -32.33641052246094, -30.689163208007812, -29.041915893554688, -27.39466667175293, -25.747419357299805, -24.100170135498047, -22.452922821044922, -20.805675506591797, -19.158428192138672, -17.511180877685547, -15.863932609558105, -14.216684341430664, -12.569437026977539, -10.922189712524414, -9.274942398071289, -7.627694606781006, -5.980446815490723, -4.333199501037598, -2.6859521865844727, -1.0387039184570312, 0.6085433959960938, 2.2557907104492188, 3.903038263320923, 5.550285816192627, 7.19753360748291, 8.844780921936035, 10.49202823638916, 12.139276504516602, 13.786523818969727, 15.433771133422852, 17.081018447875977, 18.7282657623291, 20.37551498413086, 22.022762298583984, 23.67000961303711, 25.317256927490234, 26.96450424194336, 28.611751556396484, 30.25899887084961, 31.906246185302734, 33.55349349975586, 35.200740814208984, 36.84798812866211, 38.4952392578125, 40.142486572265625, 41.78973388671875, 43.436981201171875, 45.084228515625, 46.731475830078125, 48.37872314453125, 50.025970458984375, 51.6732177734375, 53.320465087890625, 54.96771240234375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 9.0, 3.0, 3.0, 9.0, 11.0, 7.0, 12.0, 8.0, 12.0, 9.0, 15.0, 20.0, 20.0, 32.0, 24.0, 26.0, 33.0, 41.0, 41.0, 49.0, 38.0, 45.0, 48.0, 33.0, 47.0, 39.0, 40.0, 41.0, 29.0, 24.0, 34.0, 33.0, 27.0, 26.0, 21.0, 15.0, 15.0, 10.0, 10.0, 10.0, 7.0, 6.0, 7.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0], "bins": [-7.6953125, -7.48626708984375, -7.2772216796875, -7.06817626953125, -6.859130859375, -6.65008544921875, -6.4410400390625, -6.23199462890625, -6.02294921875, -5.81390380859375, -5.6048583984375, -5.39581298828125, -5.186767578125, -4.97772216796875, -4.7686767578125, -4.55963134765625, -4.3505859375, -4.14154052734375, -3.9324951171875, -3.72344970703125, -3.514404296875, -3.30535888671875, -3.0963134765625, -2.88726806640625, -2.67822265625, -2.46917724609375, -2.2601318359375, -2.05108642578125, -1.842041015625, -1.63299560546875, -1.4239501953125, -1.21490478515625, -1.005859375, -0.79681396484375, -0.5877685546875, -0.37872314453125, -0.169677734375, 0.03936767578125, 0.2484130859375, 0.45745849609375, 0.66650390625, 0.87554931640625, 1.0845947265625, 1.29364013671875, 1.502685546875, 1.71173095703125, 1.9207763671875, 2.12982177734375, 2.3388671875, 2.54791259765625, 2.7569580078125, 2.96600341796875, 3.175048828125, 3.38409423828125, 3.5931396484375, 3.80218505859375, 4.01123046875, 4.22027587890625, 4.4293212890625, 4.63836669921875, 4.847412109375, 5.05645751953125, 5.2655029296875, 5.47454833984375, 5.68359375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 8.0, 14.0, 16.0, 19.0, 40.0, 60.0, 80.0, 134.0, 201.0, 368.0, 569.0, 917.0, 1605.0, 2521.0, 4078.0, 6978.0, 12025.0, 21066.0, 38319.0, 72346.0, 139654.0, 247485.0, 229488.0, 124483.0, 65094.0, 34856.0, 19083.0, 10968.0, 6290.0, 3803.0, 2325.0, 1439.0, 849.0, 496.0, 338.0, 202.0, 121.0, 74.0, 56.0, 28.0, 12.0, 11.0, 14.0, 6.0, 7.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.140625, -1.103729248046875, -1.06683349609375, -1.029937744140625, -0.9930419921875, -0.956146240234375, -0.91925048828125, -0.882354736328125, -0.845458984375, -0.808563232421875, -0.77166748046875, -0.734771728515625, -0.6978759765625, -0.660980224609375, -0.62408447265625, -0.587188720703125, -0.55029296875, -0.513397216796875, -0.47650146484375, -0.439605712890625, -0.4027099609375, -0.365814208984375, -0.32891845703125, -0.292022705078125, -0.255126953125, -0.218231201171875, -0.18133544921875, -0.144439697265625, -0.1075439453125, -0.070648193359375, -0.03375244140625, 0.003143310546875, 0.0400390625, 0.076934814453125, 0.11383056640625, 0.150726318359375, 0.1876220703125, 0.224517822265625, 0.26141357421875, 0.298309326171875, 0.335205078125, 0.372100830078125, 0.40899658203125, 0.445892333984375, 0.4827880859375, 0.519683837890625, 0.55657958984375, 0.593475341796875, 0.63037109375, 0.667266845703125, 0.70416259765625, 0.741058349609375, 0.7779541015625, 0.814849853515625, 0.85174560546875, 0.888641357421875, 0.925537109375, 0.962432861328125, 0.99932861328125, 1.036224365234375, 1.0731201171875, 1.110015869140625, 1.14691162109375, 1.183807373046875, 1.220703125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 5.0, 9.0, 10.0, 6.0, 21.0, 19.0, 18.0, 22.0, 27.0, 16.0, 21.0, 25.0, 26.0, 20.0, 47.0, 48.0, 34.0, 43.0, 42.0, 1066.0, 44.0, 36.0, 31.0, 25.0, 47.0, 44.0, 30.0, 26.0, 31.0, 24.0, 24.0, 18.0, 17.0, 19.0, 16.0, 11.0, 7.0, 7.0, 5.0, 3.0, 9.0, 3.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.37890625, -4.24139404296875, -4.1038818359375, -3.96636962890625, -3.828857421875, -3.69134521484375, -3.5538330078125, -3.41632080078125, -3.27880859375, -3.14129638671875, -3.0037841796875, -2.86627197265625, -2.728759765625, -2.59124755859375, -2.4537353515625, -2.31622314453125, -2.1787109375, -2.04119873046875, -1.9036865234375, -1.76617431640625, -1.628662109375, -1.49114990234375, -1.3536376953125, -1.21612548828125, -1.07861328125, -0.94110107421875, -0.8035888671875, -0.66607666015625, -0.528564453125, -0.39105224609375, -0.2535400390625, -0.11602783203125, 0.021484375, 0.15899658203125, 0.2965087890625, 0.43402099609375, 0.571533203125, 0.70904541015625, 0.8465576171875, 0.98406982421875, 1.12158203125, 1.25909423828125, 1.3966064453125, 1.53411865234375, 1.671630859375, 1.80914306640625, 1.9466552734375, 2.08416748046875, 2.2216796875, 2.35919189453125, 2.4967041015625, 2.63421630859375, 2.771728515625, 2.90924072265625, 3.0467529296875, 3.18426513671875, 3.32177734375, 3.45928955078125, 3.5968017578125, 3.73431396484375, 3.871826171875, 4.00933837890625, 4.1468505859375, 4.28436279296875, 4.421875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 11.0, 17.0, 19.0, 33.0, 55.0, 60.0, 113.0, 163.0, 210.0, 312.0, 432.0, 629.0, 1027.0, 1663.0, 2398.0, 3921.0, 6175.0, 9613.0, 15854.0, 25496.0, 42040.0, 70857.0, 120373.0, 287802.0, 1138285.0, 149152.0, 86457.0, 51826.0, 30916.0, 19062.0, 11650.0, 7396.0, 4564.0, 2889.0, 1919.0, 1232.0, 817.0, 564.0, 367.0, 247.0, 180.0, 97.0, 74.0, 44.0, 36.0, 24.0, 21.0, 18.0, 6.0, 4.0, 3.0, 5.0, 1.0, 2.0], "bins": [-0.4111328125, -0.39910888671875, -0.3870849609375, -0.37506103515625, -0.363037109375, -0.35101318359375, -0.3389892578125, -0.32696533203125, -0.31494140625, -0.30291748046875, -0.2908935546875, -0.27886962890625, -0.266845703125, -0.25482177734375, -0.2427978515625, -0.23077392578125, -0.21875, -0.20672607421875, -0.1947021484375, -0.18267822265625, -0.170654296875, -0.15863037109375, -0.1466064453125, -0.13458251953125, -0.12255859375, -0.11053466796875, -0.0985107421875, -0.08648681640625, -0.074462890625, -0.06243896484375, -0.0504150390625, -0.03839111328125, -0.0263671875, -0.01434326171875, -0.0023193359375, 0.00970458984375, 0.021728515625, 0.03375244140625, 0.0457763671875, 0.05780029296875, 0.06982421875, 0.08184814453125, 0.0938720703125, 0.10589599609375, 0.117919921875, 0.12994384765625, 0.1419677734375, 0.15399169921875, 0.166015625, 0.17803955078125, 0.1900634765625, 0.20208740234375, 0.214111328125, 0.22613525390625, 0.2381591796875, 0.25018310546875, 0.26220703125, 0.27423095703125, 0.2862548828125, 0.29827880859375, 0.310302734375, 0.32232666015625, 0.3343505859375, 0.34637451171875, 0.3583984375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 7.0, 8.0, 11.0, 11.0, 14.0, 9.0, 21.0, 13.0, 20.0, 18.0, 20.0, 37.0, 51.0, 63.0, 53.0, 46.0, 48.0, 45.0, 49.0, 40.0, 45.0, 55.0, 39.0, 37.0, 43.0, 22.0, 34.0, 24.0, 14.0, 13.0, 11.0, 11.0, 9.0, 8.0, 9.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.06640625, -0.06417655944824219, -0.061946868896484375, -0.05971717834472656, -0.05748748779296875, -0.05525779724121094, -0.053028106689453125, -0.05079841613769531, -0.0485687255859375, -0.04633903503417969, -0.044109344482421875, -0.04187965393066406, -0.03964996337890625, -0.03742027282714844, -0.035190582275390625, -0.03296089172363281, -0.030731201171875, -0.028501510620117188, -0.026271820068359375, -0.024042129516601562, -0.02181243896484375, -0.019582748413085938, -0.017353057861328125, -0.015123367309570312, -0.0128936767578125, -0.010663986206054688, -0.008434295654296875, -0.0062046051025390625, -0.00397491455078125, -0.0017452239990234375, 0.000484466552734375, 0.0027141571044921875, 0.00494384765625, 0.0071735382080078125, 0.009403228759765625, 0.011632919311523438, 0.01386260986328125, 0.016092300415039062, 0.018321990966796875, 0.020551681518554688, 0.0227813720703125, 0.025011062622070312, 0.027240753173828125, 0.029470443725585938, 0.03170013427734375, 0.03392982482910156, 0.036159515380859375, 0.03838920593261719, 0.040618896484375, 0.04284858703613281, 0.045078277587890625, 0.04730796813964844, 0.04953765869140625, 0.05176734924316406, 0.053997039794921875, 0.05622673034667969, 0.0584564208984375, 0.06068611145019531, 0.06291580200195312, 0.06514549255371094, 0.06737518310546875, 0.06960487365722656, 0.07183456420898438, 0.07406425476074219, 0.0762939453125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 8.0, 7.0, 10.0, 14.0, 13.0, 15.0, 20.0, 27.0, 45.0, 48.0, 60.0, 56.0, 135.0, 220.0, 409.0, 2091.0, 78093.0, 957944.0, 7696.0, 761.0, 277.0, 161.0, 100.0, 73.0, 46.0, 34.0, 27.0, 18.0, 24.0, 19.0, 11.0, 11.0, 10.0, 7.0, 12.0, 3.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.5185546875, -1.4741973876953125, -1.429840087890625, -1.3854827880859375, -1.34112548828125, -1.2967681884765625, -1.252410888671875, -1.2080535888671875, -1.1636962890625, -1.1193389892578125, -1.074981689453125, -1.0306243896484375, -0.98626708984375, -0.9419097900390625, -0.897552490234375, -0.8531951904296875, -0.808837890625, -0.7644805908203125, -0.720123291015625, -0.6757659912109375, -0.63140869140625, -0.5870513916015625, -0.542694091796875, -0.4983367919921875, -0.4539794921875, -0.4096221923828125, -0.365264892578125, -0.3209075927734375, -0.27655029296875, -0.2321929931640625, -0.187835693359375, -0.1434783935546875, -0.09912109375, -0.0547637939453125, -0.010406494140625, 0.0339508056640625, 0.07830810546875, 0.1226654052734375, 0.167022705078125, 0.2113800048828125, 0.2557373046875, 0.3000946044921875, 0.344451904296875, 0.3888092041015625, 0.43316650390625, 0.4775238037109375, 0.521881103515625, 0.5662384033203125, 0.610595703125, 0.6549530029296875, 0.699310302734375, 0.7436676025390625, 0.78802490234375, 0.8323822021484375, 0.876739501953125, 0.9210968017578125, 0.9654541015625, 1.0098114013671875, 1.054168701171875, 1.0985260009765625, 1.14288330078125, 1.1872406005859375, 1.231597900390625, 1.2759552001953125, 1.3203125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 5.0, 10.0, 40.0, 89.0, 388.0, 342.0, 89.0, 34.0, 11.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17508479952812195, -0.14563986659049988, -0.11619493365287781, -0.08675000071525574, -0.05730506777763367, -0.027860134840011597, 0.0015847980976104736, 0.031029731035232544, 0.060474663972854614, 0.08991959691047668, 0.11936452984809875, 0.14880946278572083, 0.1782543957233429, 0.20769932866096497, 0.23714426159858704, 0.2665891945362091, 0.2960341274738312, 0.32547906041145325, 0.3549239933490753, 0.3843689262866974, 0.41381385922431946, 0.44325879216194153, 0.4727037250995636, 0.5021486282348633, 0.5315935611724854, 0.5610384941101074, 0.5904834270477295, 0.6199283599853516, 0.6493732929229736, 0.6788182258605957, 0.7082631587982178, 0.7377080917358398, 0.7671530246734619, 0.796597957611084, 0.826042890548706, 0.8554878234863281, 0.8849327564239502, 0.9143776893615723, 0.9438226222991943, 0.9732675552368164, 1.0027124881744385, 1.0321574211120605, 1.0616023540496826, 1.0910472869873047, 1.1204922199249268, 1.1499371528625488, 1.179382085800171, 1.208827018737793, 1.238271951675415, 1.267716884613037, 1.2971618175506592, 1.3266067504882812, 1.3560516834259033, 1.3854966163635254, 1.4149415493011475, 1.4443864822387695, 1.4738314151763916, 1.5032763481140137, 1.5327212810516357, 1.5621662139892578, 1.5916111469268799, 1.621056079864502, 1.650501012802124, 1.679945945739746, 1.7093908786773682]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 3.0, 11.0, 7.0, 5.0, 11.0, 11.0, 12.0, 9.0, 16.0, 14.0, 16.0, 21.0, 20.0, 20.0, 32.0, 35.0, 31.0, 24.0, 26.0, 41.0, 38.0, 34.0, 40.0, 34.0, 37.0, 39.0, 40.0, 40.0, 30.0, 32.0, 37.0, 24.0, 21.0, 28.0, 34.0, 17.0, 17.0, 13.0, 13.0, 14.0, 7.0, 7.0, 8.0, 4.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 6.0, 2.0, 1.0], "bins": [-0.2874789237976074, -0.27904948592185974, -0.27062007784843445, -0.26219063997268677, -0.2537612318992615, -0.2453317940235138, -0.2369023710489273, -0.22847294807434082, -0.22004352509975433, -0.21161410212516785, -0.20318467915058136, -0.19475525617599487, -0.1863258183002472, -0.1778964102268219, -0.16946697235107422, -0.16103754937648773, -0.15260812640190125, -0.14417870342731476, -0.13574928045272827, -0.12731985747814178, -0.1188904270529747, -0.11046100407838821, -0.10203157365322113, -0.09360215067863464, -0.08517272770404816, -0.07674330472946167, -0.06831388175487518, -0.0598844513297081, -0.05145502835512161, -0.043025605380535126, -0.03459617868065834, -0.026166751980781555, -0.01773732900619507, -0.009307904168963432, -0.0008784793317317963, 0.00755094550549984, 0.015980370342731476, 0.024409793317317963, 0.03283922001719475, 0.04126864671707153, 0.04969806969165802, 0.05812749266624451, 0.066556915640831, 0.07498634606599808, 0.08341576904058456, 0.09184519201517105, 0.10027462244033813, 0.10870404541492462, 0.11713346838951111, 0.1255628913640976, 0.13399231433868408, 0.14242173731327057, 0.15085116028785706, 0.15928059816360474, 0.16771002113819122, 0.1761394441127777, 0.1845688670873642, 0.19299829006195068, 0.20142771303653717, 0.20985713601112366, 0.21828657388687134, 0.22671598196029663, 0.2351454198360443, 0.2435748428106308, 0.2520042657852173]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 9.0, 3.0, 3.0, 9.0, 11.0, 7.0, 12.0, 8.0, 12.0, 9.0, 15.0, 21.0, 19.0, 32.0, 24.0, 27.0, 33.0, 40.0, 39.0, 51.0, 38.0, 46.0, 46.0, 35.0, 47.0, 36.0, 43.0, 42.0, 28.0, 24.0, 32.0, 34.0, 28.0, 26.0, 20.0, 15.0, 16.0, 9.0, 10.0, 10.0, 7.0, 7.0, 6.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0], "bins": [-7.69921875, -7.49005126953125, -7.2808837890625, -7.07171630859375, -6.862548828125, -6.65338134765625, -6.4442138671875, -6.23504638671875, -6.02587890625, -5.81671142578125, -5.6075439453125, -5.39837646484375, -5.189208984375, -4.98004150390625, -4.7708740234375, -4.56170654296875, -4.3525390625, -4.14337158203125, -3.9342041015625, -3.72503662109375, -3.515869140625, -3.30670166015625, -3.0975341796875, -2.88836669921875, -2.67919921875, -2.47003173828125, -2.2608642578125, -2.05169677734375, -1.842529296875, -1.63336181640625, -1.4241943359375, -1.21502685546875, -1.005859375, -0.79669189453125, -0.5875244140625, -0.37835693359375, -0.169189453125, 0.03997802734375, 0.2491455078125, 0.45831298828125, 0.66748046875, 0.87664794921875, 1.0858154296875, 1.29498291015625, 1.504150390625, 1.71331787109375, 1.9224853515625, 2.13165283203125, 2.3408203125, 2.54998779296875, 2.7591552734375, 2.96832275390625, 3.177490234375, 3.38665771484375, 3.5958251953125, 3.80499267578125, 4.01416015625, 4.22332763671875, 4.4324951171875, 4.64166259765625, 4.850830078125, 5.05999755859375, 5.2691650390625, 5.47833251953125, 5.6875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 6.0, 16.0, 14.0, 20.0, 28.0, 38.0, 52.0, 79.0, 109.0, 137.0, 208.0, 274.0, 363.0, 552.0, 682.0, 1003.0, 1332.0, 1886.0, 2429.0, 3527.0, 5366.0, 9080.0, 19869.0, 54726.0, 224417.0, 504071.0, 139584.0, 39462.0, 15270.0, 7765.0, 4621.0, 3147.0, 2364.0, 1608.0, 1171.0, 873.0, 668.0, 472.0, 363.0, 262.0, 181.0, 129.0, 97.0, 76.0, 56.0, 35.0, 17.0, 27.0, 11.0, 7.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0], "bins": [-8.96875, -8.6998291015625, -8.430908203125, -8.1619873046875, -7.89306640625, -7.6241455078125, -7.355224609375, -7.0863037109375, -6.8173828125, -6.5484619140625, -6.279541015625, -6.0106201171875, -5.74169921875, -5.4727783203125, -5.203857421875, -4.9349365234375, -4.666015625, -4.3970947265625, -4.128173828125, -3.8592529296875, -3.59033203125, -3.3214111328125, -3.052490234375, -2.7835693359375, -2.5146484375, -2.2457275390625, -1.976806640625, -1.7078857421875, -1.43896484375, -1.1700439453125, -0.901123046875, -0.6322021484375, -0.36328125, -0.0943603515625, 0.174560546875, 0.4434814453125, 0.71240234375, 0.9813232421875, 1.250244140625, 1.5191650390625, 1.7880859375, 2.0570068359375, 2.325927734375, 2.5948486328125, 2.86376953125, 3.1326904296875, 3.401611328125, 3.6705322265625, 3.939453125, 4.2083740234375, 4.477294921875, 4.7462158203125, 5.01513671875, 5.2840576171875, 5.552978515625, 5.8218994140625, 6.0908203125, 6.3597412109375, 6.628662109375, 6.8975830078125, 7.16650390625, 7.4354248046875, 7.704345703125, 7.9732666015625, 8.2421875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 7.0, 8.0, 9.0, 20.0, 17.0, 13.0, 31.0, 14.0, 30.0, 31.0, 27.0, 43.0, 38.0, 57.0, 44.0, 77.0, 159.0, 1552.0, 300.0, 101.0, 71.0, 54.0, 48.0, 40.0, 36.0, 34.0, 29.0, 20.0, 20.0, 14.0, 18.0, 17.0, 14.0, 8.0, 15.0, 6.0, 2.0, 6.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.390625, -19.65673828125, -18.9228515625, -18.18896484375, -17.455078125, -16.72119140625, -15.9873046875, -15.25341796875, -14.51953125, -13.78564453125, -13.0517578125, -12.31787109375, -11.583984375, -10.85009765625, -10.1162109375, -9.38232421875, -8.6484375, -7.91455078125, -7.1806640625, -6.44677734375, -5.712890625, -4.97900390625, -4.2451171875, -3.51123046875, -2.77734375, -2.04345703125, -1.3095703125, -0.57568359375, 0.158203125, 0.89208984375, 1.6259765625, 2.35986328125, 3.09375, 3.82763671875, 4.5615234375, 5.29541015625, 6.029296875, 6.76318359375, 7.4970703125, 8.23095703125, 8.96484375, 9.69873046875, 10.4326171875, 11.16650390625, 11.900390625, 12.63427734375, 13.3681640625, 14.10205078125, 14.8359375, 15.56982421875, 16.3037109375, 17.03759765625, 17.771484375, 18.50537109375, 19.2392578125, 19.97314453125, 20.70703125, 21.44091796875, 22.1748046875, 22.90869140625, 23.642578125, 24.37646484375, 25.1103515625, 25.84423828125, 26.578125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 13.0, 22.0, 15.0, 26.0, 30.0, 31.0, 53.0, 79.0, 111.0, 144.0, 261.0, 433.0, 1149.0, 4233.0, 23021.0, 2182775.0, 908671.0, 18739.0, 3719.0, 1001.0, 420.0, 227.0, 158.0, 100.0, 57.0, 43.0, 35.0, 32.0, 27.0, 17.0, 19.0, 10.0, 3.0, 7.0, 7.0, 2.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.8125, -41.3828125, -39.953125, -38.5234375, -37.09375, -35.6640625, -34.234375, -32.8046875, -31.375, -29.9453125, -28.515625, -27.0859375, -25.65625, -24.2265625, -22.796875, -21.3671875, -19.9375, -18.5078125, -17.078125, -15.6484375, -14.21875, -12.7890625, -11.359375, -9.9296875, -8.5, -7.0703125, -5.640625, -4.2109375, -2.78125, -1.3515625, 0.078125, 1.5078125, 2.9375, 4.3671875, 5.796875, 7.2265625, 8.65625, 10.0859375, 11.515625, 12.9453125, 14.375, 15.8046875, 17.234375, 18.6640625, 20.09375, 21.5234375, 22.953125, 24.3828125, 25.8125, 27.2421875, 28.671875, 30.1015625, 31.53125, 32.9609375, 34.390625, 35.8203125, 37.25, 38.6796875, 40.109375, 41.5390625, 42.96875, 44.3984375, 45.828125, 47.2578125, 48.6875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 54.0, 760.0, 204.0], "bins": [-727.6083374023438, -715.9910278320312, -704.3737182617188, -692.7564697265625, -681.13916015625, -669.5218505859375, -657.904541015625, -646.2872314453125, -634.669921875, -623.0526123046875, -611.435302734375, -599.8180541992188, -588.2007446289062, -576.5834350585938, -564.9661254882812, -553.3488159179688, -541.7315673828125, -530.1142578125, -518.4969482421875, -506.8796691894531, -495.26239013671875, -483.64508056640625, -472.02777099609375, -460.41046142578125, -448.7931823730469, -437.1758728027344, -425.55859375, -413.9412841796875, -402.323974609375, -390.7066955566406, -379.0893859863281, -367.47210693359375, -355.85479736328125, -344.23748779296875, -332.6202087402344, -321.0028991699219, -309.3856201171875, -297.768310546875, -286.1510009765625, -274.53369140625, -262.9164123535156, -251.2991180419922, -239.68182373046875, -228.06451416015625, -216.4472198486328, -204.82992553710938, -193.21261596679688, -181.59532165527344, -169.97804260253906, -158.36074829101562, -146.74343872070312, -135.1261444091797, -123.50885009765625, -111.89155578613281, -100.27425384521484, -88.65695190429688, -77.03965759277344, -65.42236328125, -53.80506134033203, -42.18776321411133, -30.570465087890625, -18.953166961669922, -7.335868835449219, 4.28143310546875, 15.898731231689453]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 2.0, 6.0, 6.0, 4.0, 13.0, 15.0, 14.0, 11.0, 26.0, 21.0, 26.0, 21.0, 16.0, 26.0, 25.0, 34.0, 34.0, 36.0, 35.0, 38.0, 35.0, 41.0, 34.0, 35.0, 40.0, 29.0, 34.0, 40.0, 30.0, 29.0, 28.0, 37.0, 24.0, 21.0, 17.0, 19.0, 15.0, 13.0, 7.0, 11.0, 14.0, 8.0, 9.0, 2.0, 3.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-57.890052795410156, -56.039669036865234, -54.18928527832031, -52.338905334472656, -50.488521575927734, -48.63813781738281, -46.787757873535156, -44.937374114990234, -43.08699035644531, -41.23660659790039, -39.38622283935547, -37.53584289550781, -35.68545913696289, -33.83507537841797, -31.98469352722168, -30.13431167602539, -28.28392791748047, -26.433544158935547, -24.583162307739258, -22.73278045654297, -20.882396697998047, -19.032012939453125, -17.181631088256836, -15.33124828338623, -13.480865478515625, -11.63048267364502, -9.780099868774414, -7.929717063903809, -6.079334259033203, -4.228951454162598, -2.378568649291992, -0.5281858444213867, 1.3222007751464844, 3.17258358001709, 5.022966384887695, 6.873349189758301, 8.723731994628906, 10.574114799499512, 12.424497604370117, 14.274880409240723, 16.125263214111328, 17.97564697265625, 19.82602882385254, 21.676410675048828, 23.52679443359375, 25.377178192138672, 27.22756004333496, 29.07794189453125, 30.928325653076172, 32.778709411621094, 34.62908935546875, 36.47947311401367, 38.329856872558594, 40.180240631103516, 42.03062438964844, 43.881004333496094, 45.731388092041016, 47.58177185058594, 49.432151794433594, 51.282535552978516, 53.13291931152344, 54.98330307006836, 56.83368682861328, 58.68406677246094, 60.53445053100586]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 7.0, 5.0, 4.0, 10.0, 9.0, 10.0, 8.0, 10.0, 13.0, 14.0, 24.0, 19.0, 17.0, 33.0, 36.0, 30.0, 35.0, 41.0, 33.0, 43.0, 37.0, 51.0, 42.0, 52.0, 40.0, 47.0, 36.0, 22.0, 29.0, 38.0, 27.0, 25.0, 20.0, 28.0, 13.0, 13.0, 21.0, 11.0, 12.0, 5.0, 7.0, 8.0, 6.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0], "bins": [-8.0703125, -7.852783203125, -7.63525390625, -7.417724609375, -7.2001953125, -6.982666015625, -6.76513671875, -6.547607421875, -6.330078125, -6.112548828125, -5.89501953125, -5.677490234375, -5.4599609375, -5.242431640625, -5.02490234375, -4.807373046875, -4.58984375, -4.372314453125, -4.15478515625, -3.937255859375, -3.7197265625, -3.502197265625, -3.28466796875, -3.067138671875, -2.849609375, -2.632080078125, -2.41455078125, -2.197021484375, -1.9794921875, -1.761962890625, -1.54443359375, -1.326904296875, -1.109375, -0.891845703125, -0.67431640625, -0.456787109375, -0.2392578125, -0.021728515625, 0.19580078125, 0.413330078125, 0.630859375, 0.848388671875, 1.06591796875, 1.283447265625, 1.5009765625, 1.718505859375, 1.93603515625, 2.153564453125, 2.37109375, 2.588623046875, 2.80615234375, 3.023681640625, 3.2412109375, 3.458740234375, 3.67626953125, 3.893798828125, 4.111328125, 4.328857421875, 4.54638671875, 4.763916015625, 4.9814453125, 5.198974609375, 5.41650390625, 5.634033203125, 5.8515625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 6.0, 5.0, 6.0, 8.0, 7.0, 14.0, 14.0, 26.0, 37.0, 67.0, 87.0, 154.0, 252.0, 446.0, 817.0, 1420.0, 2754.0, 5599.0, 12068.0, 28660.0, 95322.0, 798084.0, 2727034.0, 414070.0, 65984.0, 22244.0, 9582.0, 4466.0, 2273.0, 1134.0, 656.0, 397.0, 213.0, 124.0, 82.0, 48.0, 38.0, 29.0, 18.0, 10.0, 12.0, 7.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.75, -17.124267578125, -16.49853515625, -15.872802734375, -15.2470703125, -14.621337890625, -13.99560546875, -13.369873046875, -12.744140625, -12.118408203125, -11.49267578125, -10.866943359375, -10.2412109375, -9.615478515625, -8.98974609375, -8.364013671875, -7.73828125, -7.112548828125, -6.48681640625, -5.861083984375, -5.2353515625, -4.609619140625, -3.98388671875, -3.358154296875, -2.732421875, -2.106689453125, -1.48095703125, -0.855224609375, -0.2294921875, 0.396240234375, 1.02197265625, 1.647705078125, 2.2734375, 2.899169921875, 3.52490234375, 4.150634765625, 4.7763671875, 5.402099609375, 6.02783203125, 6.653564453125, 7.279296875, 7.905029296875, 8.53076171875, 9.156494140625, 9.7822265625, 10.407958984375, 11.03369140625, 11.659423828125, 12.28515625, 12.910888671875, 13.53662109375, 14.162353515625, 14.7880859375, 15.413818359375, 16.03955078125, 16.665283203125, 17.291015625, 17.916748046875, 18.54248046875, 19.168212890625, 19.7939453125, 20.419677734375, 21.04541015625, 21.671142578125, 22.296875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 7.0, 9.0, 13.0, 19.0, 29.0, 48.0, 69.0, 91.0, 167.0, 291.0, 429.0, 652.0, 753.0, 552.0, 328.0, 211.0, 116.0, 104.0, 61.0, 35.0, 19.0, 15.0, 17.0, 9.0, 10.0, 11.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.21875, -31.473388671875, -30.72802734375, -29.982666015625, -29.2373046875, -28.491943359375, -27.74658203125, -27.001220703125, -26.255859375, -25.510498046875, -24.76513671875, -24.019775390625, -23.2744140625, -22.529052734375, -21.78369140625, -21.038330078125, -20.29296875, -19.547607421875, -18.80224609375, -18.056884765625, -17.3115234375, -16.566162109375, -15.82080078125, -15.075439453125, -14.330078125, -13.584716796875, -12.83935546875, -12.093994140625, -11.3486328125, -10.603271484375, -9.85791015625, -9.112548828125, -8.3671875, -7.621826171875, -6.87646484375, -6.131103515625, -5.3857421875, -4.640380859375, -3.89501953125, -3.149658203125, -2.404296875, -1.658935546875, -0.91357421875, -0.168212890625, 0.5771484375, 1.322509765625, 2.06787109375, 2.813232421875, 3.55859375, 4.303955078125, 5.04931640625, 5.794677734375, 6.5400390625, 7.285400390625, 8.03076171875, 8.776123046875, 9.521484375, 10.266845703125, 11.01220703125, 11.757568359375, 12.5029296875, 13.248291015625, 13.99365234375, 14.739013671875, 15.484375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 8.0, 13.0, 8.0, 30.0, 29.0, 53.0, 68.0, 88.0, 170.0, 361.0, 791.0, 1867.0, 5089.0, 15984.0, 62787.0, 431453.0, 3090150.0, 491118.0, 68356.0, 16779.0, 5478.0, 1972.0, 836.0, 353.0, 177.0, 115.0, 49.0, 32.0, 24.0, 19.0, 8.0, 8.0, 9.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.609375, -24.520751953125, -23.43212890625, -22.343505859375, -21.2548828125, -20.166259765625, -19.07763671875, -17.989013671875, -16.900390625, -15.811767578125, -14.72314453125, -13.634521484375, -12.5458984375, -11.457275390625, -10.36865234375, -9.280029296875, -8.19140625, -7.102783203125, -6.01416015625, -4.925537109375, -3.8369140625, -2.748291015625, -1.65966796875, -0.571044921875, 0.517578125, 1.606201171875, 2.69482421875, 3.783447265625, 4.8720703125, 5.960693359375, 7.04931640625, 8.137939453125, 9.2265625, 10.315185546875, 11.40380859375, 12.492431640625, 13.5810546875, 14.669677734375, 15.75830078125, 16.846923828125, 17.935546875, 19.024169921875, 20.11279296875, 21.201416015625, 22.2900390625, 23.378662109375, 24.46728515625, 25.555908203125, 26.64453125, 27.733154296875, 28.82177734375, 29.910400390625, 30.9990234375, 32.087646484375, 33.17626953125, 34.264892578125, 35.353515625, 36.442138671875, 37.53076171875, 38.619384765625, 39.7080078125, 40.796630859375, 41.88525390625, 42.973876953125, 44.0625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 7.0, 7.0, 15.0, 33.0, 56.0, 81.0, 134.0, 153.0, 140.0, 125.0, 106.0, 59.0, 39.0, 27.0, 14.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-217.85951232910156, -213.31866455078125, -208.77783203125, -204.23699951171875, -199.69615173339844, -195.15530395507812, -190.61447143554688, -186.07363891601562, -181.5327911376953, -176.991943359375, -172.45111083984375, -167.9102783203125, -163.3694305419922, -158.82858276367188, -154.28775024414062, -149.74691772460938, -145.20606994628906, -140.66522216796875, -136.1243896484375, -131.58355712890625, -127.04270935058594, -122.50186920166016, -117.96102905273438, -113.4201889038086, -108.87934875488281, -104.33850860595703, -99.79766845703125, -95.25682830810547, -90.71598815917969, -86.1751480102539, -81.63430786132812, -77.09346771240234, -72.5526351928711, -68.01179504394531, -63.47095489501953, -58.93011474609375, -54.38927459716797, -49.84843444824219, -45.307594299316406, -40.766754150390625, -36.225914001464844, -31.685073852539062, -27.14423370361328, -22.6033935546875, -18.06255340576172, -13.521713256835938, -8.980873107910156, -4.440032958984375, 0.10080718994140625, 4.6416473388671875, 9.182487487792969, 13.72332763671875, 18.26416778564453, 22.805007934570312, 27.345848083496094, 31.886688232421875, 36.427528381347656, 40.96836853027344, 45.50920867919922, 50.050048828125, 54.59088897705078, 59.13172912597656, 63.672569274902344, 68.21340942382812, 72.7542495727539]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 3.0, 6.0, 6.0, 4.0, 8.0, 8.0, 11.0, 10.0, 5.0, 18.0, 18.0, 26.0, 23.0, 33.0, 43.0, 28.0, 36.0, 30.0, 32.0, 43.0, 47.0, 52.0, 41.0, 49.0, 33.0, 44.0, 40.0, 46.0, 30.0, 29.0, 24.0, 31.0, 26.0, 30.0, 18.0, 18.0, 9.0, 4.0, 5.0, 5.0, 9.0, 4.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.053070068359375, -59.09006881713867, -57.1270637512207, -55.1640625, -53.2010612487793, -51.238059997558594, -49.275054931640625, -47.31205368041992, -45.34905242919922, -43.386051177978516, -41.42304611206055, -39.460044860839844, -37.49704360961914, -35.53404235839844, -33.57103729248047, -31.608036041259766, -29.645030975341797, -27.68202781677246, -25.719026565551758, -23.756023406982422, -21.79302215576172, -19.830018997192383, -17.867015838623047, -15.904013633728027, -13.941011428833008, -11.978009223937988, -10.015007019042969, -8.052003860473633, -6.089001655578613, -4.125999450683594, -2.162996292114258, -0.19999408721923828, 1.7630081176757812, 3.72601056098938, 5.6890130043029785, 7.652015686035156, 9.615017890930176, 11.578020095825195, 13.541023254394531, 15.50402545928955, 17.46702766418457, 19.430030822753906, 21.39303207397461, 23.356035232543945, 25.31903839111328, 27.282039642333984, 29.24504280090332, 31.208045959472656, 33.17104721069336, 35.13404846191406, 37.09705352783203, 39.060054779052734, 41.02305603027344, 42.986061096191406, 44.94906234741211, 46.91206359863281, 48.87506866455078, 50.838069915771484, 52.80107498168945, 54.764076232910156, 56.72707748413086, 58.69007873535156, 60.65308380126953, 62.616085052490234, 64.57908630371094]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 2.0, 5.0, 13.0, 9.0, 13.0, 13.0, 12.0, 13.0, 13.0, 22.0, 24.0, 27.0, 20.0, 32.0, 41.0, 46.0, 33.0, 50.0, 38.0, 43.0, 42.0, 46.0, 45.0, 38.0, 36.0, 47.0, 34.0, 24.0, 34.0, 18.0, 23.0, 22.0, 23.0, 15.0, 12.0, 9.0, 10.0, 10.0, 12.0, 8.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.58203125, -7.3623046875, -7.142578125, -6.9228515625, -6.703125, -6.4833984375, -6.263671875, -6.0439453125, -5.82421875, -5.6044921875, -5.384765625, -5.1650390625, -4.9453125, -4.7255859375, -4.505859375, -4.2861328125, -4.06640625, -3.8466796875, -3.626953125, -3.4072265625, -3.1875, -2.9677734375, -2.748046875, -2.5283203125, -2.30859375, -2.0888671875, -1.869140625, -1.6494140625, -1.4296875, -1.2099609375, -0.990234375, -0.7705078125, -0.55078125, -0.3310546875, -0.111328125, 0.1083984375, 0.328125, 0.5478515625, 0.767578125, 0.9873046875, 1.20703125, 1.4267578125, 1.646484375, 1.8662109375, 2.0859375, 2.3056640625, 2.525390625, 2.7451171875, 2.96484375, 3.1845703125, 3.404296875, 3.6240234375, 3.84375, 4.0634765625, 4.283203125, 4.5029296875, 4.72265625, 4.9423828125, 5.162109375, 5.3818359375, 5.6015625, 5.8212890625, 6.041015625, 6.2607421875, 6.48046875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 12.0, 15.0, 14.0, 20.0, 31.0, 49.0, 56.0, 94.0, 171.0, 241.0, 399.0, 546.0, 781.0, 1236.0, 1884.0, 2863.0, 4438.0, 6846.0, 11219.0, 17956.0, 30096.0, 51186.0, 88877.0, 154248.0, 228397.0, 183555.0, 108196.0, 61781.0, 35810.0, 21497.0, 12890.0, 8174.0, 5276.0, 3301.0, 2198.0, 1427.0, 941.0, 614.0, 405.0, 232.0, 190.0, 117.0, 76.0, 72.0, 39.0, 31.0, 25.0, 13.0, 10.0, 6.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0771484375, -1.039581298828125, -1.00201416015625, -0.964447021484375, -0.9268798828125, -0.889312744140625, -0.85174560546875, -0.814178466796875, -0.776611328125, -0.739044189453125, -0.70147705078125, -0.663909912109375, -0.6263427734375, -0.588775634765625, -0.55120849609375, -0.513641357421875, -0.47607421875, -0.438507080078125, -0.40093994140625, -0.363372802734375, -0.3258056640625, -0.288238525390625, -0.25067138671875, -0.213104248046875, -0.175537109375, -0.137969970703125, -0.10040283203125, -0.062835693359375, -0.0252685546875, 0.012298583984375, 0.04986572265625, 0.087432861328125, 0.125, 0.162567138671875, 0.20013427734375, 0.237701416015625, 0.2752685546875, 0.312835693359375, 0.35040283203125, 0.387969970703125, 0.425537109375, 0.463104248046875, 0.50067138671875, 0.538238525390625, 0.5758056640625, 0.613372802734375, 0.65093994140625, 0.688507080078125, 0.72607421875, 0.763641357421875, 0.80120849609375, 0.838775634765625, 0.8763427734375, 0.913909912109375, 0.95147705078125, 0.989044189453125, 1.026611328125, 1.064178466796875, 1.10174560546875, 1.139312744140625, 1.1768798828125, 1.214447021484375, 1.25201416015625, 1.289581298828125, 1.3271484375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 11.0, 12.0, 10.0, 16.0, 10.0, 17.0, 17.0, 16.0, 8.0, 33.0, 19.0, 22.0, 34.0, 21.0, 33.0, 43.0, 31.0, 36.0, 32.0, 36.0, 1054.0, 37.0, 42.0, 40.0, 41.0, 33.0, 34.0, 26.0, 24.0, 28.0, 27.0, 13.0, 25.0, 22.0, 23.0, 14.0, 14.0, 12.0, 10.0, 6.0, 7.0, 7.0, 4.0, 2.0, 1.0, 7.0, 6.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.96484375, -3.84027099609375, -3.7156982421875, -3.59112548828125, -3.466552734375, -3.34197998046875, -3.2174072265625, -3.09283447265625, -2.96826171875, -2.84368896484375, -2.7191162109375, -2.59454345703125, -2.469970703125, -2.34539794921875, -2.2208251953125, -2.09625244140625, -1.9716796875, -1.84710693359375, -1.7225341796875, -1.59796142578125, -1.473388671875, -1.34881591796875, -1.2242431640625, -1.09967041015625, -0.97509765625, -0.85052490234375, -0.7259521484375, -0.60137939453125, -0.476806640625, -0.35223388671875, -0.2276611328125, -0.10308837890625, 0.021484375, 0.14605712890625, 0.2706298828125, 0.39520263671875, 0.519775390625, 0.64434814453125, 0.7689208984375, 0.89349365234375, 1.01806640625, 1.14263916015625, 1.2672119140625, 1.39178466796875, 1.516357421875, 1.64093017578125, 1.7655029296875, 1.89007568359375, 2.0146484375, 2.13922119140625, 2.2637939453125, 2.38836669921875, 2.512939453125, 2.63751220703125, 2.7620849609375, 2.88665771484375, 3.01123046875, 3.13580322265625, 3.2603759765625, 3.38494873046875, 3.509521484375, 3.63409423828125, 3.7586669921875, 3.88323974609375, 4.0078125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 0.0, 6.0, 2.0, 7.0, 10.0, 11.0, 12.0, 27.0, 30.0, 38.0, 49.0, 69.0, 104.0, 155.0, 210.0, 368.0, 485.0, 898.0, 1341.0, 2217.0, 3532.0, 5974.0, 9991.0, 17262.0, 30365.0, 52681.0, 94966.0, 177568.0, 1206583.0, 229081.0, 114111.0, 62854.0, 35713.0, 20280.0, 12031.0, 7038.0, 4168.0, 2565.0, 1545.0, 949.0, 590.0, 418.0, 270.0, 156.0, 123.0, 90.0, 56.0, 37.0, 30.0, 22.0, 20.0, 13.0, 8.0, 5.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.482421875, -0.4676475524902344, -0.45287322998046875, -0.4380989074707031, -0.4233245849609375, -0.4085502624511719, -0.39377593994140625, -0.3790016174316406, -0.364227294921875, -0.3494529724121094, -0.33467864990234375, -0.3199043273925781, -0.3051300048828125, -0.2903556823730469, -0.27558135986328125, -0.2608070373535156, -0.24603271484375, -0.23125839233398438, -0.21648406982421875, -0.20170974731445312, -0.1869354248046875, -0.17216110229492188, -0.15738677978515625, -0.14261245727539062, -0.127838134765625, -0.11306381225585938, -0.09828948974609375, -0.08351516723632812, -0.0687408447265625, -0.053966522216796875, -0.03919219970703125, -0.024417877197265625, -0.0096435546875, 0.005130767822265625, 0.01990509033203125, 0.034679412841796875, 0.0494537353515625, 0.06422805786132812, 0.07900238037109375, 0.09377670288085938, 0.108551025390625, 0.12332534790039062, 0.13809967041015625, 0.15287399291992188, 0.1676483154296875, 0.18242263793945312, 0.19719696044921875, 0.21197128295898438, 0.22674560546875, 0.24151992797851562, 0.25629425048828125, 0.2710685729980469, 0.2858428955078125, 0.3006172180175781, 0.31539154052734375, 0.3301658630371094, 0.344940185546875, 0.3597145080566406, 0.37448883056640625, 0.3892631530761719, 0.4040374755859375, 0.4188117980957031, 0.43358612060546875, 0.4483604431152344, 0.463134765625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 6.0, 6.0, 5.0, 7.0, 13.0, 12.0, 17.0, 14.0, 14.0, 35.0, 62.0, 127.0, 187.0, 191.0, 94.0, 41.0, 30.0, 14.0, 12.0, 17.0, 20.0, 8.0, 8.0, 10.0, 4.0, 7.0, 7.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.19091796875, -0.18510818481445312, -0.17929840087890625, -0.17348861694335938, -0.1676788330078125, -0.16186904907226562, -0.15605926513671875, -0.15024948120117188, -0.144439697265625, -0.13862991333007812, -0.13282012939453125, -0.12701034545898438, -0.1212005615234375, -0.11539077758789062, -0.10958099365234375, -0.10377120971679688, -0.09796142578125, -0.09215164184570312, -0.08634185791015625, -0.08053207397460938, -0.0747222900390625, -0.06891250610351562, -0.06310272216796875, -0.057292938232421875, -0.051483154296875, -0.045673370361328125, -0.03986358642578125, -0.034053802490234375, -0.0282440185546875, -0.022434234619140625, -0.01662445068359375, -0.010814666748046875, -0.0050048828125, 0.000804901123046875, 0.00661468505859375, 0.012424468994140625, 0.0182342529296875, 0.024044036865234375, 0.02985382080078125, 0.035663604736328125, 0.041473388671875, 0.047283172607421875, 0.05309295654296875, 0.058902740478515625, 0.0647125244140625, 0.07052230834960938, 0.07633209228515625, 0.08214187622070312, 0.08795166015625, 0.09376144409179688, 0.09957122802734375, 0.10538101196289062, 0.1111907958984375, 0.11700057983398438, 0.12281036376953125, 0.12862014770507812, 0.134429931640625, 0.14023971557617188, 0.14604949951171875, 0.15185928344726562, 0.1576690673828125, 0.16347885131835938, 0.16928863525390625, 0.17509841918945312, 0.180908203125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 8.0, 8.0, 4.0, 7.0, 7.0, 14.0, 23.0, 27.0, 35.0, 42.0, 119.0, 245.0, 1097.0, 84639.0, 959275.0, 2312.0, 329.0, 152.0, 56.0, 37.0, 26.0, 17.0, 13.0, 11.0, 6.0, 4.0, 8.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.80859375, -3.68621826171875, -3.5638427734375, -3.44146728515625, -3.319091796875, -3.19671630859375, -3.0743408203125, -2.95196533203125, -2.82958984375, -2.70721435546875, -2.5848388671875, -2.46246337890625, -2.340087890625, -2.21771240234375, -2.0953369140625, -1.97296142578125, -1.8505859375, -1.72821044921875, -1.6058349609375, -1.48345947265625, -1.361083984375, -1.23870849609375, -1.1163330078125, -0.99395751953125, -0.87158203125, -0.74920654296875, -0.6268310546875, -0.50445556640625, -0.382080078125, -0.25970458984375, -0.1373291015625, -0.01495361328125, 0.107421875, 0.22979736328125, 0.3521728515625, 0.47454833984375, 0.596923828125, 0.71929931640625, 0.8416748046875, 0.96405029296875, 1.08642578125, 1.20880126953125, 1.3311767578125, 1.45355224609375, 1.575927734375, 1.69830322265625, 1.8206787109375, 1.94305419921875, 2.0654296875, 2.18780517578125, 2.3101806640625, 2.43255615234375, 2.554931640625, 2.67730712890625, 2.7996826171875, 2.92205810546875, 3.04443359375, 3.16680908203125, 3.2891845703125, 3.41156005859375, 3.533935546875, 3.65631103515625, 3.7786865234375, 3.90106201171875, 4.0234375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 5.0, 3.0, 5.0, 15.0, 15.0, 13.0, 26.0, 47.0, 70.0, 106.0, 207.0, 222.0, 88.0, 63.0, 35.0, 29.0, 16.0, 12.0, 9.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.309217631816864, -0.2910042703151703, -0.2727908790111542, -0.25457751750946045, -0.23636414110660553, -0.2181507647037506, -0.19993740320205688, -0.18172402679920197, -0.16351065039634705, -0.14529727399349213, -0.1270838975906372, -0.10887053608894348, -0.09065715968608856, -0.07244378328323364, -0.05423041433095932, -0.036017045378685, -0.017803668975830078, 0.00040970370173454285, 0.018623076379299164, 0.036836449056863785, 0.055049821734428406, 0.07326319813728333, 0.09147656708955765, 0.10968993604183197, 0.1279033124446869, 0.1461166888475418, 0.16433006525039673, 0.18254342675209045, 0.20075680315494537, 0.2189701795578003, 0.23718354105949402, 0.25539690256118774, 0.2736102342605591, 0.2918235957622528, 0.3100369870662689, 0.32825034856796265, 0.34646373987197876, 0.3646771013736725, 0.3828904628753662, 0.4011038541793823, 0.41931721568107605, 0.4375305771827698, 0.4557439684867859, 0.4739573299884796, 0.49217069149017334, 0.5103840827941895, 0.5285974740982056, 0.5468108057975769, 0.565024197101593, 0.5832375884056091, 0.6014509201049805, 0.6196643114089966, 0.6378777027130127, 0.6560910940170288, 0.6743044257164001, 0.6925178170204163, 0.7107311487197876, 0.7289445400238037, 0.747157871723175, 0.7653712630271912, 0.7835846543312073, 0.8017979860305786, 0.8200113773345947, 0.8382247686386108, 0.856438159942627]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 7.0, 4.0, 9.0, 3.0, 12.0, 17.0, 13.0, 23.0, 18.0, 16.0, 19.0, 27.0, 21.0, 32.0, 38.0, 40.0, 29.0, 33.0, 38.0, 26.0, 43.0, 42.0, 37.0, 36.0, 33.0, 40.0, 34.0, 38.0, 37.0, 26.0, 31.0, 22.0, 10.0, 25.0, 24.0, 20.0, 14.0, 6.0, 6.0, 6.0, 12.0, 6.0, 4.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.41460734605789185, -0.4021484851837158, -0.3896896243095398, -0.37723076343536377, -0.36477190256118774, -0.3523130416870117, -0.3398541808128357, -0.32739534974098206, -0.31493648886680603, -0.30247762799263, -0.290018767118454, -0.27755990624427795, -0.26510104537010193, -0.2526422142982483, -0.24018333852291107, -0.22772449254989624, -0.21526561677455902, -0.202806755900383, -0.19034789502620697, -0.17788904905319214, -0.1654301881790161, -0.1529713273048401, -0.14051246643066406, -0.12805360555648804, -0.11559475213289261, -0.10313589125871658, -0.09067703783512115, -0.07821817696094513, -0.0657593160867691, -0.053300462663173676, -0.04084160178899765, -0.02838274836540222, -0.015923887491226196, -0.0034650294110178947, 0.008993828669190407, 0.021452687680721283, 0.03391154482960701, 0.04637040197849274, 0.05882926285266876, 0.07128811627626419, 0.08374697715044022, 0.09620583802461624, 0.10866469144821167, 0.1211235523223877, 0.13358241319656372, 0.14604127407073975, 0.15850013494491577, 0.1709589809179306, 0.18341784179210663, 0.19587670266628265, 0.20833556354045868, 0.2207944095134735, 0.23325327038764954, 0.24571213126182556, 0.2581709921360016, 0.2706298530101776, 0.28308871388435364, 0.29554757475852966, 0.3080064356327057, 0.3204652965068817, 0.33292415738105774, 0.3453829884529114, 0.3578418493270874, 0.3703007102012634, 0.38275957107543945]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 3.0, 3.0, 13.0, 9.0, 13.0, 14.0, 12.0, 13.0, 13.0, 22.0, 23.0, 27.0, 21.0, 32.0, 41.0, 44.0, 30.0, 54.0, 37.0, 41.0, 40.0, 50.0, 48.0, 37.0, 38.0, 42.0, 38.0, 23.0, 35.0, 18.0, 23.0, 21.0, 24.0, 15.0, 11.0, 9.0, 10.0, 10.0, 13.0, 7.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.59765625, -7.377685546875, -7.15771484375, -6.937744140625, -6.7177734375, -6.497802734375, -6.27783203125, -6.057861328125, -5.837890625, -5.617919921875, -5.39794921875, -5.177978515625, -4.9580078125, -4.738037109375, -4.51806640625, -4.298095703125, -4.078125, -3.858154296875, -3.63818359375, -3.418212890625, -3.1982421875, -2.978271484375, -2.75830078125, -2.538330078125, -2.318359375, -2.098388671875, -1.87841796875, -1.658447265625, -1.4384765625, -1.218505859375, -0.99853515625, -0.778564453125, -0.55859375, -0.338623046875, -0.11865234375, 0.101318359375, 0.3212890625, 0.541259765625, 0.76123046875, 0.981201171875, 1.201171875, 1.421142578125, 1.64111328125, 1.861083984375, 2.0810546875, 2.301025390625, 2.52099609375, 2.740966796875, 2.9609375, 3.180908203125, 3.40087890625, 3.620849609375, 3.8408203125, 4.060791015625, 4.28076171875, 4.500732421875, 4.720703125, 4.940673828125, 5.16064453125, 5.380615234375, 5.6005859375, 5.820556640625, 6.04052734375, 6.260498046875, 6.48046875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 11.0, 16.0, 17.0, 38.0, 38.0, 44.0, 52.0, 88.0, 137.0, 186.0, 278.0, 388.0, 488.0, 706.0, 1047.0, 1489.0, 2294.0, 3782.0, 7061.0, 16079.0, 46873.0, 156922.0, 398491.0, 274851.0, 86319.0, 26576.0, 10252.0, 4996.0, 2929.0, 1905.0, 1235.0, 873.0, 600.0, 415.0, 320.0, 222.0, 152.0, 109.0, 90.0, 42.0, 53.0, 29.0, 14.0, 13.0, 12.0, 8.0, 11.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.46875, -8.2020263671875, -7.935302734375, -7.6685791015625, -7.40185546875, -7.1351318359375, -6.868408203125, -6.6016845703125, -6.3349609375, -6.0682373046875, -5.801513671875, -5.5347900390625, -5.26806640625, -5.0013427734375, -4.734619140625, -4.4678955078125, -4.201171875, -3.9344482421875, -3.667724609375, -3.4010009765625, -3.13427734375, -2.8675537109375, -2.600830078125, -2.3341064453125, -2.0673828125, -1.8006591796875, -1.533935546875, -1.2672119140625, -1.00048828125, -0.7337646484375, -0.467041015625, -0.2003173828125, 0.06640625, 0.3331298828125, 0.599853515625, 0.8665771484375, 1.13330078125, 1.4000244140625, 1.666748046875, 1.9334716796875, 2.2001953125, 2.4669189453125, 2.733642578125, 3.0003662109375, 3.26708984375, 3.5338134765625, 3.800537109375, 4.0672607421875, 4.333984375, 4.6007080078125, 4.867431640625, 5.1341552734375, 5.40087890625, 5.6676025390625, 5.934326171875, 6.2010498046875, 6.4677734375, 6.7344970703125, 7.001220703125, 7.2679443359375, 7.53466796875, 7.8013916015625, 8.068115234375, 8.3348388671875, 8.6015625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 5.0, 10.0, 3.0, 8.0, 10.0, 10.0, 15.0, 16.0, 18.0, 22.0, 27.0, 32.0, 36.0, 30.0, 49.0, 50.0, 60.0, 57.0, 114.0, 227.0, 1397.0, 277.0, 125.0, 81.0, 55.0, 49.0, 27.0, 34.0, 41.0, 28.0, 14.0, 16.0, 25.0, 16.0, 15.0, 16.0, 11.0, 7.0, 6.0, 2.0, 6.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.265625, -24.533447265625, -23.80126953125, -23.069091796875, -22.3369140625, -21.604736328125, -20.87255859375, -20.140380859375, -19.408203125, -18.676025390625, -17.94384765625, -17.211669921875, -16.4794921875, -15.747314453125, -15.01513671875, -14.282958984375, -13.55078125, -12.818603515625, -12.08642578125, -11.354248046875, -10.6220703125, -9.889892578125, -9.15771484375, -8.425537109375, -7.693359375, -6.961181640625, -6.22900390625, -5.496826171875, -4.7646484375, -4.032470703125, -3.30029296875, -2.568115234375, -1.8359375, -1.103759765625, -0.37158203125, 0.360595703125, 1.0927734375, 1.824951171875, 2.55712890625, 3.289306640625, 4.021484375, 4.753662109375, 5.48583984375, 6.218017578125, 6.9501953125, 7.682373046875, 8.41455078125, 9.146728515625, 9.87890625, 10.611083984375, 11.34326171875, 12.075439453125, 12.8076171875, 13.539794921875, 14.27197265625, 15.004150390625, 15.736328125, 16.468505859375, 17.20068359375, 17.932861328125, 18.6650390625, 19.397216796875, 20.12939453125, 20.861572265625, 21.59375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 5.0, 3.0, 2.0, 9.0, 9.0, 15.0, 12.0, 25.0, 21.0, 27.0, 36.0, 51.0, 71.0, 97.0, 123.0, 169.0, 334.0, 548.0, 1414.0, 5924.0, 98861.0, 2969061.0, 61222.0, 4952.0, 1197.0, 525.0, 292.0, 182.0, 133.0, 97.0, 66.0, 49.0, 47.0, 26.0, 27.0, 17.0, 15.0, 10.0, 6.0, 8.0, 10.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.5, -39.076171875, -37.65234375, -36.228515625, -34.8046875, -33.380859375, -31.95703125, -30.533203125, -29.109375, -27.685546875, -26.26171875, -24.837890625, -23.4140625, -21.990234375, -20.56640625, -19.142578125, -17.71875, -16.294921875, -14.87109375, -13.447265625, -12.0234375, -10.599609375, -9.17578125, -7.751953125, -6.328125, -4.904296875, -3.48046875, -2.056640625, -0.6328125, 0.791015625, 2.21484375, 3.638671875, 5.0625, 6.486328125, 7.91015625, 9.333984375, 10.7578125, 12.181640625, 13.60546875, 15.029296875, 16.453125, 17.876953125, 19.30078125, 20.724609375, 22.1484375, 23.572265625, 24.99609375, 26.419921875, 27.84375, 29.267578125, 30.69140625, 32.115234375, 33.5390625, 34.962890625, 36.38671875, 37.810546875, 39.234375, 40.658203125, 42.08203125, 43.505859375, 44.9296875, 46.353515625, 47.77734375, 49.201171875, 50.625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 10.0, 91.0, 423.0, 394.0, 94.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.11189270019531, -85.93836212158203, -79.76482391357422, -73.59129333496094, -67.41775512695312, -61.244224548339844, -55.07069396972656, -48.897159576416016, -42.72362518310547, -36.55009078979492, -30.376558303833008, -24.203025817871094, -18.029491424560547, -11.85595703125, -5.682426452636719, 0.4911079406738281, 6.664642333984375, 12.838175773620605, 19.011709213256836, 25.18524169921875, 31.358776092529297, 37.532310485839844, 43.705841064453125, 49.87937545776367, 56.05290985107422, 62.226444244384766, 68.39997863769531, 74.5735092163086, 80.74703979492188, 86.92057800292969, 93.09410858154297, 99.26763916015625, 105.441162109375, 111.61469268798828, 117.7882308959961, 123.96176147460938, 130.1352996826172, 136.308837890625, 142.48236083984375, 148.65589904785156, 154.82943725585938, 161.0029754638672, 167.17649841308594, 173.35003662109375, 179.52357482910156, 185.69711303710938, 191.87063598632812, 198.04417419433594, 204.2176971435547, 210.3912353515625, 216.56475830078125, 222.73829650878906, 228.91183471679688, 235.08535766601562, 241.25889587402344, 247.43243408203125, 253.60595703125, 259.77947998046875, 265.9530334472656, 272.1265563964844, 278.3000793457031, 284.4736328125, 290.64715576171875, 296.8206787109375, 302.9942321777344]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 9.0, 4.0, 7.0, 13.0, 15.0, 19.0, 19.0, 23.0, 24.0, 22.0, 35.0, 31.0, 39.0, 36.0, 34.0, 41.0, 40.0, 39.0, 38.0, 45.0, 41.0, 41.0, 32.0, 36.0, 31.0, 32.0, 28.0, 29.0, 23.0, 23.0, 22.0, 13.0, 17.0, 19.0, 15.0, 11.0, 8.0, 11.0, 5.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-61.509971618652344, -59.73705291748047, -57.96413040161133, -56.19121170043945, -54.41828918457031, -52.64537048339844, -50.8724479675293, -49.09952926635742, -47.32660675048828, -45.553688049316406, -43.780765533447266, -42.00784683227539, -40.23492431640625, -38.462005615234375, -36.689083099365234, -34.91616439819336, -33.14324188232422, -31.37032127380371, -29.597400665283203, -27.824480056762695, -26.051559448242188, -24.278640747070312, -22.505718231201172, -20.732799530029297, -18.959880828857422, -17.186960220336914, -15.414039611816406, -13.641119003295898, -11.86819839477539, -10.0952787399292, -8.322358131408691, -6.549437522888184, -4.776515960693359, -3.0035953521728516, -1.2306749820709229, 0.5422453880310059, 2.3151659965515137, 4.088086128234863, 5.861006736755371, 7.633927345275879, 9.406847953796387, 11.179768562316895, 12.952689170837402, 14.725608825683594, 16.4985294342041, 18.27145004272461, 20.044370651245117, 21.817291259765625, 23.590211868286133, 25.36313247680664, 27.13605308532715, 28.908973693847656, 30.681894302368164, 32.45481491088867, 34.22773361206055, 36.00065612792969, 37.77357482910156, 39.54649353027344, 41.31941604614258, 43.09233474731445, 44.865257263183594, 46.63817596435547, 48.41109848022461, 50.184017181396484, 51.956939697265625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 3.0, 7.0, 5.0, 10.0, 13.0, 10.0, 13.0, 11.0, 10.0, 9.0, 15.0, 28.0, 28.0, 20.0, 27.0, 29.0, 44.0, 36.0, 45.0, 35.0, 42.0, 42.0, 38.0, 52.0, 28.0, 37.0, 40.0, 41.0, 35.0, 29.0, 25.0, 20.0, 17.0, 25.0, 28.0, 17.0, 10.0, 9.0, 7.0, 10.0, 14.0, 9.0, 9.0, 3.0, 6.0, 4.0, 6.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-7.2421875, -7.02587890625, -6.8095703125, -6.59326171875, -6.376953125, -6.16064453125, -5.9443359375, -5.72802734375, -5.51171875, -5.29541015625, -5.0791015625, -4.86279296875, -4.646484375, -4.43017578125, -4.2138671875, -3.99755859375, -3.78125, -3.56494140625, -3.3486328125, -3.13232421875, -2.916015625, -2.69970703125, -2.4833984375, -2.26708984375, -2.05078125, -1.83447265625, -1.6181640625, -1.40185546875, -1.185546875, -0.96923828125, -0.7529296875, -0.53662109375, -0.3203125, -0.10400390625, 0.1123046875, 0.32861328125, 0.544921875, 0.76123046875, 0.9775390625, 1.19384765625, 1.41015625, 1.62646484375, 1.8427734375, 2.05908203125, 2.275390625, 2.49169921875, 2.7080078125, 2.92431640625, 3.140625, 3.35693359375, 3.5732421875, 3.78955078125, 4.005859375, 4.22216796875, 4.4384765625, 4.65478515625, 4.87109375, 5.08740234375, 5.3037109375, 5.52001953125, 5.736328125, 5.95263671875, 6.1689453125, 6.38525390625, 6.6015625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 7.0, 17.0, 8.0, 32.0, 29.0, 48.0, 78.0, 99.0, 155.0, 236.0, 342.0, 642.0, 1207.0, 2279.0, 4523.0, 9610.0, 22935.0, 68472.0, 438612.0, 2777615.0, 727444.0, 89927.0, 27803.0, 11234.0, 5040.0, 2636.0, 1293.0, 755.0, 421.0, 256.0, 171.0, 113.0, 73.0, 48.0, 36.0, 19.0, 15.0, 13.0, 14.0, 6.0, 5.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.5625, -20.880126953125, -20.19775390625, -19.515380859375, -18.8330078125, -18.150634765625, -17.46826171875, -16.785888671875, -16.103515625, -15.421142578125, -14.73876953125, -14.056396484375, -13.3740234375, -12.691650390625, -12.00927734375, -11.326904296875, -10.64453125, -9.962158203125, -9.27978515625, -8.597412109375, -7.9150390625, -7.232666015625, -6.55029296875, -5.867919921875, -5.185546875, -4.503173828125, -3.82080078125, -3.138427734375, -2.4560546875, -1.773681640625, -1.09130859375, -0.408935546875, 0.2734375, 0.955810546875, 1.63818359375, 2.320556640625, 3.0029296875, 3.685302734375, 4.36767578125, 5.050048828125, 5.732421875, 6.414794921875, 7.09716796875, 7.779541015625, 8.4619140625, 9.144287109375, 9.82666015625, 10.509033203125, 11.19140625, 11.873779296875, 12.55615234375, 13.238525390625, 13.9208984375, 14.603271484375, 15.28564453125, 15.968017578125, 16.650390625, 17.332763671875, 18.01513671875, 18.697509765625, 19.3798828125, 20.062255859375, 20.74462890625, 21.427001953125, 22.109375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 7.0, 10.0, 9.0, 13.0, 11.0, 22.0, 34.0, 41.0, 60.0, 94.0, 134.0, 179.0, 243.0, 397.0, 575.0, 637.0, 500.0, 347.0, 237.0, 160.0, 117.0, 69.0, 43.0, 34.0, 26.0, 23.0, 20.0, 8.0, 6.0, 11.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.46875, -17.8173828125, -17.166015625, -16.5146484375, -15.86328125, -15.2119140625, -14.560546875, -13.9091796875, -13.2578125, -12.6064453125, -11.955078125, -11.3037109375, -10.65234375, -10.0009765625, -9.349609375, -8.6982421875, -8.046875, -7.3955078125, -6.744140625, -6.0927734375, -5.44140625, -4.7900390625, -4.138671875, -3.4873046875, -2.8359375, -2.1845703125, -1.533203125, -0.8818359375, -0.23046875, 0.4208984375, 1.072265625, 1.7236328125, 2.375, 3.0263671875, 3.677734375, 4.3291015625, 4.98046875, 5.6318359375, 6.283203125, 6.9345703125, 7.5859375, 8.2373046875, 8.888671875, 9.5400390625, 10.19140625, 10.8427734375, 11.494140625, 12.1455078125, 12.796875, 13.4482421875, 14.099609375, 14.7509765625, 15.40234375, 16.0537109375, 16.705078125, 17.3564453125, 18.0078125, 18.6591796875, 19.310546875, 19.9619140625, 20.61328125, 21.2646484375, 21.916015625, 22.5673828125, 23.21875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 5.0, 12.0, 24.0, 26.0, 48.0, 61.0, 78.0, 160.0, 318.0, 559.0, 1431.0, 3533.0, 10622.0, 38168.0, 199695.0, 2555355.0, 1235229.0, 111353.0, 25193.0, 7496.0, 2682.0, 1101.0, 491.0, 260.0, 128.0, 88.0, 53.0, 28.0, 22.0, 15.0, 12.0, 7.0, 9.0, 9.0, 3.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-43.03125, -41.894287109375, -40.75732421875, -39.620361328125, -38.4833984375, -37.346435546875, -36.20947265625, -35.072509765625, -33.935546875, -32.798583984375, -31.66162109375, -30.524658203125, -29.3876953125, -28.250732421875, -27.11376953125, -25.976806640625, -24.83984375, -23.702880859375, -22.56591796875, -21.428955078125, -20.2919921875, -19.155029296875, -18.01806640625, -16.881103515625, -15.744140625, -14.607177734375, -13.47021484375, -12.333251953125, -11.1962890625, -10.059326171875, -8.92236328125, -7.785400390625, -6.6484375, -5.511474609375, -4.37451171875, -3.237548828125, -2.1005859375, -0.963623046875, 0.17333984375, 1.310302734375, 2.447265625, 3.584228515625, 4.72119140625, 5.858154296875, 6.9951171875, 8.132080078125, 9.26904296875, 10.406005859375, 11.54296875, 12.679931640625, 13.81689453125, 14.953857421875, 16.0908203125, 17.227783203125, 18.36474609375, 19.501708984375, 20.638671875, 21.775634765625, 22.91259765625, 24.049560546875, 25.1865234375, 26.323486328125, 27.46044921875, 28.597412109375, 29.734375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 16.0, 20.0, 60.0, 117.0, 186.0, 218.0, 185.0, 119.0, 50.0, 27.0, 12.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-350.3811950683594, -343.4544372558594, -336.5276794433594, -329.6009216308594, -322.6741638183594, -315.7474060058594, -308.8206481933594, -301.8938903808594, -294.9671325683594, -288.0403747558594, -281.1136169433594, -274.1868591308594, -267.2601013183594, -260.3333435058594, -253.40658569335938, -246.47982788085938, -239.55307006835938, -232.62631225585938, -225.69955444335938, -218.77279663085938, -211.84603881835938, -204.91928100585938, -197.99252319335938, -191.06576538085938, -184.13900756835938, -177.21224975585938, -170.28549194335938, -163.35873413085938, -156.43197631835938, -149.50521850585938, -142.57846069335938, -135.65170288085938, -128.7249298095703, -121.79817199707031, -114.87141418457031, -107.94465637207031, -101.01789855957031, -94.09114074707031, -87.16438293457031, -80.23762512207031, -73.31086730957031, -66.38410949707031, -59.45735168457031, -52.53059387207031, -45.60383605957031, -38.67707824707031, -31.750320434570312, -24.823562622070312, -17.896804809570312, -10.970046997070312, -4.0432891845703125, 2.8834686279296875, 9.810226440429688, 16.736984252929688, 23.663742065429688, 30.590499877929688, 37.51725769042969, 44.44401550292969, 51.37077331542969, 58.29753112792969, 65.22428894042969, 72.15104675292969, 79.07780456542969, 86.00456237792969, 92.93132019042969]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 7.0, 13.0, 11.0, 11.0, 14.0, 12.0, 16.0, 16.0, 19.0, 22.0, 18.0, 33.0, 27.0, 36.0, 23.0, 34.0, 43.0, 31.0, 35.0, 40.0, 34.0, 37.0, 24.0, 27.0, 37.0, 42.0, 35.0, 32.0, 25.0, 30.0, 25.0, 18.0, 15.0, 16.0, 26.0, 19.0, 15.0, 15.0, 5.0, 12.0, 6.0, 2.0, 8.0, 4.0, 4.0, 5.0, 2.0, 0.0, 0.0, 5.0, 0.0, 2.0], "bins": [-49.65329360961914, -48.12528991699219, -46.597286224365234, -45.06928253173828, -43.541282653808594, -42.01327896118164, -40.48527526855469, -38.957271575927734, -37.42926788330078, -35.90126419067383, -34.373260498046875, -32.84526062011719, -31.3172550201416, -29.78925323486328, -28.261249542236328, -26.733245849609375, -25.205244064331055, -23.6772403717041, -22.14923858642578, -20.621234893798828, -19.093231201171875, -17.565227508544922, -16.0372257232666, -14.509222030639648, -12.981219291687012, -11.453216552734375, -9.925212860107422, -8.397210121154785, -6.86920690536499, -5.341203689575195, -3.8132009506225586, -2.2851972579956055, -0.7571945190429688, 0.7708085775375366, 2.298811674118042, 3.826814651489258, 5.354817867279053, 6.882821083068848, 8.410823822021484, 9.938827514648438, 11.466830253601074, 12.994832992553711, 14.522836685180664, 16.050838470458984, 17.578842163085938, 19.10684585571289, 20.634849548339844, 22.162853240966797, 23.690855026245117, 25.21885871887207, 26.74686050415039, 28.274864196777344, 29.802867889404297, 31.33087158203125, 32.85887145996094, 34.386878967285156, 35.914878845214844, 37.4428825378418, 38.97088623046875, 40.49888610839844, 42.02688980102539, 43.554893493652344, 45.0828971862793, 46.61090087890625, 48.1389045715332]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 6.0, 5.0, 4.0, 4.0, 3.0, 11.0, 10.0, 9.0, 10.0, 18.0, 16.0, 14.0, 27.0, 24.0, 19.0, 32.0, 25.0, 30.0, 25.0, 41.0, 32.0, 46.0, 38.0, 39.0, 58.0, 47.0, 35.0, 38.0, 29.0, 36.0, 41.0, 26.0, 25.0, 21.0, 22.0, 15.0, 23.0, 17.0, 13.0, 12.0, 13.0, 16.0, 4.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.88671875, -6.6641845703125, -6.441650390625, -6.2191162109375, -5.99658203125, -5.7740478515625, -5.551513671875, -5.3289794921875, -5.1064453125, -4.8839111328125, -4.661376953125, -4.4388427734375, -4.21630859375, -3.9937744140625, -3.771240234375, -3.5487060546875, -3.326171875, -3.1036376953125, -2.881103515625, -2.6585693359375, -2.43603515625, -2.2135009765625, -1.990966796875, -1.7684326171875, -1.5458984375, -1.3233642578125, -1.100830078125, -0.8782958984375, -0.65576171875, -0.4332275390625, -0.210693359375, 0.0118408203125, 0.234375, 0.4569091796875, 0.679443359375, 0.9019775390625, 1.12451171875, 1.3470458984375, 1.569580078125, 1.7921142578125, 2.0146484375, 2.2371826171875, 2.459716796875, 2.6822509765625, 2.90478515625, 3.1273193359375, 3.349853515625, 3.5723876953125, 3.794921875, 4.0174560546875, 4.239990234375, 4.4625244140625, 4.68505859375, 4.9075927734375, 5.130126953125, 5.3526611328125, 5.5751953125, 5.7977294921875, 6.020263671875, 6.2427978515625, 6.46533203125, 6.6878662109375, 6.910400390625, 7.1329345703125, 7.35546875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 11.0, 23.0, 14.0, 21.0, 43.0, 72.0, 113.0, 161.0, 260.0, 360.0, 562.0, 916.0, 1364.0, 2303.0, 3601.0, 5923.0, 10226.0, 16669.0, 29045.0, 51262.0, 89632.0, 156698.0, 233470.0, 186755.0, 110098.0, 62189.0, 35241.0, 20475.0, 12158.0, 7138.0, 4367.0, 2708.0, 1739.0, 1061.0, 622.0, 430.0, 301.0, 180.0, 116.0, 67.0, 45.0, 42.0, 23.0, 20.0, 13.0, 5.0, 7.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.2939453125, -1.2543487548828125, -1.214752197265625, -1.1751556396484375, -1.13555908203125, -1.0959625244140625, -1.056365966796875, -1.0167694091796875, -0.9771728515625, -0.9375762939453125, -0.897979736328125, -0.8583831787109375, -0.81878662109375, -0.7791900634765625, -0.739593505859375, -0.6999969482421875, -0.660400390625, -0.6208038330078125, -0.581207275390625, -0.5416107177734375, -0.50201416015625, -0.4624176025390625, -0.422821044921875, -0.3832244873046875, -0.3436279296875, -0.3040313720703125, -0.264434814453125, -0.2248382568359375, -0.18524169921875, -0.1456451416015625, -0.106048583984375, -0.0664520263671875, -0.02685546875, 0.0127410888671875, 0.052337646484375, 0.0919342041015625, 0.13153076171875, 0.1711273193359375, 0.210723876953125, 0.2503204345703125, 0.2899169921875, 0.3295135498046875, 0.369110107421875, 0.4087066650390625, 0.44830322265625, 0.4878997802734375, 0.527496337890625, 0.5670928955078125, 0.606689453125, 0.6462860107421875, 0.685882568359375, 0.7254791259765625, 0.76507568359375, 0.8046722412109375, 0.844268798828125, 0.8838653564453125, 0.9234619140625, 0.9630584716796875, 1.002655029296875, 1.0422515869140625, 1.08184814453125, 1.1214447021484375, 1.161041259765625, 1.2006378173828125, 1.240234375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 5.0, 8.0, 12.0, 13.0, 18.0, 18.0, 8.0, 24.0, 26.0, 24.0, 25.0, 27.0, 43.0, 33.0, 46.0, 39.0, 38.0, 41.0, 40.0, 1079.0, 55.0, 41.0, 38.0, 35.0, 29.0, 26.0, 24.0, 30.0, 23.0, 23.0, 31.0, 27.0, 20.0, 11.0, 12.0, 7.0, 9.0, 3.0, 3.0, 9.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.35546875, -5.18988037109375, -5.0242919921875, -4.85870361328125, -4.693115234375, -4.52752685546875, -4.3619384765625, -4.19635009765625, -4.03076171875, -3.86517333984375, -3.6995849609375, -3.53399658203125, -3.368408203125, -3.20281982421875, -3.0372314453125, -2.87164306640625, -2.7060546875, -2.54046630859375, -2.3748779296875, -2.20928955078125, -2.043701171875, -1.87811279296875, -1.7125244140625, -1.54693603515625, -1.38134765625, -1.21575927734375, -1.0501708984375, -0.88458251953125, -0.718994140625, -0.55340576171875, -0.3878173828125, -0.22222900390625, -0.056640625, 0.10894775390625, 0.2745361328125, 0.44012451171875, 0.605712890625, 0.77130126953125, 0.9368896484375, 1.10247802734375, 1.26806640625, 1.43365478515625, 1.5992431640625, 1.76483154296875, 1.930419921875, 2.09600830078125, 2.2615966796875, 2.42718505859375, 2.5927734375, 2.75836181640625, 2.9239501953125, 3.08953857421875, 3.255126953125, 3.42071533203125, 3.5863037109375, 3.75189208984375, 3.91748046875, 4.08306884765625, 4.2486572265625, 4.41424560546875, 4.579833984375, 4.74542236328125, 4.9110107421875, 5.07659912109375, 5.2421875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 10.0, 13.0, 18.0, 31.0, 58.0, 105.0, 131.0, 214.0, 312.0, 453.0, 769.0, 1224.0, 1943.0, 3241.0, 5067.0, 8537.0, 13896.0, 23334.0, 40332.0, 71627.0, 130888.0, 330645.0, 1102407.0, 158964.0, 85426.0, 47757.0, 27622.0, 16357.0, 9869.0, 5990.0, 3633.0, 2218.0, 1515.0, 916.0, 541.0, 357.0, 232.0, 159.0, 118.0, 64.0, 43.0, 33.0, 16.0, 10.0, 11.0, 9.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.46142578125, -0.4466133117675781, -0.43180084228515625, -0.4169883728027344, -0.4021759033203125, -0.3873634338378906, -0.37255096435546875, -0.3577384948730469, -0.342926025390625, -0.3281135559082031, -0.31330108642578125, -0.2984886169433594, -0.2836761474609375, -0.2688636779785156, -0.25405120849609375, -0.23923873901367188, -0.22442626953125, -0.20961380004882812, -0.19480133056640625, -0.17998886108398438, -0.1651763916015625, -0.15036392211914062, -0.13555145263671875, -0.12073898315429688, -0.105926513671875, -0.09111404418945312, -0.07630157470703125, -0.061489105224609375, -0.0466766357421875, -0.031864166259765625, -0.01705169677734375, -0.002239227294921875, 0.0125732421875, 0.027385711669921875, 0.04219818115234375, 0.057010650634765625, 0.0718231201171875, 0.08663558959960938, 0.10144805908203125, 0.11626052856445312, 0.131072998046875, 0.14588546752929688, 0.16069793701171875, 0.17551040649414062, 0.1903228759765625, 0.20513534545898438, 0.21994781494140625, 0.23476028442382812, 0.24957275390625, 0.2643852233886719, 0.27919769287109375, 0.2940101623535156, 0.3088226318359375, 0.3236351013183594, 0.33844757080078125, 0.3532600402832031, 0.368072509765625, 0.3828849792480469, 0.39769744873046875, 0.4125099182128906, 0.4273223876953125, 0.4421348571777344, 0.45694732666015625, 0.4717597961425781, 0.486572265625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 6.0, 4.0, 8.0, 10.0, 4.0, 12.0, 12.0, 25.0, 39.0, 95.0, 202.0, 250.0, 144.0, 65.0, 32.0, 17.0, 19.0, 10.0, 8.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32958984375, -0.3190498352050781, -0.30850982666015625, -0.2979698181152344, -0.2874298095703125, -0.2768898010253906, -0.26634979248046875, -0.2558097839355469, -0.245269775390625, -0.23472976684570312, -0.22418975830078125, -0.21364974975585938, -0.2031097412109375, -0.19256973266601562, -0.18202972412109375, -0.17148971557617188, -0.16094970703125, -0.15040969848632812, -0.13986968994140625, -0.12932968139648438, -0.1187896728515625, -0.10824966430664062, -0.09770965576171875, -0.08716964721679688, -0.076629638671875, -0.06608963012695312, -0.05554962158203125, -0.045009613037109375, -0.0344696044921875, -0.023929595947265625, -0.01338958740234375, -0.002849578857421875, 0.0076904296875, 0.018230438232421875, 0.02877044677734375, 0.039310455322265625, 0.0498504638671875, 0.060390472412109375, 0.07093048095703125, 0.08147048950195312, 0.092010498046875, 0.10255050659179688, 0.11309051513671875, 0.12363052368164062, 0.1341705322265625, 0.14471054077148438, 0.15525054931640625, 0.16579055786132812, 0.17633056640625, 0.18687057495117188, 0.19741058349609375, 0.20795059204101562, 0.2184906005859375, 0.22903060913085938, 0.23957061767578125, 0.2501106262207031, 0.260650634765625, 0.2711906433105469, 0.28173065185546875, 0.2922706604003906, 0.3028106689453125, 0.3133506774902344, 0.32389068603515625, 0.3344306945800781, 0.344970703125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 4.0, 4.0, 4.0, 8.0, 8.0, 25.0, 38.0, 52.0, 113.0, 293.0, 3302.0, 1019622.0, 24090.0, 634.0, 161.0, 75.0, 32.0, 22.0, 9.0, 16.0, 8.0, 5.0, 5.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.953125, -6.74066162109375, -6.5281982421875, -6.31573486328125, -6.103271484375, -5.89080810546875, -5.6783447265625, -5.46588134765625, -5.25341796875, -5.04095458984375, -4.8284912109375, -4.61602783203125, -4.403564453125, -4.19110107421875, -3.9786376953125, -3.76617431640625, -3.5537109375, -3.34124755859375, -3.1287841796875, -2.91632080078125, -2.703857421875, -2.49139404296875, -2.2789306640625, -2.06646728515625, -1.85400390625, -1.64154052734375, -1.4290771484375, -1.21661376953125, -1.004150390625, -0.79168701171875, -0.5792236328125, -0.36676025390625, -0.154296875, 0.05816650390625, 0.2706298828125, 0.48309326171875, 0.695556640625, 0.90802001953125, 1.1204833984375, 1.33294677734375, 1.54541015625, 1.75787353515625, 1.9703369140625, 2.18280029296875, 2.395263671875, 2.60772705078125, 2.8201904296875, 3.03265380859375, 3.2451171875, 3.45758056640625, 3.6700439453125, 3.88250732421875, 4.094970703125, 4.30743408203125, 4.5198974609375, 4.73236083984375, 4.94482421875, 5.15728759765625, 5.3697509765625, 5.58221435546875, 5.794677734375, 6.00714111328125, 6.2196044921875, 6.43206787109375, 6.64453125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 10.0, 3.0, 12.0, 18.0, 23.0, 43.0, 51.0, 94.0, 153.0, 261.0, 133.0, 67.0, 50.0, 25.0, 19.0, 16.0, 3.0, 10.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46889767050743103, -0.44180095195770264, -0.41470426321029663, -0.38760754466056824, -0.36051082611083984, -0.33341413736343384, -0.30631741881370544, -0.27922070026397705, -0.25212401151657104, -0.22502730786800385, -0.19793058931827545, -0.17083388566970825, -0.14373716711997986, -0.11664046347141266, -0.08954375982284546, -0.062447041273117065, -0.03535032272338867, -0.008253613486886024, 0.018843095749616623, 0.04593980312347412, 0.07303651422262192, 0.10013322532176971, 0.12722992897033691, 0.1543266475200653, 0.1814233511686325, 0.2085200548171997, 0.2356167733669281, 0.2627134919166565, 0.2898101806640625, 0.3169068992137909, 0.3440036177635193, 0.3711003065109253, 0.3981969952583313, 0.4252937138080597, 0.4523904025554657, 0.4794871211051941, 0.5065838098526001, 0.5336805582046509, 0.5607772469520569, 0.5878739356994629, 0.6149706840515137, 0.6420673727989197, 0.6691641211509705, 0.6962608098983765, 0.7233574986457825, 0.7504542469978333, 0.7775509357452393, 0.80464768409729, 0.8317443132400513, 0.8588410019874573, 0.8859377503395081, 0.9130344390869141, 0.9401311278343201, 0.9672278761863708, 0.9943245649337769, 1.0214213132858276, 1.0485180616378784, 1.0756148099899292, 1.1027114391326904, 1.1298081874847412, 1.156904935836792, 1.1840015649795532, 1.211098313331604, 1.2381950616836548, 1.265291690826416]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 6.0, 4.0, 8.0, 3.0, 5.0, 13.0, 12.0, 22.0, 16.0, 24.0, 20.0, 20.0, 27.0, 28.0, 26.0, 37.0, 33.0, 31.0, 36.0, 33.0, 42.0, 28.0, 47.0, 38.0, 32.0, 30.0, 35.0, 36.0, 36.0, 29.0, 38.0, 30.0, 25.0, 22.0, 17.0, 26.0, 16.0, 17.0, 10.0, 11.0, 2.0, 7.0, 10.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.49825114011764526, -0.482431024312973, -0.4666109085083008, -0.45079079270362854, -0.4349706768989563, -0.41915053129196167, -0.40333041548728943, -0.3875102996826172, -0.37169018387794495, -0.3558700680732727, -0.34004995226860046, -0.3242298364639282, -0.3084096908569336, -0.29258960485458374, -0.2767694592475891, -0.26094934344291687, -0.24512922763824463, -0.2293091118335724, -0.21348899602890015, -0.1976688653230667, -0.18184874951839447, -0.16602863371372223, -0.1502085030078888, -0.13438838720321655, -0.11856827139854431, -0.10274815559387207, -0.08692803233861923, -0.0711079090833664, -0.05528779327869415, -0.03946767747402191, -0.023647554218769073, -0.007827430963516235, 0.00799262523651123, 0.02381274476647377, 0.03963286429643631, 0.05545298382639885, 0.07127310335636139, 0.08709321916103363, 0.10291334241628647, 0.1187334656715393, 0.13455358147621155, 0.1503736972808838, 0.16619381308555603, 0.18201394379138947, 0.1978340595960617, 0.21365417540073395, 0.22947430610656738, 0.24529442191123962, 0.26111453771591187, 0.2769346535205841, 0.29275476932525635, 0.3085748851299286, 0.32439500093460083, 0.34021514654159546, 0.3560352623462677, 0.37185537815093994, 0.3876754939556122, 0.4034956097602844, 0.41931572556495667, 0.4351358413696289, 0.45095598697662354, 0.4667760729789734, 0.482596218585968, 0.49841633439064026, 0.5142364501953125]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 0.0, 1.0, 2.0, 6.0, 6.0, 3.0, 4.0, 3.0, 10.0, 11.0, 9.0, 11.0, 18.0, 17.0, 13.0, 26.0, 22.0, 20.0, 35.0, 24.0, 30.0, 25.0, 43.0, 30.0, 45.0, 39.0, 38.0, 60.0, 46.0, 36.0, 37.0, 27.0, 40.0, 36.0, 29.0, 25.0, 22.0, 19.0, 17.0, 24.0, 14.0, 16.0, 12.0, 12.0, 13.0, 6.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.8828125, -6.66033935546875, -6.4378662109375, -6.21539306640625, -5.992919921875, -5.77044677734375, -5.5479736328125, -5.32550048828125, -5.10302734375, -4.88055419921875, -4.6580810546875, -4.43560791015625, -4.213134765625, -3.99066162109375, -3.7681884765625, -3.54571533203125, -3.3232421875, -3.10076904296875, -2.8782958984375, -2.65582275390625, -2.433349609375, -2.21087646484375, -1.9884033203125, -1.76593017578125, -1.54345703125, -1.32098388671875, -1.0985107421875, -0.87603759765625, -0.653564453125, -0.43109130859375, -0.2086181640625, 0.01385498046875, 0.236328125, 0.45880126953125, 0.6812744140625, 0.90374755859375, 1.126220703125, 1.34869384765625, 1.5711669921875, 1.79364013671875, 2.01611328125, 2.23858642578125, 2.4610595703125, 2.68353271484375, 2.906005859375, 3.12847900390625, 3.3509521484375, 3.57342529296875, 3.7958984375, 4.01837158203125, 4.2408447265625, 4.46331787109375, 4.685791015625, 4.90826416015625, 5.1307373046875, 5.35321044921875, 5.57568359375, 5.79815673828125, 6.0206298828125, 6.24310302734375, 6.465576171875, 6.68804931640625, 6.9105224609375, 7.13299560546875, 7.35546875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 6.0, 18.0, 16.0, 25.0, 22.0, 46.0, 58.0, 73.0, 65.0, 125.0, 192.0, 278.0, 452.0, 792.0, 1186.0, 2073.0, 4030.0, 8511.0, 21281.0, 60377.0, 211630.0, 491411.0, 163690.0, 48788.0, 17533.0, 7357.0, 3586.0, 1852.0, 1088.0, 672.0, 423.0, 260.0, 177.0, 120.0, 94.0, 66.0, 48.0, 36.0, 24.0, 13.0, 16.0, 13.0, 10.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.5, -12.1142578125, -11.728515625, -11.3427734375, -10.95703125, -10.5712890625, -10.185546875, -9.7998046875, -9.4140625, -9.0283203125, -8.642578125, -8.2568359375, -7.87109375, -7.4853515625, -7.099609375, -6.7138671875, -6.328125, -5.9423828125, -5.556640625, -5.1708984375, -4.78515625, -4.3994140625, -4.013671875, -3.6279296875, -3.2421875, -2.8564453125, -2.470703125, -2.0849609375, -1.69921875, -1.3134765625, -0.927734375, -0.5419921875, -0.15625, 0.2294921875, 0.615234375, 1.0009765625, 1.38671875, 1.7724609375, 2.158203125, 2.5439453125, 2.9296875, 3.3154296875, 3.701171875, 4.0869140625, 4.47265625, 4.8583984375, 5.244140625, 5.6298828125, 6.015625, 6.4013671875, 6.787109375, 7.1728515625, 7.55859375, 7.9443359375, 8.330078125, 8.7158203125, 9.1015625, 9.4873046875, 9.873046875, 10.2587890625, 10.64453125, 11.0302734375, 11.416015625, 11.8017578125, 12.1875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 6.0, 13.0, 6.0, 9.0, 20.0, 14.0, 23.0, 24.0, 22.0, 30.0, 37.0, 37.0, 32.0, 49.0, 66.0, 91.0, 112.0, 252.0, 1458.0, 193.0, 110.0, 72.0, 49.0, 47.0, 38.0, 32.0, 31.0, 31.0, 24.0, 20.0, 14.0, 18.0, 7.0, 5.0, 15.0, 6.0, 3.0, 9.0, 6.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.0625, -21.3369140625, -20.611328125, -19.8857421875, -19.16015625, -18.4345703125, -17.708984375, -16.9833984375, -16.2578125, -15.5322265625, -14.806640625, -14.0810546875, -13.35546875, -12.6298828125, -11.904296875, -11.1787109375, -10.453125, -9.7275390625, -9.001953125, -8.2763671875, -7.55078125, -6.8251953125, -6.099609375, -5.3740234375, -4.6484375, -3.9228515625, -3.197265625, -2.4716796875, -1.74609375, -1.0205078125, -0.294921875, 0.4306640625, 1.15625, 1.8818359375, 2.607421875, 3.3330078125, 4.05859375, 4.7841796875, 5.509765625, 6.2353515625, 6.9609375, 7.6865234375, 8.412109375, 9.1376953125, 9.86328125, 10.5888671875, 11.314453125, 12.0400390625, 12.765625, 13.4912109375, 14.216796875, 14.9423828125, 15.66796875, 16.3935546875, 17.119140625, 17.8447265625, 18.5703125, 19.2958984375, 20.021484375, 20.7470703125, 21.47265625, 22.1982421875, 22.923828125, 23.6494140625, 24.375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 8.0, 5.0, 11.0, 12.0, 8.0, 10.0, 22.0, 21.0, 25.0, 47.0, 67.0, 86.0, 97.0, 133.0, 244.0, 371.0, 865.0, 3165.0, 31580.0, 2427450.0, 661957.0, 15676.0, 2129.0, 649.0, 326.0, 192.0, 126.0, 104.0, 84.0, 43.0, 45.0, 42.0, 26.0, 19.0, 12.0, 14.0, 9.0, 9.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-49.1875, -47.7353515625, -46.283203125, -44.8310546875, -43.37890625, -41.9267578125, -40.474609375, -39.0224609375, -37.5703125, -36.1181640625, -34.666015625, -33.2138671875, -31.76171875, -30.3095703125, -28.857421875, -27.4052734375, -25.953125, -24.5009765625, -23.048828125, -21.5966796875, -20.14453125, -18.6923828125, -17.240234375, -15.7880859375, -14.3359375, -12.8837890625, -11.431640625, -9.9794921875, -8.52734375, -7.0751953125, -5.623046875, -4.1708984375, -2.71875, -1.2666015625, 0.185546875, 1.6376953125, 3.08984375, 4.5419921875, 5.994140625, 7.4462890625, 8.8984375, 10.3505859375, 11.802734375, 13.2548828125, 14.70703125, 16.1591796875, 17.611328125, 19.0634765625, 20.515625, 21.9677734375, 23.419921875, 24.8720703125, 26.32421875, 27.7763671875, 29.228515625, 30.6806640625, 32.1328125, 33.5849609375, 35.037109375, 36.4892578125, 37.94140625, 39.3935546875, 40.845703125, 42.2978515625, 43.75]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 8.0, 174.0, 607.0, 211.0, 18.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.11866760253906, -30.5842342376709, -22.049800872802734, -13.51536750793457, -4.980934143066406, 3.553497314453125, 12.087932586669922, 20.62236785888672, 29.15679931640625, 37.69123077392578, 46.22566604614258, 54.760101318359375, 63.294532775878906, 71.82896423339844, 80.3634033203125, 88.89783477783203, 97.43226623535156, 105.9666976928711, 114.50112915039062, 123.03556823730469, 131.57000732421875, 140.10443115234375, 148.6388702392578, 157.17330932617188, 165.70773315429688, 174.24217224121094, 182.77659606933594, 191.31103515625, 199.845458984375, 208.37989807128906, 216.91433715820312, 225.44876098632812, 233.98318481445312, 242.5176239013672, 251.0520477294922, 259.58648681640625, 268.12091064453125, 276.65533447265625, 285.1897888183594, 293.7242126464844, 302.2586669921875, 310.7930908203125, 319.3275451660156, 327.8619689941406, 336.3963928222656, 344.93084716796875, 353.46527099609375, 361.99969482421875, 370.53411865234375, 379.06854248046875, 387.6029968261719, 396.1374206542969, 404.6718444824219, 413.206298828125, 421.74072265625, 430.275146484375, 438.8095703125, 447.343994140625, 455.8784484863281, 464.4128723144531, 472.9472961425781, 481.48175048828125, 490.01617431640625, 498.55059814453125, 507.0850524902344]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 12.0, 4.0, 10.0, 17.0, 9.0, 11.0, 15.0, 23.0, 33.0, 15.0, 33.0, 45.0, 33.0, 53.0, 48.0, 63.0, 46.0, 34.0, 63.0, 48.0, 49.0, 34.0, 35.0, 34.0, 37.0, 26.0, 24.0, 26.0, 31.0, 18.0, 9.0, 12.0, 14.0, 7.0, 6.0, 3.0, 8.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-70.59678649902344, -68.30347442626953, -66.01016235351562, -63.71685028076172, -61.42353820800781, -59.130226135253906, -56.8369140625, -54.543601989746094, -52.25028991699219, -49.95697784423828, -47.663665771484375, -45.37035369873047, -43.07704162597656, -40.783729553222656, -38.49041748046875, -36.197105407714844, -33.90379333496094, -31.61048126220703, -29.317169189453125, -27.02385711669922, -24.730545043945312, -22.437232971191406, -20.1439208984375, -17.850608825683594, -15.557296752929688, -13.263984680175781, -10.970672607421875, -8.677360534667969, -6.3840484619140625, -4.090736389160156, -1.79742431640625, 0.49588775634765625, 2.7891998291015625, 5.082511901855469, 7.375823974609375, 9.669136047363281, 11.962448120117188, 14.255760192871094, 16.549072265625, 18.842384338378906, 21.135696411132812, 23.42900848388672, 25.722320556640625, 28.01563262939453, 30.308944702148438, 32.602256774902344, 34.89556884765625, 37.188880920410156, 39.48219299316406, 41.77550506591797, 44.068817138671875, 46.36212921142578, 48.65544128417969, 50.948753356933594, 53.2420654296875, 55.535377502441406, 57.82868957519531, 60.12200164794922, 62.415313720703125, 64.70862579345703, 67.00193786621094, 69.29524993896484, 71.58856201171875, 73.88187408447266, 76.17518615722656]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 3.0, 2.0, 4.0, 7.0, 7.0, 7.0, 11.0, 13.0, 14.0, 19.0, 15.0, 18.0, 19.0, 25.0, 28.0, 26.0, 31.0, 40.0, 26.0, 34.0, 37.0, 49.0, 34.0, 32.0, 42.0, 34.0, 52.0, 34.0, 47.0, 37.0, 36.0, 25.0, 28.0, 17.0, 27.0, 20.0, 19.0, 10.0, 16.0, 11.0, 6.0, 8.0, 9.0, 3.0, 9.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.16796875, -6.93243408203125, -6.6968994140625, -6.46136474609375, -6.225830078125, -5.99029541015625, -5.7547607421875, -5.51922607421875, -5.28369140625, -5.04815673828125, -4.8126220703125, -4.57708740234375, -4.341552734375, -4.10601806640625, -3.8704833984375, -3.63494873046875, -3.3994140625, -3.16387939453125, -2.9283447265625, -2.69281005859375, -2.457275390625, -2.22174072265625, -1.9862060546875, -1.75067138671875, -1.51513671875, -1.27960205078125, -1.0440673828125, -0.80853271484375, -0.572998046875, -0.33746337890625, -0.1019287109375, 0.13360595703125, 0.369140625, 0.60467529296875, 0.8402099609375, 1.07574462890625, 1.311279296875, 1.54681396484375, 1.7823486328125, 2.01788330078125, 2.25341796875, 2.48895263671875, 2.7244873046875, 2.96002197265625, 3.195556640625, 3.43109130859375, 3.6666259765625, 3.90216064453125, 4.1376953125, 4.37322998046875, 4.6087646484375, 4.84429931640625, 5.079833984375, 5.31536865234375, 5.5509033203125, 5.78643798828125, 6.02197265625, 6.25750732421875, 6.4930419921875, 6.72857666015625, 6.964111328125, 7.19964599609375, 7.4351806640625, 7.67071533203125, 7.90625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 5.0, 2.0, 6.0, 11.0, 18.0, 25.0, 28.0, 22.0, 44.0, 53.0, 85.0, 129.0, 143.0, 227.0, 369.0, 688.0, 1365.0, 2728.0, 6163.0, 15734.0, 50149.0, 334028.0, 2812325.0, 849183.0, 83306.0, 22224.0, 7920.0, 3452.0, 1621.0, 850.0, 457.0, 273.0, 197.0, 115.0, 96.0, 58.0, 40.0, 38.0, 29.0, 19.0, 19.0, 10.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-25.15625, -24.38623046875, -23.6162109375, -22.84619140625, -22.076171875, -21.30615234375, -20.5361328125, -19.76611328125, -18.99609375, -18.22607421875, -17.4560546875, -16.68603515625, -15.916015625, -15.14599609375, -14.3759765625, -13.60595703125, -12.8359375, -12.06591796875, -11.2958984375, -10.52587890625, -9.755859375, -8.98583984375, -8.2158203125, -7.44580078125, -6.67578125, -5.90576171875, -5.1357421875, -4.36572265625, -3.595703125, -2.82568359375, -2.0556640625, -1.28564453125, -0.515625, 0.25439453125, 1.0244140625, 1.79443359375, 2.564453125, 3.33447265625, 4.1044921875, 4.87451171875, 5.64453125, 6.41455078125, 7.1845703125, 7.95458984375, 8.724609375, 9.49462890625, 10.2646484375, 11.03466796875, 11.8046875, 12.57470703125, 13.3447265625, 14.11474609375, 14.884765625, 15.65478515625, 16.4248046875, 17.19482421875, 17.96484375, 18.73486328125, 19.5048828125, 20.27490234375, 21.044921875, 21.81494140625, 22.5849609375, 23.35498046875, 24.125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 0.0, 2.0, 5.0, 6.0, 4.0, 2.0, 8.0, 12.0, 23.0, 13.0, 33.0, 33.0, 35.0, 42.0, 68.0, 97.0, 130.0, 164.0, 220.0, 298.0, 360.0, 449.0, 479.0, 372.0, 311.0, 233.0, 157.0, 119.0, 82.0, 72.0, 66.0, 44.0, 36.0, 18.0, 9.0, 20.0, 18.0, 4.0, 4.0, 3.0, 6.0, 1.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.7109375, -15.2215576171875, -14.732177734375, -14.2427978515625, -13.75341796875, -13.2640380859375, -12.774658203125, -12.2852783203125, -11.7958984375, -11.3065185546875, -10.817138671875, -10.3277587890625, -9.83837890625, -9.3489990234375, -8.859619140625, -8.3702392578125, -7.880859375, -7.3914794921875, -6.902099609375, -6.4127197265625, -5.92333984375, -5.4339599609375, -4.944580078125, -4.4552001953125, -3.9658203125, -3.4764404296875, -2.987060546875, -2.4976806640625, -2.00830078125, -1.5189208984375, -1.029541015625, -0.5401611328125, -0.05078125, 0.4385986328125, 0.927978515625, 1.4173583984375, 1.90673828125, 2.3961181640625, 2.885498046875, 3.3748779296875, 3.8642578125, 4.3536376953125, 4.843017578125, 5.3323974609375, 5.82177734375, 6.3111572265625, 6.800537109375, 7.2899169921875, 7.779296875, 8.2686767578125, 8.758056640625, 9.2474365234375, 9.73681640625, 10.2261962890625, 10.715576171875, 11.2049560546875, 11.6943359375, 12.1837158203125, 12.673095703125, 13.1624755859375, 13.65185546875, 14.1412353515625, 14.630615234375, 15.1199951171875, 15.609375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 7.0, 0.0, 8.0, 7.0, 10.0, 16.0, 19.0, 32.0, 31.0, 43.0, 79.0, 125.0, 201.0, 388.0, 1114.0, 3262.0, 12975.0, 74027.0, 1460138.0, 2510265.0, 108209.0, 16825.0, 3966.0, 1343.0, 510.0, 247.0, 128.0, 85.0, 60.0, 43.0, 28.0, 24.0, 22.0, 14.0, 8.0, 8.0, 1.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.46875, -42.99072265625, -41.5126953125, -40.03466796875, -38.556640625, -37.07861328125, -35.6005859375, -34.12255859375, -32.64453125, -31.16650390625, -29.6884765625, -28.21044921875, -26.732421875, -25.25439453125, -23.7763671875, -22.29833984375, -20.8203125, -19.34228515625, -17.8642578125, -16.38623046875, -14.908203125, -13.43017578125, -11.9521484375, -10.47412109375, -8.99609375, -7.51806640625, -6.0400390625, -4.56201171875, -3.083984375, -1.60595703125, -0.1279296875, 1.35009765625, 2.828125, 4.30615234375, 5.7841796875, 7.26220703125, 8.740234375, 10.21826171875, 11.6962890625, 13.17431640625, 14.65234375, 16.13037109375, 17.6083984375, 19.08642578125, 20.564453125, 22.04248046875, 23.5205078125, 24.99853515625, 26.4765625, 27.95458984375, 29.4326171875, 30.91064453125, 32.388671875, 33.86669921875, 35.3447265625, 36.82275390625, 38.30078125, 39.77880859375, 41.2568359375, 42.73486328125, 44.212890625, 45.69091796875, 47.1689453125, 48.64697265625, 50.125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 8.0, 32.0, 43.0, 97.0, 165.0, 235.0, 181.0, 136.0, 60.0, 31.0, 13.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.46383666992188, -134.3179473876953, -128.1720733642578, -122.02618408203125, -115.88031005859375, -109.73442077636719, -103.58853912353516, -97.44265747070312, -91.2967758178711, -85.15089416503906, -79.00501251220703, -72.859130859375, -66.71324157714844, -60.56736373901367, -54.421478271484375, -48.275596618652344, -42.12971496582031, -35.98383331298828, -29.837949752807617, -23.692066192626953, -17.546184539794922, -11.40030288696289, -5.254417419433594, 0.8914642333984375, 7.037345886230469, 13.183228492736816, 19.329111099243164, 25.474994659423828, 31.62087631225586, 37.76675796508789, 43.91264343261719, 50.05852508544922, 56.20440673828125, 62.35028839111328, 68.49617004394531, 74.64205932617188, 80.78793334960938, 86.93382263183594, 93.07970428466797, 99.2255859375, 105.37146759033203, 111.51734924316406, 117.6632308959961, 123.80911254882812, 129.9550018310547, 136.1008758544922, 142.24676513671875, 148.39263916015625, 154.5385284423828, 160.68441772460938, 166.83029174804688, 172.97618103027344, 179.12205505371094, 185.2679443359375, 191.413818359375, 197.55970764160156, 203.70559692382812, 209.8514862060547, 215.9973602294922, 222.14324951171875, 228.28912353515625, 234.4350128173828, 240.58090209960938, 246.72677612304688, 252.87265014648438]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 10.0, 9.0, 7.0, 11.0, 9.0, 15.0, 21.0, 16.0, 23.0, 25.0, 16.0, 32.0, 31.0, 31.0, 34.0, 46.0, 45.0, 44.0, 39.0, 36.0, 41.0, 31.0, 37.0, 46.0, 44.0, 39.0, 33.0, 34.0, 34.0, 27.0, 22.0, 20.0, 13.0, 20.0, 12.0, 11.0, 11.0, 3.0, 12.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.09138870239258, -53.208168029785156, -51.324951171875, -49.44173049926758, -47.558509826660156, -45.67529296875, -43.79207229614258, -41.908851623535156, -40.025634765625, -38.14241409301758, -36.25919723510742, -34.3759765625, -32.492759704589844, -30.609539031982422, -28.726318359375, -26.84309959411621, -24.959880828857422, -23.076662063598633, -21.193443298339844, -19.310222625732422, -17.427003860473633, -15.543785095214844, -13.660565376281738, -11.777345657348633, -9.894126892089844, -8.010908126831055, -6.127688407897949, -4.244469165802002, -2.3612499237060547, -0.4780311584472656, 1.4051885604858398, 3.2884082794189453, 5.171630859375, 7.054850101470947, 8.938069343566895, 10.8212890625, 12.704507827758789, 14.587726593017578, 16.470947265625, 18.35416603088379, 20.237384796142578, 22.120603561401367, 24.003822326660156, 25.887042999267578, 27.770261764526367, 29.653480529785156, 31.536701202392578, 33.419921875, 35.303138732910156, 37.18635940551758, 39.069576263427734, 40.952796936035156, 42.83601379394531, 44.719234466552734, 46.602455139160156, 48.48567199707031, 50.368892669677734, 52.252113342285156, 54.13533020019531, 56.018550872802734, 57.901771545410156, 59.78498840332031, 61.668209075927734, 63.551429748535156, 65.43464660644531]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 8.0, 2.0, 4.0, 8.0, 4.0, 10.0, 14.0, 12.0, 18.0, 21.0, 20.0, 25.0, 21.0, 33.0, 46.0, 33.0, 41.0, 42.0, 29.0, 47.0, 39.0, 43.0, 32.0, 50.0, 41.0, 41.0, 47.0, 37.0, 27.0, 19.0, 25.0, 22.0, 23.0, 25.0, 12.0, 17.0, 12.0, 11.0, 7.0, 5.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.80859375, -7.56024169921875, -7.3118896484375, -7.06353759765625, -6.815185546875, -6.56683349609375, -6.3184814453125, -6.07012939453125, -5.82177734375, -5.57342529296875, -5.3250732421875, -5.07672119140625, -4.828369140625, -4.58001708984375, -4.3316650390625, -4.08331298828125, -3.8349609375, -3.58660888671875, -3.3382568359375, -3.08990478515625, -2.841552734375, -2.59320068359375, -2.3448486328125, -2.09649658203125, -1.84814453125, -1.59979248046875, -1.3514404296875, -1.10308837890625, -0.854736328125, -0.60638427734375, -0.3580322265625, -0.10968017578125, 0.138671875, 0.38702392578125, 0.6353759765625, 0.88372802734375, 1.132080078125, 1.38043212890625, 1.6287841796875, 1.87713623046875, 2.12548828125, 2.37384033203125, 2.6221923828125, 2.87054443359375, 3.118896484375, 3.36724853515625, 3.6156005859375, 3.86395263671875, 4.1123046875, 4.36065673828125, 4.6090087890625, 4.85736083984375, 5.105712890625, 5.35406494140625, 5.6024169921875, 5.85076904296875, 6.09912109375, 6.34747314453125, 6.5958251953125, 6.84417724609375, 7.092529296875, 7.34088134765625, 7.5892333984375, 7.83758544921875, 8.0859375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 6.0, 16.0, 20.0, 17.0, 34.0, 40.0, 65.0, 78.0, 101.0, 150.0, 257.0, 389.0, 517.0, 826.0, 1211.0, 1954.0, 3114.0, 5175.0, 8936.0, 15673.0, 28551.0, 53169.0, 103358.0, 203164.0, 277766.0, 162869.0, 82427.0, 43086.0, 23057.0, 12986.0, 7425.0, 4373.0, 2768.0, 1709.0, 1050.0, 708.0, 465.0, 291.0, 239.0, 142.0, 125.0, 68.0, 55.0, 36.0, 22.0, 21.0, 14.0, 8.0, 9.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6708984375, -1.615814208984375, -1.56072998046875, -1.505645751953125, -1.4505615234375, -1.395477294921875, -1.34039306640625, -1.285308837890625, -1.230224609375, -1.175140380859375, -1.12005615234375, -1.064971923828125, -1.0098876953125, -0.954803466796875, -0.89971923828125, -0.844635009765625, -0.78955078125, -0.734466552734375, -0.67938232421875, -0.624298095703125, -0.5692138671875, -0.514129638671875, -0.45904541015625, -0.403961181640625, -0.348876953125, -0.293792724609375, -0.23870849609375, -0.183624267578125, -0.1285400390625, -0.073455810546875, -0.01837158203125, 0.036712646484375, 0.091796875, 0.146881103515625, 0.20196533203125, 0.257049560546875, 0.3121337890625, 0.367218017578125, 0.42230224609375, 0.477386474609375, 0.532470703125, 0.587554931640625, 0.64263916015625, 0.697723388671875, 0.7528076171875, 0.807891845703125, 0.86297607421875, 0.918060302734375, 0.97314453125, 1.028228759765625, 1.08331298828125, 1.138397216796875, 1.1934814453125, 1.248565673828125, 1.30364990234375, 1.358734130859375, 1.413818359375, 1.468902587890625, 1.52398681640625, 1.579071044921875, 1.6341552734375, 1.689239501953125, 1.74432373046875, 1.799407958984375, 1.8544921875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 7.0, 10.0, 6.0, 5.0, 7.0, 9.0, 7.0, 10.0, 21.0, 23.0, 30.0, 22.0, 23.0, 26.0, 29.0, 35.0, 33.0, 34.0, 36.0, 32.0, 37.0, 37.0, 1072.0, 46.0, 46.0, 45.0, 40.0, 26.0, 38.0, 30.0, 33.0, 22.0, 31.0, 25.0, 16.0, 12.0, 10.0, 11.0, 5.0, 11.0, 6.0, 5.0, 6.0, 2.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.29296875, -5.12322998046875, -4.9534912109375, -4.78375244140625, -4.614013671875, -4.44427490234375, -4.2745361328125, -4.10479736328125, -3.93505859375, -3.76531982421875, -3.5955810546875, -3.42584228515625, -3.256103515625, -3.08636474609375, -2.9166259765625, -2.74688720703125, -2.5771484375, -2.40740966796875, -2.2376708984375, -2.06793212890625, -1.898193359375, -1.72845458984375, -1.5587158203125, -1.38897705078125, -1.21923828125, -1.04949951171875, -0.8797607421875, -0.71002197265625, -0.540283203125, -0.37054443359375, -0.2008056640625, -0.03106689453125, 0.138671875, 0.30841064453125, 0.4781494140625, 0.64788818359375, 0.817626953125, 0.98736572265625, 1.1571044921875, 1.32684326171875, 1.49658203125, 1.66632080078125, 1.8360595703125, 2.00579833984375, 2.175537109375, 2.34527587890625, 2.5150146484375, 2.68475341796875, 2.8544921875, 3.02423095703125, 3.1939697265625, 3.36370849609375, 3.533447265625, 3.70318603515625, 3.8729248046875, 4.04266357421875, 4.21240234375, 4.38214111328125, 4.5518798828125, 4.72161865234375, 4.891357421875, 5.06109619140625, 5.2308349609375, 5.40057373046875, 5.5703125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 7.0, 11.0, 16.0, 12.0, 22.0, 35.0, 44.0, 55.0, 100.0, 130.0, 168.0, 273.0, 453.0, 711.0, 1291.0, 2264.0, 4302.0, 8222.0, 17175.0, 36059.0, 82595.0, 209549.0, 1301861.0, 254898.0, 95655.0, 41717.0, 19165.0, 9419.0, 4679.0, 2567.0, 1415.0, 837.0, 481.0, 318.0, 205.0, 115.0, 97.0, 58.0, 40.0, 34.0, 17.0, 18.0, 16.0, 9.0, 9.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7744140625, -0.7482376098632812, -0.7220611572265625, -0.6958847045898438, -0.669708251953125, -0.6435317993164062, -0.6173553466796875, -0.5911788940429688, -0.56500244140625, -0.5388259887695312, -0.5126495361328125, -0.48647308349609375, -0.460296630859375, -0.43412017822265625, -0.4079437255859375, -0.38176727294921875, -0.3555908203125, -0.32941436767578125, -0.3032379150390625, -0.27706146240234375, -0.250885009765625, -0.22470855712890625, -0.1985321044921875, -0.17235565185546875, -0.14617919921875, -0.12000274658203125, -0.0938262939453125, -0.06764984130859375, -0.041473388671875, -0.01529693603515625, 0.0108795166015625, 0.03705596923828125, 0.063232421875, 0.08940887451171875, 0.1155853271484375, 0.14176177978515625, 0.167938232421875, 0.19411468505859375, 0.2202911376953125, 0.24646759033203125, 0.27264404296875, 0.29882049560546875, 0.3249969482421875, 0.35117340087890625, 0.377349853515625, 0.40352630615234375, 0.4297027587890625, 0.45587921142578125, 0.4820556640625, 0.5082321166992188, 0.5344085693359375, 0.5605850219726562, 0.586761474609375, 0.6129379272460938, 0.6391143798828125, 0.6652908325195312, 0.69146728515625, 0.7176437377929688, 0.7438201904296875, 0.7699966430664062, 0.796173095703125, 0.8223495483398438, 0.8485260009765625, 0.8747024536132812, 0.90087890625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 6.0, 4.0, 3.0, 8.0, 5.0, 13.0, 15.0, 12.0, 14.0, 25.0, 34.0, 43.0, 42.0, 47.0, 49.0, 69.0, 69.0, 60.0, 65.0, 73.0, 51.0, 43.0, 39.0, 37.0, 35.0, 24.0, 22.0, 13.0, 13.0, 14.0, 14.0, 11.0, 6.0, 7.0, 3.0, 1.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.285400390625, -0.27634429931640625, -0.2672882080078125, -0.25823211669921875, -0.249176025390625, -0.24011993408203125, -0.2310638427734375, -0.22200775146484375, -0.21295166015625, -0.20389556884765625, -0.1948394775390625, -0.18578338623046875, -0.176727294921875, -0.16767120361328125, -0.1586151123046875, -0.14955902099609375, -0.1405029296875, -0.13144683837890625, -0.1223907470703125, -0.11333465576171875, -0.104278564453125, -0.09522247314453125, -0.0861663818359375, -0.07711029052734375, -0.06805419921875, -0.05899810791015625, -0.0499420166015625, -0.04088592529296875, -0.031829833984375, -0.02277374267578125, -0.0137176513671875, -0.00466156005859375, 0.00439453125, 0.01345062255859375, 0.0225067138671875, 0.03156280517578125, 0.040618896484375, 0.04967498779296875, 0.0587310791015625, 0.06778717041015625, 0.07684326171875, 0.08589935302734375, 0.0949554443359375, 0.10401153564453125, 0.113067626953125, 0.12212371826171875, 0.1311798095703125, 0.14023590087890625, 0.1492919921875, 0.15834808349609375, 0.1674041748046875, 0.17646026611328125, 0.185516357421875, 0.19457244873046875, 0.2036285400390625, 0.21268463134765625, 0.22174072265625, 0.23079681396484375, 0.2398529052734375, 0.24890899658203125, 0.257965087890625, 0.26702117919921875, 0.2760772705078125, 0.28513336181640625, 0.294189453125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 7.0, 3.0, 13.0, 8.0, 12.0, 13.0, 14.0, 18.0, 26.0, 26.0, 40.0, 49.0, 58.0, 145.0, 222.0, 718.0, 12454.0, 1023245.0, 10162.0, 674.0, 244.0, 95.0, 88.0, 58.0, 32.0, 30.0, 16.0, 13.0, 17.0, 9.0, 9.0, 6.0, 5.0, 4.0, 7.0, 0.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.22265625, -6.03106689453125, -5.8394775390625, -5.64788818359375, -5.456298828125, -5.26470947265625, -5.0731201171875, -4.88153076171875, -4.68994140625, -4.49835205078125, -4.3067626953125, -4.11517333984375, -3.923583984375, -3.73199462890625, -3.5404052734375, -3.34881591796875, -3.1572265625, -2.96563720703125, -2.7740478515625, -2.58245849609375, -2.390869140625, -2.19927978515625, -2.0076904296875, -1.81610107421875, -1.62451171875, -1.43292236328125, -1.2413330078125, -1.04974365234375, -0.858154296875, -0.66656494140625, -0.4749755859375, -0.28338623046875, -0.091796875, 0.09979248046875, 0.2913818359375, 0.48297119140625, 0.674560546875, 0.86614990234375, 1.0577392578125, 1.24932861328125, 1.44091796875, 1.63250732421875, 1.8240966796875, 2.01568603515625, 2.207275390625, 2.39886474609375, 2.5904541015625, 2.78204345703125, 2.9736328125, 3.16522216796875, 3.3568115234375, 3.54840087890625, 3.739990234375, 3.93157958984375, 4.1231689453125, 4.31475830078125, 4.50634765625, 4.69793701171875, 4.8895263671875, 5.08111572265625, 5.272705078125, 5.46429443359375, 5.6558837890625, 5.84747314453125, 6.0390625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 10.0, 13.0, 14.0, 21.0, 41.0, 64.0, 107.0, 318.0, 202.0, 89.0, 54.0, 29.0, 18.0, 11.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.952785313129425, -0.9020622968673706, -0.8513392806053162, -0.8006162643432617, -0.7498931884765625, -0.6991701722145081, -0.6484471559524536, -0.5977240800857544, -0.5470011234283447, -0.4962781071662903, -0.44555506110191345, -0.394832044839859, -0.3441089987754822, -0.29338598251342773, -0.2426629662513733, -0.19193992018699646, -0.14121687412261963, -0.09049384295940399, -0.03977081924676895, 0.010952204465866089, 0.061675235629081726, 0.11239826679229736, 0.1631212830543518, 0.21384432911872864, 0.2645673453807831, 0.3152903616428375, 0.36601340770721436, 0.4167364239692688, 0.46745944023132324, 0.5181825160980225, 0.5689054727554321, 0.6196285486221313, 0.6703516244888306, 0.721074640750885, 0.7717976570129395, 0.8225207328796387, 0.8732437491416931, 0.9239667654037476, 0.974689781665802, 1.0254127979278564, 1.0761358737945557, 1.1268589496612549, 1.1775819063186646, 1.2283049821853638, 1.2790279388427734, 1.3297510147094727, 1.3804740905761719, 1.4311970472335815, 1.4819200038909912, 1.5326430797576904, 1.5833660364151, 1.6340891122817993, 1.684812068939209, 1.7355351448059082, 1.7862582206726074, 1.836981177330017, 1.8877042531967163, 1.9384273290634155, 1.9891502857208252, 2.0398733615875244, 2.0905964374542236, 2.1413192749023438, 2.192042350769043, 2.242765426635742, 2.2934885025024414]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 1.0, 4.0, 4.0, 3.0, 4.0, 10.0, 9.0, 12.0, 13.0, 16.0, 17.0, 21.0, 19.0, 24.0, 33.0, 36.0, 20.0, 26.0, 43.0, 30.0, 32.0, 52.0, 45.0, 43.0, 36.0, 32.0, 33.0, 44.0, 42.0, 28.0, 21.0, 31.0, 25.0, 34.0, 26.0, 24.0, 17.0, 15.0, 12.0, 16.0, 10.0, 6.0, 5.0, 9.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.0562572479248047, -1.022892713546753, -0.9895281791687012, -0.9561636447906494, -0.9227991104125977, -0.8894345760345459, -0.8560700416564941, -0.8227055072784424, -0.7893409729003906, -0.7559764385223389, -0.7226119041442871, -0.6892473697662354, -0.6558828353881836, -0.6225183010101318, -0.5891537666320801, -0.5557892322540283, -0.5224246978759766, -0.4890601634979248, -0.45569562911987305, -0.4223310947418213, -0.38896656036376953, -0.3556020259857178, -0.322237491607666, -0.28887295722961426, -0.2555084228515625, -0.22214388847351074, -0.18877935409545898, -0.15541481971740723, -0.12205028533935547, -0.08868575096130371, -0.05532121658325195, -0.021956682205200195, 0.011407971382141113, 0.04477250576019287, 0.07813704013824463, 0.11150157451629639, 0.14486610889434814, 0.1782306432723999, 0.21159517765045166, 0.24495971202850342, 0.2783242464065552, 0.31168878078460693, 0.3450533151626587, 0.37841784954071045, 0.4117823839187622, 0.44514691829681396, 0.4785114526748657, 0.5118759870529175, 0.5452405214309692, 0.578605055809021, 0.6119695901870728, 0.6453341245651245, 0.6786986589431763, 0.712063193321228, 0.7454277276992798, 0.7787922620773315, 0.8121567964553833, 0.8455213308334351, 0.8788858652114868, 0.9122503995895386, 0.9456149339675903, 0.9789794683456421, 1.0123440027236938, 1.0457085371017456, 1.0790730714797974]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 7.0, 2.0, 4.0, 7.0, 4.0, 12.0, 14.0, 13.0, 15.0, 20.0, 19.0, 24.0, 24.0, 38.0, 46.0, 29.0, 40.0, 42.0, 32.0, 45.0, 41.0, 39.0, 36.0, 50.0, 34.0, 49.0, 45.0, 34.0, 28.0, 20.0, 24.0, 23.0, 22.0, 28.0, 11.0, 17.0, 14.0, 9.0, 7.0, 4.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.81640625, -7.56781005859375, -7.3192138671875, -7.07061767578125, -6.822021484375, -6.57342529296875, -6.3248291015625, -6.07623291015625, -5.82763671875, -5.57904052734375, -5.3304443359375, -5.08184814453125, -4.833251953125, -4.58465576171875, -4.3360595703125, -4.08746337890625, -3.8388671875, -3.59027099609375, -3.3416748046875, -3.09307861328125, -2.844482421875, -2.59588623046875, -2.3472900390625, -2.09869384765625, -1.85009765625, -1.60150146484375, -1.3529052734375, -1.10430908203125, -0.855712890625, -0.60711669921875, -0.3585205078125, -0.10992431640625, 0.138671875, 0.38726806640625, 0.6358642578125, 0.88446044921875, 1.133056640625, 1.38165283203125, 1.6302490234375, 1.87884521484375, 2.12744140625, 2.37603759765625, 2.6246337890625, 2.87322998046875, 3.121826171875, 3.37042236328125, 3.6190185546875, 3.86761474609375, 4.1162109375, 4.36480712890625, 4.6134033203125, 4.86199951171875, 5.110595703125, 5.35919189453125, 5.6077880859375, 5.85638427734375, 6.10498046875, 6.35357666015625, 6.6021728515625, 6.85076904296875, 7.099365234375, 7.34796142578125, 7.5965576171875, 7.84515380859375, 8.09375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 2.0, 6.0, 10.0, 13.0, 19.0, 28.0, 19.0, 35.0, 65.0, 106.0, 120.0, 193.0, 274.0, 414.0, 628.0, 917.0, 1368.0, 1967.0, 3028.0, 4728.0, 7569.0, 14324.0, 34908.0, 113320.0, 409832.0, 313302.0, 82763.0, 27094.0, 12121.0, 6802.0, 4211.0, 2748.0, 1746.0, 1222.0, 824.0, 541.0, 355.0, 320.0, 203.0, 140.0, 86.0, 54.0, 35.0, 33.0, 22.0, 9.0, 8.0, 8.0, 4.0, 3.0, 5.0, 1.0, 4.0, 3.0], "bins": [-12.734375, -12.3692626953125, -12.004150390625, -11.6390380859375, -11.27392578125, -10.9088134765625, -10.543701171875, -10.1785888671875, -9.8134765625, -9.4483642578125, -9.083251953125, -8.7181396484375, -8.35302734375, -7.9879150390625, -7.622802734375, -7.2576904296875, -6.892578125, -6.5274658203125, -6.162353515625, -5.7972412109375, -5.43212890625, -5.0670166015625, -4.701904296875, -4.3367919921875, -3.9716796875, -3.6065673828125, -3.241455078125, -2.8763427734375, -2.51123046875, -2.1461181640625, -1.781005859375, -1.4158935546875, -1.05078125, -0.6856689453125, -0.320556640625, 0.0445556640625, 0.40966796875, 0.7747802734375, 1.139892578125, 1.5050048828125, 1.8701171875, 2.2352294921875, 2.600341796875, 2.9654541015625, 3.33056640625, 3.6956787109375, 4.060791015625, 4.4259033203125, 4.791015625, 5.1561279296875, 5.521240234375, 5.8863525390625, 6.25146484375, 6.6165771484375, 6.981689453125, 7.3468017578125, 7.7119140625, 8.0770263671875, 8.442138671875, 8.8072509765625, 9.17236328125, 9.5374755859375, 9.902587890625, 10.2677001953125, 10.6328125]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 8.0, 6.0, 8.0, 8.0, 6.0, 9.0, 20.0, 19.0, 13.0, 26.0, 30.0, 28.0, 37.0, 34.0, 46.0, 48.0, 44.0, 75.0, 118.0, 268.0, 1455.0, 202.0, 119.0, 62.0, 49.0, 44.0, 27.0, 33.0, 28.0, 37.0, 18.0, 17.0, 26.0, 20.0, 11.0, 16.0, 10.0, 9.0, 4.0, 6.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.40625, -19.66064453125, -18.9150390625, -18.16943359375, -17.423828125, -16.67822265625, -15.9326171875, -15.18701171875, -14.44140625, -13.69580078125, -12.9501953125, -12.20458984375, -11.458984375, -10.71337890625, -9.9677734375, -9.22216796875, -8.4765625, -7.73095703125, -6.9853515625, -6.23974609375, -5.494140625, -4.74853515625, -4.0029296875, -3.25732421875, -2.51171875, -1.76611328125, -1.0205078125, -0.27490234375, 0.470703125, 1.21630859375, 1.9619140625, 2.70751953125, 3.453125, 4.19873046875, 4.9443359375, 5.68994140625, 6.435546875, 7.18115234375, 7.9267578125, 8.67236328125, 9.41796875, 10.16357421875, 10.9091796875, 11.65478515625, 12.400390625, 13.14599609375, 13.8916015625, 14.63720703125, 15.3828125, 16.12841796875, 16.8740234375, 17.61962890625, 18.365234375, 19.11083984375, 19.8564453125, 20.60205078125, 21.34765625, 22.09326171875, 22.8388671875, 23.58447265625, 24.330078125, 25.07568359375, 25.8212890625, 26.56689453125, 27.3125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 7.0, 12.0, 18.0, 19.0, 18.0, 23.0, 39.0, 39.0, 51.0, 53.0, 90.0, 77.0, 125.0, 177.0, 290.0, 584.0, 1315.0, 4007.0, 15841.0, 239784.0, 2805786.0, 63055.0, 9270.0, 2602.0, 941.0, 437.0, 292.0, 155.0, 125.0, 93.0, 80.0, 65.0, 45.0, 38.0, 37.0, 19.0, 14.0, 12.0, 12.0, 14.0, 7.0, 9.0, 1.0, 8.0, 4.0, 1.0, 1.0, 1.0, 5.0], "bins": [-46.15625, -44.849609375, -43.54296875, -42.236328125, -40.9296875, -39.623046875, -38.31640625, -37.009765625, -35.703125, -34.396484375, -33.08984375, -31.783203125, -30.4765625, -29.169921875, -27.86328125, -26.556640625, -25.25, -23.943359375, -22.63671875, -21.330078125, -20.0234375, -18.716796875, -17.41015625, -16.103515625, -14.796875, -13.490234375, -12.18359375, -10.876953125, -9.5703125, -8.263671875, -6.95703125, -5.650390625, -4.34375, -3.037109375, -1.73046875, -0.423828125, 0.8828125, 2.189453125, 3.49609375, 4.802734375, 6.109375, 7.416015625, 8.72265625, 10.029296875, 11.3359375, 12.642578125, 13.94921875, 15.255859375, 16.5625, 17.869140625, 19.17578125, 20.482421875, 21.7890625, 23.095703125, 24.40234375, 25.708984375, 27.015625, 28.322265625, 29.62890625, 30.935546875, 32.2421875, 33.548828125, 34.85546875, 36.162109375, 37.46875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 16.0, 53.0, 114.0, 211.0, 286.0, 195.0, 79.0, 32.0, 11.0, 9.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.54403686523438, -80.15449523925781, -75.76495361328125, -71.37541961669922, -66.98587799072266, -62.596336364746094, -58.2067985534668, -53.8172607421875, -49.42771911621094, -45.038177490234375, -40.64863967895508, -36.25910186767578, -31.86956024169922, -27.48002052307129, -23.09048080444336, -18.70094108581543, -14.3114013671875, -9.92186164855957, -5.532321929931641, -1.142782211303711, 3.2467575073242188, 7.636297225952148, 12.025836944580078, 16.415376663208008, 20.804916381835938, 25.194456100463867, 29.583995819091797, 33.973533630371094, 38.363075256347656, 42.75261688232422, 47.142154693603516, 51.53169250488281, 55.92121887207031, 60.310760498046875, 64.70030212402344, 69.08983612060547, 73.47937774658203, 77.8689193725586, 82.25845336914062, 86.64799499511719, 91.03753662109375, 95.42707824707031, 99.81661987304688, 104.2061538696289, 108.59569549560547, 112.98523712158203, 117.37477111816406, 121.76431274414062, 126.15385437011719, 130.54339599609375, 134.9329376220703, 139.32247924804688, 143.71200561523438, 148.10154724121094, 152.4910888671875, 156.88063049316406, 161.27017211914062, 165.6597137451172, 170.04925537109375, 174.4387969970703, 178.82833862304688, 183.21786499023438, 187.60740661621094, 191.9969482421875, 196.38648986816406]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 10.0, 7.0, 18.0, 10.0, 15.0, 17.0, 13.0, 22.0, 33.0, 29.0, 36.0, 28.0, 26.0, 37.0, 34.0, 36.0, 48.0, 49.0, 41.0, 42.0, 43.0, 42.0, 33.0, 31.0, 21.0, 38.0, 20.0, 27.0, 30.0, 16.0, 23.0, 17.0, 17.0, 11.0, 10.0, 17.0, 10.0, 4.0, 10.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0], "bins": [-60.20482635498047, -58.35892105102539, -56.51301956176758, -54.6671142578125, -52.82121276855469, -50.97530746459961, -49.12940216064453, -47.28350067138672, -45.437599182128906, -43.59169387817383, -41.745792388916016, -39.89988708496094, -38.053985595703125, -36.20808029174805, -34.36217498779297, -32.516273498535156, -30.670368194580078, -28.824464797973633, -26.978561401367188, -25.13265609741211, -23.286754608154297, -21.44084930419922, -19.594945907592773, -17.749042510986328, -15.903139114379883, -14.057235717773438, -12.211332321166992, -10.36542797088623, -8.519524574279785, -6.67362117767334, -4.827716827392578, -2.981813430786133, -1.1359062194824219, 0.7099974155426025, 2.555901050567627, 4.4018049240112305, 6.247708320617676, 8.093611717224121, 9.939516067504883, 11.785419464111328, 13.631322860717773, 15.477226257324219, 17.323129653930664, 19.16903305053711, 21.014938354492188, 22.86083984375, 24.706745147705078, 26.552648544311523, 28.39855194091797, 30.244455337524414, 32.09035873413086, 33.93626403808594, 35.78216552734375, 37.62807083129883, 39.473976135253906, 41.31987762451172, 43.16577911376953, 45.01168441772461, 46.85758590698242, 48.7034912109375, 50.54939270019531, 52.39529800415039, 54.24120330810547, 56.08710479736328, 57.93301010131836]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 0.0, 5.0, 4.0, 5.0, 12.0, 13.0, 17.0, 19.0, 19.0, 19.0, 29.0, 29.0, 31.0, 26.0, 31.0, 45.0, 30.0, 45.0, 41.0, 50.0, 50.0, 39.0, 46.0, 37.0, 41.0, 37.0, 39.0, 29.0, 26.0, 29.0, 29.0, 12.0, 26.0, 13.0, 12.0, 13.0, 14.0, 6.0, 6.0, 8.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.859375, -7.5936279296875, -7.327880859375, -7.0621337890625, -6.79638671875, -6.5306396484375, -6.264892578125, -5.9991455078125, -5.7333984375, -5.4676513671875, -5.201904296875, -4.9361572265625, -4.67041015625, -4.4046630859375, -4.138916015625, -3.8731689453125, -3.607421875, -3.3416748046875, -3.075927734375, -2.8101806640625, -2.54443359375, -2.2786865234375, -2.012939453125, -1.7471923828125, -1.4814453125, -1.2156982421875, -0.949951171875, -0.6842041015625, -0.41845703125, -0.1527099609375, 0.113037109375, 0.3787841796875, 0.64453125, 0.9102783203125, 1.176025390625, 1.4417724609375, 1.70751953125, 1.9732666015625, 2.239013671875, 2.5047607421875, 2.7705078125, 3.0362548828125, 3.302001953125, 3.5677490234375, 3.83349609375, 4.0992431640625, 4.364990234375, 4.6307373046875, 4.896484375, 5.1622314453125, 5.427978515625, 5.6937255859375, 5.95947265625, 6.2252197265625, 6.490966796875, 6.7567138671875, 7.0224609375, 7.2882080078125, 7.553955078125, 7.8197021484375, 8.08544921875, 8.3511962890625, 8.616943359375, 8.8826904296875, 9.1484375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 0.0, 4.0, 11.0, 11.0, 10.0, 14.0, 20.0, 26.0, 44.0, 69.0, 102.0, 174.0, 279.0, 408.0, 696.0, 1143.0, 1938.0, 3376.0, 6796.0, 13694.0, 34530.0, 142730.0, 1195093.0, 2348130.0, 347264.0, 58401.0, 19882.0, 8825.0, 4589.0, 2362.0, 1327.0, 829.0, 499.0, 323.0, 221.0, 149.0, 120.0, 55.0, 34.0, 27.0, 25.0, 13.0, 16.0, 6.0, 4.0, 2.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-21.6875, -21.03466796875, -20.3818359375, -19.72900390625, -19.076171875, -18.42333984375, -17.7705078125, -17.11767578125, -16.46484375, -15.81201171875, -15.1591796875, -14.50634765625, -13.853515625, -13.20068359375, -12.5478515625, -11.89501953125, -11.2421875, -10.58935546875, -9.9365234375, -9.28369140625, -8.630859375, -7.97802734375, -7.3251953125, -6.67236328125, -6.01953125, -5.36669921875, -4.7138671875, -4.06103515625, -3.408203125, -2.75537109375, -2.1025390625, -1.44970703125, -0.796875, -0.14404296875, 0.5087890625, 1.16162109375, 1.814453125, 2.46728515625, 3.1201171875, 3.77294921875, 4.42578125, 5.07861328125, 5.7314453125, 6.38427734375, 7.037109375, 7.68994140625, 8.3427734375, 8.99560546875, 9.6484375, 10.30126953125, 10.9541015625, 11.60693359375, 12.259765625, 12.91259765625, 13.5654296875, 14.21826171875, 14.87109375, 15.52392578125, 16.1767578125, 16.82958984375, 17.482421875, 18.13525390625, 18.7880859375, 19.44091796875, 20.09375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 6.0, 16.0, 17.0, 27.0, 41.0, 35.0, 67.0, 106.0, 141.0, 200.0, 338.0, 436.0, 595.0, 568.0, 459.0, 301.0, 207.0, 125.0, 107.0, 67.0, 71.0, 35.0, 24.0, 19.0, 19.0, 12.0, 6.0, 8.0, 3.0, 4.0, 6.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.09375, -19.467529296875, -18.84130859375, -18.215087890625, -17.5888671875, -16.962646484375, -16.33642578125, -15.710205078125, -15.083984375, -14.457763671875, -13.83154296875, -13.205322265625, -12.5791015625, -11.952880859375, -11.32666015625, -10.700439453125, -10.07421875, -9.447998046875, -8.82177734375, -8.195556640625, -7.5693359375, -6.943115234375, -6.31689453125, -5.690673828125, -5.064453125, -4.438232421875, -3.81201171875, -3.185791015625, -2.5595703125, -1.933349609375, -1.30712890625, -0.680908203125, -0.0546875, 0.571533203125, 1.19775390625, 1.823974609375, 2.4501953125, 3.076416015625, 3.70263671875, 4.328857421875, 4.955078125, 5.581298828125, 6.20751953125, 6.833740234375, 7.4599609375, 8.086181640625, 8.71240234375, 9.338623046875, 9.96484375, 10.591064453125, 11.21728515625, 11.843505859375, 12.4697265625, 13.095947265625, 13.72216796875, 14.348388671875, 14.974609375, 15.600830078125, 16.22705078125, 16.853271484375, 17.4794921875, 18.105712890625, 18.73193359375, 19.358154296875, 19.984375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 7.0, 8.0, 8.0, 8.0, 14.0, 22.0, 28.0, 42.0, 55.0, 87.0, 132.0, 201.0, 414.0, 948.0, 2947.0, 13223.0, 95301.0, 2655049.0, 1352741.0, 59433.0, 9533.0, 2429.0, 842.0, 347.0, 172.0, 84.0, 66.0, 49.0, 35.0, 19.0, 17.0, 6.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.6875, -47.05908203125, -45.4306640625, -43.80224609375, -42.173828125, -40.54541015625, -38.9169921875, -37.28857421875, -35.66015625, -34.03173828125, -32.4033203125, -30.77490234375, -29.146484375, -27.51806640625, -25.8896484375, -24.26123046875, -22.6328125, -21.00439453125, -19.3759765625, -17.74755859375, -16.119140625, -14.49072265625, -12.8623046875, -11.23388671875, -9.60546875, -7.97705078125, -6.3486328125, -4.72021484375, -3.091796875, -1.46337890625, 0.1650390625, 1.79345703125, 3.421875, 5.05029296875, 6.6787109375, 8.30712890625, 9.935546875, 11.56396484375, 13.1923828125, 14.82080078125, 16.44921875, 18.07763671875, 19.7060546875, 21.33447265625, 22.962890625, 24.59130859375, 26.2197265625, 27.84814453125, 29.4765625, 31.10498046875, 32.7333984375, 34.36181640625, 35.990234375, 37.61865234375, 39.2470703125, 40.87548828125, 42.50390625, 44.13232421875, 45.7607421875, 47.38916015625, 49.017578125, 50.64599609375, 52.2744140625, 53.90283203125, 55.53125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 5.0, 14.0, 21.0, 23.0, 41.0, 63.0, 69.0, 88.0, 101.0, 120.0, 109.0, 87.0, 76.0, 61.0, 47.0, 30.0, 25.0, 9.0, 3.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-153.76983642578125, -150.536376953125, -147.3029022216797, -144.06944274902344, -140.8359832763672, -137.60250854492188, -134.36904907226562, -131.13558959960938, -127.9021224975586, -124.66865539550781, -121.43519592285156, -118.20172882080078, -114.96826171875, -111.73480224609375, -108.50133514404297, -105.26786804199219, -102.03440856933594, -98.80094146728516, -95.5674819946289, -92.33401489257812, -89.10054779052734, -85.8670883178711, -82.63362121582031, -79.40016174316406, -76.16668701171875, -72.93321990966797, -69.69976043701172, -66.46629333496094, -63.23283004760742, -59.999366760253906, -56.765899658203125, -53.53243637084961, -50.29896926879883, -47.06550598144531, -43.83203887939453, -40.598575592041016, -37.3651123046875, -34.13164520263672, -30.898181915283203, -27.664718627929688, -24.43125343322754, -21.19778823852539, -17.964324951171875, -14.730859756469727, -11.497395515441895, -8.263931274414062, -5.030466079711914, -1.7970027923583984, 1.43646240234375, 4.669926643371582, 7.903391361236572, 11.136856079101562, 14.370320320129395, 17.603784561157227, 20.837249755859375, 24.07071304321289, 27.30417823791504, 30.537643432617188, 33.7711067199707, 37.00457000732422, 40.238037109375, 43.471500396728516, 46.70496368408203, 49.93843078613281, 53.17189407348633]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 5.0, 5.0, 6.0, 9.0, 12.0, 12.0, 13.0, 8.0, 24.0, 27.0, 29.0, 30.0, 24.0, 41.0, 50.0, 36.0, 42.0, 36.0, 45.0, 53.0, 41.0, 46.0, 39.0, 38.0, 53.0, 33.0, 29.0, 44.0, 23.0, 20.0, 19.0, 20.0, 15.0, 9.0, 13.0, 11.0, 11.0, 8.0, 7.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.703155517578125, -57.82478332519531, -55.9464111328125, -54.06803894042969, -52.18966293334961, -50.3112907409668, -48.432918548583984, -46.55454635620117, -44.676170349121094, -42.79779815673828, -40.91942596435547, -39.041053771972656, -37.16267776489258, -35.284305572509766, -33.40593338012695, -31.52756118774414, -29.649188995361328, -27.770816802978516, -25.89244270324707, -24.014070510864258, -22.135696411132812, -20.25732421875, -18.378952026367188, -16.500579833984375, -14.62220573425293, -12.7438325881958, -10.865459442138672, -8.98708724975586, -7.1087141036987305, -5.230340957641602, -3.351968765258789, -1.4735956192016602, 0.40477752685546875, 2.2831504344940186, 4.161523342132568, 6.039896011352539, 7.918269157409668, 9.796642303466797, 11.67501449584961, 13.553387641906738, 15.431760787963867, 17.31013298034668, 19.188507080078125, 21.066879272460938, 22.94525146484375, 24.823625564575195, 26.701997756958008, 28.580371856689453, 30.458744049072266, 32.33711624145508, 34.21548843383789, 36.09386444091797, 37.97223663330078, 39.850608825683594, 41.728981018066406, 43.60735321044922, 45.48572540283203, 47.364097595214844, 49.242469787597656, 51.12084197998047, 52.99921798706055, 54.87759017944336, 56.75596237182617, 58.634334564208984, 60.51271057128906]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 3.0, 5.0, 8.0, 6.0, 13.0, 18.0, 21.0, 26.0, 25.0, 28.0, 33.0, 37.0, 44.0, 45.0, 50.0, 48.0, 56.0, 44.0, 65.0, 43.0, 46.0, 43.0, 45.0, 43.0, 25.0, 39.0, 26.0, 21.0, 22.0, 13.0, 17.0, 8.0, 11.0, 6.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.4375, -10.127685546875, -9.81787109375, -9.508056640625, -9.1982421875, -8.888427734375, -8.57861328125, -8.268798828125, -7.958984375, -7.649169921875, -7.33935546875, -7.029541015625, -6.7197265625, -6.409912109375, -6.10009765625, -5.790283203125, -5.48046875, -5.170654296875, -4.86083984375, -4.551025390625, -4.2412109375, -3.931396484375, -3.62158203125, -3.311767578125, -3.001953125, -2.692138671875, -2.38232421875, -2.072509765625, -1.7626953125, -1.452880859375, -1.14306640625, -0.833251953125, -0.5234375, -0.213623046875, 0.09619140625, 0.406005859375, 0.7158203125, 1.025634765625, 1.33544921875, 1.645263671875, 1.955078125, 2.264892578125, 2.57470703125, 2.884521484375, 3.1943359375, 3.504150390625, 3.81396484375, 4.123779296875, 4.43359375, 4.743408203125, 5.05322265625, 5.363037109375, 5.6728515625, 5.982666015625, 6.29248046875, 6.602294921875, 6.912109375, 7.221923828125, 7.53173828125, 7.841552734375, 8.1513671875, 8.461181640625, 8.77099609375, 9.080810546875, 9.390625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 8.0, 11.0, 12.0, 23.0, 28.0, 22.0, 65.0, 80.0, 131.0, 185.0, 266.0, 384.0, 591.0, 904.0, 1342.0, 2119.0, 3272.0, 5164.0, 8351.0, 13747.0, 23096.0, 39105.0, 69868.0, 129304.0, 227152.0, 225959.0, 128819.0, 69782.0, 39316.0, 22710.0, 13970.0, 8137.0, 5352.0, 3119.0, 2085.0, 1380.0, 871.0, 594.0, 401.0, 297.0, 167.0, 112.0, 75.0, 66.0, 46.0, 18.0, 15.0, 11.0, 9.0, 9.0, 2.0, 3.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5390625, -1.489410400390625, -1.43975830078125, -1.390106201171875, -1.3404541015625, -1.290802001953125, -1.24114990234375, -1.191497802734375, -1.141845703125, -1.092193603515625, -1.04254150390625, -0.992889404296875, -0.9432373046875, -0.893585205078125, -0.84393310546875, -0.794281005859375, -0.74462890625, -0.694976806640625, -0.64532470703125, -0.595672607421875, -0.5460205078125, -0.496368408203125, -0.44671630859375, -0.397064208984375, -0.347412109375, -0.297760009765625, -0.24810791015625, -0.198455810546875, -0.1488037109375, -0.099151611328125, -0.04949951171875, 0.000152587890625, 0.0498046875, 0.099456787109375, 0.14910888671875, 0.198760986328125, 0.2484130859375, 0.298065185546875, 0.34771728515625, 0.397369384765625, 0.447021484375, 0.496673583984375, 0.54632568359375, 0.595977783203125, 0.6456298828125, 0.695281982421875, 0.74493408203125, 0.794586181640625, 0.84423828125, 0.893890380859375, 0.94354248046875, 0.993194580078125, 1.0428466796875, 1.092498779296875, 1.14215087890625, 1.191802978515625, 1.241455078125, 1.291107177734375, 1.34075927734375, 1.390411376953125, 1.4400634765625, 1.489715576171875, 1.53936767578125, 1.589019775390625, 1.638671875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 1.0, 4.0, 5.0, 6.0, 5.0, 9.0, 8.0, 7.0, 13.0, 17.0, 13.0, 18.0, 23.0, 19.0, 29.0, 22.0, 29.0, 28.0, 19.0, 34.0, 29.0, 26.0, 42.0, 34.0, 32.0, 1066.0, 31.0, 34.0, 40.0, 29.0, 40.0, 33.0, 35.0, 20.0, 27.0, 19.0, 19.0, 21.0, 24.0, 22.0, 12.0, 14.0, 10.0, 7.0, 15.0, 9.0, 4.0, 1.0, 7.0, 8.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.94921875, -4.7955322265625, -4.641845703125, -4.4881591796875, -4.33447265625, -4.1807861328125, -4.027099609375, -3.8734130859375, -3.7197265625, -3.5660400390625, -3.412353515625, -3.2586669921875, -3.10498046875, -2.9512939453125, -2.797607421875, -2.6439208984375, -2.490234375, -2.3365478515625, -2.182861328125, -2.0291748046875, -1.87548828125, -1.7218017578125, -1.568115234375, -1.4144287109375, -1.2607421875, -1.1070556640625, -0.953369140625, -0.7996826171875, -0.64599609375, -0.4923095703125, -0.338623046875, -0.1849365234375, -0.03125, 0.1224365234375, 0.276123046875, 0.4298095703125, 0.58349609375, 0.7371826171875, 0.890869140625, 1.0445556640625, 1.1982421875, 1.3519287109375, 1.505615234375, 1.6593017578125, 1.81298828125, 1.9666748046875, 2.120361328125, 2.2740478515625, 2.427734375, 2.5814208984375, 2.735107421875, 2.8887939453125, 3.04248046875, 3.1961669921875, 3.349853515625, 3.5035400390625, 3.6572265625, 3.8109130859375, 3.964599609375, 4.1182861328125, 4.27197265625, 4.4256591796875, 4.579345703125, 4.7330322265625, 4.88671875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 6.0, 13.0, 12.0, 25.0, 28.0, 35.0, 58.0, 80.0, 94.0, 162.0, 215.0, 359.0, 538.0, 796.0, 1253.0, 2115.0, 3586.0, 5862.0, 10379.0, 18242.0, 31921.0, 59784.0, 115272.0, 282390.0, 1203654.0, 173383.0, 83964.0, 44630.0, 24330.0, 13676.0, 7933.0, 4759.0, 2837.0, 1667.0, 1076.0, 653.0, 410.0, 282.0, 176.0, 138.0, 97.0, 75.0, 46.0, 31.0, 31.0, 20.0, 14.0, 10.0, 3.0, 5.0, 4.0, 2.0, 1.0], "bins": [-0.7724609375, -0.7505569458007812, -0.7286529541015625, -0.7067489624023438, -0.684844970703125, -0.6629409790039062, -0.6410369873046875, -0.6191329956054688, -0.59722900390625, -0.5753250122070312, -0.5534210205078125, -0.5315170288085938, -0.509613037109375, -0.48770904541015625, -0.4658050537109375, -0.44390106201171875, -0.4219970703125, -0.40009307861328125, -0.3781890869140625, -0.35628509521484375, -0.334381103515625, -0.31247711181640625, -0.2905731201171875, -0.26866912841796875, -0.24676513671875, -0.22486114501953125, -0.2029571533203125, -0.18105316162109375, -0.159149169921875, -0.13724517822265625, -0.1153411865234375, -0.09343719482421875, -0.071533203125, -0.04962921142578125, -0.0277252197265625, -0.00582122802734375, 0.016082763671875, 0.03798675537109375, 0.0598907470703125, 0.08179473876953125, 0.10369873046875, 0.12560272216796875, 0.1475067138671875, 0.16941070556640625, 0.191314697265625, 0.21321868896484375, 0.2351226806640625, 0.25702667236328125, 0.2789306640625, 0.30083465576171875, 0.3227386474609375, 0.34464263916015625, 0.366546630859375, 0.38845062255859375, 0.4103546142578125, 0.43225860595703125, 0.45416259765625, 0.47606658935546875, 0.4979705810546875, 0.5198745727539062, 0.541778564453125, 0.5636825561523438, 0.5855865478515625, 0.6074905395507812, 0.62939453125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 5.0, 6.0, 1.0, 9.0, 6.0, 6.0, 1.0, 7.0, 8.0, 7.0, 4.0, 9.0, 8.0, 13.0, 19.0, 20.0, 15.0, 25.0, 27.0, 43.0, 60.0, 87.0, 125.0, 112.0, 83.0, 68.0, 53.0, 23.0, 21.0, 15.0, 15.0, 15.0, 8.0, 7.0, 9.0, 8.0, 6.0, 6.0, 9.0, 6.0, 7.0, 5.0, 3.0, 4.0, 7.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.314453125, -0.3046417236328125, -0.294830322265625, -0.2850189208984375, -0.27520751953125, -0.2653961181640625, -0.255584716796875, -0.2457733154296875, -0.2359619140625, -0.2261505126953125, -0.216339111328125, -0.2065277099609375, -0.19671630859375, -0.1869049072265625, -0.177093505859375, -0.1672821044921875, -0.157470703125, -0.1476593017578125, -0.137847900390625, -0.1280364990234375, -0.11822509765625, -0.1084136962890625, -0.098602294921875, -0.0887908935546875, -0.0789794921875, -0.0691680908203125, -0.059356689453125, -0.0495452880859375, -0.03973388671875, -0.0299224853515625, -0.020111083984375, -0.0102996826171875, -0.00048828125, 0.0093231201171875, 0.019134521484375, 0.0289459228515625, 0.03875732421875, 0.0485687255859375, 0.058380126953125, 0.0681915283203125, 0.0780029296875, 0.0878143310546875, 0.097625732421875, 0.1074371337890625, 0.11724853515625, 0.1270599365234375, 0.136871337890625, 0.1466827392578125, 0.156494140625, 0.1663055419921875, 0.176116943359375, 0.1859283447265625, 0.19573974609375, 0.2055511474609375, 0.215362548828125, 0.2251739501953125, 0.2349853515625, 0.2447967529296875, 0.254608154296875, 0.2644195556640625, 0.27423095703125, 0.2840423583984375, 0.293853759765625, 0.3036651611328125, 0.3134765625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 3.0, 3.0, 7.0, 6.0, 6.0, 11.0, 4.0, 10.0, 9.0, 9.0, 7.0, 20.0, 20.0, 31.0, 42.0, 77.0, 159.0, 355.0, 1369.0, 59918.0, 979217.0, 6137.0, 549.0, 221.0, 105.0, 49.0, 43.0, 35.0, 22.0, 15.0, 10.0, 11.0, 5.0, 6.0, 8.0, 7.0, 3.0, 4.0, 6.0, 6.0, 5.0, 5.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.87109375, -6.6578369140625, -6.444580078125, -6.2313232421875, -6.01806640625, -5.8048095703125, -5.591552734375, -5.3782958984375, -5.1650390625, -4.9517822265625, -4.738525390625, -4.5252685546875, -4.31201171875, -4.0987548828125, -3.885498046875, -3.6722412109375, -3.458984375, -3.2457275390625, -3.032470703125, -2.8192138671875, -2.60595703125, -2.3927001953125, -2.179443359375, -1.9661865234375, -1.7529296875, -1.5396728515625, -1.326416015625, -1.1131591796875, -0.89990234375, -0.6866455078125, -0.473388671875, -0.2601318359375, -0.046875, 0.1663818359375, 0.379638671875, 0.5928955078125, 0.80615234375, 1.0194091796875, 1.232666015625, 1.4459228515625, 1.6591796875, 1.8724365234375, 2.085693359375, 2.2989501953125, 2.51220703125, 2.7254638671875, 2.938720703125, 3.1519775390625, 3.365234375, 3.5784912109375, 3.791748046875, 4.0050048828125, 4.21826171875, 4.4315185546875, 4.644775390625, 4.8580322265625, 5.0712890625, 5.2845458984375, 5.497802734375, 5.7110595703125, 5.92431640625, 6.1375732421875, 6.350830078125, 6.5640869140625, 6.77734375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 5.0, 17.0, 29.0, 39.0, 67.0, 110.0, 323.0, 202.0, 85.0, 46.0, 39.0, 12.0, 10.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5964094400405884, -1.5320537090301514, -1.4676979780197144, -1.4033422470092773, -1.3389865159988403, -1.2746307849884033, -1.2102750539779663, -1.1459193229675293, -1.0815635919570923, -1.0172078609466553, -0.9528521299362183, -0.8884963989257812, -0.8241406679153442, -0.7597849369049072, -0.6954292058944702, -0.6310734748840332, -0.5667177438735962, -0.5023620128631592, -0.43800628185272217, -0.37365055084228516, -0.30929481983184814, -0.24493908882141113, -0.18058335781097412, -0.11622762680053711, -0.0518718957901001, 0.012483835220336914, 0.07683956623077393, 0.14119529724121094, 0.20555102825164795, 0.26990675926208496, 0.334262490272522, 0.398618221282959, 0.46297383308410645, 0.5273295640945435, 0.5916852951049805, 0.6560410261154175, 0.7203967571258545, 0.7847524881362915, 0.8491082191467285, 0.9134639501571655, 0.9778196811676025, 1.0421754121780396, 1.1065311431884766, 1.1708868741989136, 1.2352426052093506, 1.2995983362197876, 1.3639540672302246, 1.4283097982406616, 1.4926655292510986, 1.5570212602615356, 1.6213769912719727, 1.6857327222824097, 1.7500884532928467, 1.8144441843032837, 1.8787999153137207, 1.9431556463241577, 2.0075113773345947, 2.071866989135742, 2.1362228393554688, 2.2005786895751953, 2.2649343013763428, 2.3292899131774902, 2.393645763397217, 2.4580016136169434, 2.522357225418091]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 3.0, 5.0, 9.0, 6.0, 11.0, 17.0, 16.0, 18.0, 10.0, 26.0, 17.0, 27.0, 24.0, 30.0, 28.0, 35.0, 32.0, 29.0, 45.0, 36.0, 48.0, 34.0, 38.0, 35.0, 30.0, 37.0, 36.0, 39.0, 23.0, 40.0, 33.0, 31.0, 17.0, 22.0, 14.0, 22.0, 20.0, 5.0, 6.0, 5.0, 10.0, 2.0, 5.0, 4.0, 5.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.2055637836456299, -1.1697578430175781, -1.1339519023895264, -1.0981459617614746, -1.0623400211334229, -1.026534080505371, -0.9907281398773193, -0.9549221992492676, -0.9191162586212158, -0.8833103179931641, -0.8475043773651123, -0.8116984367370605, -0.7758924961090088, -0.740086555480957, -0.7042806148529053, -0.6684746742248535, -0.6326687335968018, -0.59686279296875, -0.5610568523406982, -0.5252509117126465, -0.4894449710845947, -0.45363903045654297, -0.4178330898284912, -0.38202714920043945, -0.3462212085723877, -0.31041526794433594, -0.2746093273162842, -0.23880338668823242, -0.20299744606018066, -0.1671915054321289, -0.13138556480407715, -0.09557962417602539, -0.05977368354797363, -0.023967742919921875, 0.011838197708129883, 0.04764413833618164, 0.0834500789642334, 0.11925601959228516, 0.15506196022033691, 0.19086790084838867, 0.22667384147644043, 0.2624797821044922, 0.29828572273254395, 0.3340916633605957, 0.36989760398864746, 0.4057035446166992, 0.441509485244751, 0.47731542587280273, 0.5131213665008545, 0.5489273071289062, 0.584733247756958, 0.6205391883850098, 0.6563451290130615, 0.6921510696411133, 0.727957010269165, 0.7637629508972168, 0.7995688915252686, 0.8353748321533203, 0.8711807727813721, 0.9069867134094238, 0.9427926540374756, 0.9785985946655273, 1.014404535293579, 1.0502104759216309, 1.0860164165496826]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 3.0, 6.0, 9.0, 6.0, 12.0, 19.0, 20.0, 27.0, 24.0, 26.0, 36.0, 41.0, 42.0, 46.0, 48.0, 48.0, 56.0, 47.0, 62.0, 44.0, 44.0, 47.0, 43.0, 40.0, 27.0, 39.0, 22.0, 28.0, 17.0, 15.0, 13.0, 11.0, 10.0, 5.0, 3.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.421875, -10.1119384765625, -9.802001953125, -9.4920654296875, -9.18212890625, -8.8721923828125, -8.562255859375, -8.2523193359375, -7.9423828125, -7.6324462890625, -7.322509765625, -7.0125732421875, -6.70263671875, -6.3927001953125, -6.082763671875, -5.7728271484375, -5.462890625, -5.1529541015625, -4.843017578125, -4.5330810546875, -4.22314453125, -3.9132080078125, -3.603271484375, -3.2933349609375, -2.9833984375, -2.6734619140625, -2.363525390625, -2.0535888671875, -1.74365234375, -1.4337158203125, -1.123779296875, -0.8138427734375, -0.50390625, -0.1939697265625, 0.115966796875, 0.4259033203125, 0.73583984375, 1.0457763671875, 1.355712890625, 1.6656494140625, 1.9755859375, 2.2855224609375, 2.595458984375, 2.9053955078125, 3.21533203125, 3.5252685546875, 3.835205078125, 4.1451416015625, 4.455078125, 4.7650146484375, 5.074951171875, 5.3848876953125, 5.69482421875, 6.0047607421875, 6.314697265625, 6.6246337890625, 6.9345703125, 7.2445068359375, 7.554443359375, 7.8643798828125, 8.17431640625, 8.4842529296875, 8.794189453125, 9.1041259765625, 9.4140625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 16.0, 20.0, 28.0, 49.0, 53.0, 119.0, 159.0, 274.0, 344.0, 579.0, 934.0, 1347.0, 2104.0, 3500.0, 5631.0, 10759.0, 32324.0, 197758.0, 611376.0, 133764.0, 24471.0, 9265.0, 5036.0, 3065.0, 1996.0, 1244.0, 822.0, 532.0, 364.0, 214.0, 140.0, 90.0, 69.0, 34.0, 29.0, 20.0, 5.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.625, -15.093505859375, -14.56201171875, -14.030517578125, -13.4990234375, -12.967529296875, -12.43603515625, -11.904541015625, -11.373046875, -10.841552734375, -10.31005859375, -9.778564453125, -9.2470703125, -8.715576171875, -8.18408203125, -7.652587890625, -7.12109375, -6.589599609375, -6.05810546875, -5.526611328125, -4.9951171875, -4.463623046875, -3.93212890625, -3.400634765625, -2.869140625, -2.337646484375, -1.80615234375, -1.274658203125, -0.7431640625, -0.211669921875, 0.31982421875, 0.851318359375, 1.3828125, 1.914306640625, 2.44580078125, 2.977294921875, 3.5087890625, 4.040283203125, 4.57177734375, 5.103271484375, 5.634765625, 6.166259765625, 6.69775390625, 7.229248046875, 7.7607421875, 8.292236328125, 8.82373046875, 9.355224609375, 9.88671875, 10.418212890625, 10.94970703125, 11.481201171875, 12.0126953125, 12.544189453125, 13.07568359375, 13.607177734375, 14.138671875, 14.670166015625, 15.20166015625, 15.733154296875, 16.2646484375, 16.796142578125, 17.32763671875, 17.859130859375, 18.390625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 8.0, 8.0, 16.0, 16.0, 17.0, 13.0, 32.0, 26.0, 29.0, 48.0, 35.0, 50.0, 46.0, 108.0, 161.0, 1406.0, 371.0, 154.0, 97.0, 65.0, 45.0, 41.0, 39.0, 38.0, 36.0, 21.0, 20.0, 18.0, 18.0, 8.0, 9.0, 14.0, 3.0, 8.0, 9.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.296875, -25.447265625, -24.59765625, -23.748046875, -22.8984375, -22.048828125, -21.19921875, -20.349609375, -19.5, -18.650390625, -17.80078125, -16.951171875, -16.1015625, -15.251953125, -14.40234375, -13.552734375, -12.703125, -11.853515625, -11.00390625, -10.154296875, -9.3046875, -8.455078125, -7.60546875, -6.755859375, -5.90625, -5.056640625, -4.20703125, -3.357421875, -2.5078125, -1.658203125, -0.80859375, 0.041015625, 0.890625, 1.740234375, 2.58984375, 3.439453125, 4.2890625, 5.138671875, 5.98828125, 6.837890625, 7.6875, 8.537109375, 9.38671875, 10.236328125, 11.0859375, 11.935546875, 12.78515625, 13.634765625, 14.484375, 15.333984375, 16.18359375, 17.033203125, 17.8828125, 18.732421875, 19.58203125, 20.431640625, 21.28125, 22.130859375, 22.98046875, 23.830078125, 24.6796875, 25.529296875, 26.37890625, 27.228515625, 28.078125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 9.0, 10.0, 11.0, 12.0, 20.0, 22.0, 22.0, 31.0, 42.0, 59.0, 92.0, 142.0, 239.0, 402.0, 763.0, 2594.0, 13121.0, 956657.0, 2148713.0, 17683.0, 3074.0, 881.0, 400.0, 236.0, 157.0, 89.0, 56.0, 35.0, 30.0, 21.0, 29.0, 8.0, 8.0, 8.0, 10.0, 5.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.0, -53.2294921875, -51.458984375, -49.6884765625, -47.91796875, -46.1474609375, -44.376953125, -42.6064453125, -40.8359375, -39.0654296875, -37.294921875, -35.5244140625, -33.75390625, -31.9833984375, -30.212890625, -28.4423828125, -26.671875, -24.9013671875, -23.130859375, -21.3603515625, -19.58984375, -17.8193359375, -16.048828125, -14.2783203125, -12.5078125, -10.7373046875, -8.966796875, -7.1962890625, -5.42578125, -3.6552734375, -1.884765625, -0.1142578125, 1.65625, 3.4267578125, 5.197265625, 6.9677734375, 8.73828125, 10.5087890625, 12.279296875, 14.0498046875, 15.8203125, 17.5908203125, 19.361328125, 21.1318359375, 22.90234375, 24.6728515625, 26.443359375, 28.2138671875, 29.984375, 31.7548828125, 33.525390625, 35.2958984375, 37.06640625, 38.8369140625, 40.607421875, 42.3779296875, 44.1484375, 45.9189453125, 47.689453125, 49.4599609375, 51.23046875, 53.0009765625, 54.771484375, 56.5419921875, 58.3125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 10.0, 147.0, 523.0, 305.0, 30.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.7033576965332, -31.894519805908203, -25.085683822631836, -18.27684783935547, -11.468009948730469, -4.659172058105469, 2.1496620178222656, 8.958499908447266, 15.767337799072266, 22.576175689697266, 29.385011672973633, 36.19384765625, 43.002685546875, 49.8115234375, 56.620357513427734, 63.429195404052734, 70.238037109375, 77.046875, 83.855712890625, 90.66455078125, 97.473388671875, 104.2822265625, 111.09105682373047, 117.89989471435547, 124.70872497558594, 131.51756286621094, 138.32640075683594, 145.13523864746094, 151.94407653808594, 158.75291442871094, 165.56173706054688, 172.37057495117188, 179.17941284179688, 185.98825073242188, 192.79708862304688, 199.60592651367188, 206.41476440429688, 213.22360229492188, 220.03244018554688, 226.84127807617188, 233.65011596679688, 240.45895385742188, 247.26779174804688, 254.07662963867188, 260.8854675292969, 267.6943054199219, 274.5031433105469, 281.3119812011719, 288.12078857421875, 294.92962646484375, 301.73846435546875, 308.54730224609375, 315.35614013671875, 322.16497802734375, 328.97381591796875, 335.78265380859375, 342.59149169921875, 349.40032958984375, 356.20916748046875, 363.01800537109375, 369.82684326171875, 376.63568115234375, 383.44451904296875, 390.25335693359375, 397.06219482421875]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 6.0, 3.0, 7.0, 8.0, 7.0, 14.0, 11.0, 15.0, 22.0, 20.0, 25.0, 21.0, 32.0, 22.0, 39.0, 38.0, 38.0, 39.0, 38.0, 39.0, 56.0, 47.0, 36.0, 39.0, 37.0, 39.0, 48.0, 26.0, 29.0, 27.0, 32.0, 20.0, 16.0, 24.0, 11.0, 12.0, 13.0, 11.0, 11.0, 9.0, 8.0, 3.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.15870666503906, -58.18632888793945, -56.213951110839844, -54.24156951904297, -52.26919174194336, -50.29681396484375, -48.32443618774414, -46.35205841064453, -44.379676818847656, -42.40729904174805, -40.43492126464844, -38.46253967285156, -36.49016189575195, -34.517784118652344, -32.545406341552734, -30.573028564453125, -28.600650787353516, -26.628273010253906, -24.655893325805664, -22.683515548706055, -20.711135864257812, -18.738758087158203, -16.766380310058594, -14.794001579284668, -12.821622848510742, -10.849244117736816, -8.87686538696289, -6.904487609863281, -4.9321088790893555, -2.9597301483154297, -0.9873523712158203, 0.9850263595581055, 2.9574050903320312, 4.929783821105957, 6.902162075042725, 8.874540328979492, 10.846919059753418, 12.819297790527344, 14.791675567626953, 16.764053344726562, 18.736433029174805, 20.708810806274414, 22.681190490722656, 24.653568267822266, 26.625946044921875, 28.598325729370117, 30.570703506469727, 32.54308319091797, 34.51546096801758, 36.48783874511719, 38.4602165222168, 40.432594299316406, 42.40497589111328, 44.37735366821289, 46.3497314453125, 48.32210922241211, 50.29448699951172, 52.26686477661133, 54.23924255371094, 56.21162414550781, 58.18400192260742, 60.15637969970703, 62.12875747680664, 64.10113525390625, 66.07351684570312]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 3.0, 9.0, 4.0, 8.0, 18.0, 20.0, 17.0, 18.0, 27.0, 28.0, 34.0, 42.0, 30.0, 58.0, 39.0, 59.0, 48.0, 45.0, 51.0, 36.0, 48.0, 56.0, 43.0, 37.0, 37.0, 25.0, 35.0, 22.0, 20.0, 11.0, 15.0, 11.0, 16.0, 6.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.8984375, -9.587646484375, -9.27685546875, -8.966064453125, -8.6552734375, -8.344482421875, -8.03369140625, -7.722900390625, -7.412109375, -7.101318359375, -6.79052734375, -6.479736328125, -6.1689453125, -5.858154296875, -5.54736328125, -5.236572265625, -4.92578125, -4.614990234375, -4.30419921875, -3.993408203125, -3.6826171875, -3.371826171875, -3.06103515625, -2.750244140625, -2.439453125, -2.128662109375, -1.81787109375, -1.507080078125, -1.1962890625, -0.885498046875, -0.57470703125, -0.263916015625, 0.046875, 0.357666015625, 0.66845703125, 0.979248046875, 1.2900390625, 1.600830078125, 1.91162109375, 2.222412109375, 2.533203125, 2.843994140625, 3.15478515625, 3.465576171875, 3.7763671875, 4.087158203125, 4.39794921875, 4.708740234375, 5.01953125, 5.330322265625, 5.64111328125, 5.951904296875, 6.2626953125, 6.573486328125, 6.88427734375, 7.195068359375, 7.505859375, 7.816650390625, 8.12744140625, 8.438232421875, 8.7490234375, 9.059814453125, 9.37060546875, 9.681396484375, 9.9921875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 4.0, 7.0, 12.0, 10.0, 18.0, 21.0, 32.0, 47.0, 65.0, 93.0, 152.0, 232.0, 339.0, 511.0, 901.0, 1487.0, 2802.0, 5272.0, 11846.0, 33051.0, 151969.0, 1341735.0, 2265004.0, 297868.0, 49732.0, 16099.0, 6781.0, 3340.0, 1885.0, 1012.0, 657.0, 426.0, 290.0, 179.0, 116.0, 81.0, 54.0, 44.0, 29.0, 22.0, 16.0, 9.0, 10.0, 9.0, 3.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.765625, -19.087890625, -18.41015625, -17.732421875, -17.0546875, -16.376953125, -15.69921875, -15.021484375, -14.34375, -13.666015625, -12.98828125, -12.310546875, -11.6328125, -10.955078125, -10.27734375, -9.599609375, -8.921875, -8.244140625, -7.56640625, -6.888671875, -6.2109375, -5.533203125, -4.85546875, -4.177734375, -3.5, -2.822265625, -2.14453125, -1.466796875, -0.7890625, -0.111328125, 0.56640625, 1.244140625, 1.921875, 2.599609375, 3.27734375, 3.955078125, 4.6328125, 5.310546875, 5.98828125, 6.666015625, 7.34375, 8.021484375, 8.69921875, 9.376953125, 10.0546875, 10.732421875, 11.41015625, 12.087890625, 12.765625, 13.443359375, 14.12109375, 14.798828125, 15.4765625, 16.154296875, 16.83203125, 17.509765625, 18.1875, 18.865234375, 19.54296875, 20.220703125, 20.8984375, 21.576171875, 22.25390625, 22.931640625, 23.609375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 10.0, 1.0, 7.0, 12.0, 14.0, 16.0, 24.0, 34.0, 40.0, 41.0, 65.0, 78.0, 115.0, 144.0, 223.0, 335.0, 433.0, 484.0, 493.0, 403.0, 289.0, 215.0, 153.0, 116.0, 75.0, 60.0, 43.0, 27.0, 31.0, 27.0, 14.0, 6.0, 15.0, 3.0, 4.0, 2.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5625, -15.04052734375, -14.5185546875, -13.99658203125, -13.474609375, -12.95263671875, -12.4306640625, -11.90869140625, -11.38671875, -10.86474609375, -10.3427734375, -9.82080078125, -9.298828125, -8.77685546875, -8.2548828125, -7.73291015625, -7.2109375, -6.68896484375, -6.1669921875, -5.64501953125, -5.123046875, -4.60107421875, -4.0791015625, -3.55712890625, -3.03515625, -2.51318359375, -1.9912109375, -1.46923828125, -0.947265625, -0.42529296875, 0.0966796875, 0.61865234375, 1.140625, 1.66259765625, 2.1845703125, 2.70654296875, 3.228515625, 3.75048828125, 4.2724609375, 4.79443359375, 5.31640625, 5.83837890625, 6.3603515625, 6.88232421875, 7.404296875, 7.92626953125, 8.4482421875, 8.97021484375, 9.4921875, 10.01416015625, 10.5361328125, 11.05810546875, 11.580078125, 12.10205078125, 12.6240234375, 13.14599609375, 13.66796875, 14.18994140625, 14.7119140625, 15.23388671875, 15.755859375, 16.27783203125, 16.7998046875, 17.32177734375, 17.84375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 6.0, 8.0, 13.0, 16.0, 16.0, 23.0, 33.0, 59.0, 87.0, 117.0, 191.0, 454.0, 1567.0, 9147.0, 147143.0, 3860130.0, 163106.0, 9610.0, 1540.0, 422.0, 193.0, 132.0, 74.0, 45.0, 40.0, 25.0, 22.0, 20.0, 14.0, 12.0, 8.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.3125, -74.9345703125, -72.556640625, -70.1787109375, -67.80078125, -65.4228515625, -63.044921875, -60.6669921875, -58.2890625, -55.9111328125, -53.533203125, -51.1552734375, -48.77734375, -46.3994140625, -44.021484375, -41.6435546875, -39.265625, -36.8876953125, -34.509765625, -32.1318359375, -29.75390625, -27.3759765625, -24.998046875, -22.6201171875, -20.2421875, -17.8642578125, -15.486328125, -13.1083984375, -10.73046875, -8.3525390625, -5.974609375, -3.5966796875, -1.21875, 1.1591796875, 3.537109375, 5.9150390625, 8.29296875, 10.6708984375, 13.048828125, 15.4267578125, 17.8046875, 20.1826171875, 22.560546875, 24.9384765625, 27.31640625, 29.6943359375, 32.072265625, 34.4501953125, 36.828125, 39.2060546875, 41.583984375, 43.9619140625, 46.33984375, 48.7177734375, 51.095703125, 53.4736328125, 55.8515625, 58.2294921875, 60.607421875, 62.9853515625, 65.36328125, 67.7412109375, 70.119140625, 72.4970703125, 74.875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 16.0, 25.0, 39.0, 53.0, 88.0, 123.0, 160.0, 135.0, 128.0, 101.0, 67.0, 38.0, 13.0, 10.0, 11.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.6884994506836, -81.61717224121094, -77.54585266113281, -73.47452545166016, -69.40320587158203, -65.33187866210938, -61.260555267333984, -57.189231872558594, -53.1179084777832, -49.04658508300781, -44.97526168823242, -40.90393829345703, -36.832611083984375, -32.76129150390625, -28.689964294433594, -24.618640899658203, -20.547317504882812, -16.475994110107422, -12.404669761657715, -8.333345413208008, -4.262022018432617, -0.19069862365722656, 3.880626678466797, 7.9519500732421875, 12.023273468017578, 16.09459686279297, 20.16592025756836, 24.237245559692383, 28.308568954467773, 32.37989044189453, 36.45121765136719, 40.52254104614258, 44.59385681152344, 48.66518020629883, 52.73650360107422, 56.807830810546875, 60.879150390625, 64.95047760009766, 69.02180480957031, 73.09312438964844, 77.16444396972656, 81.23577117919922, 85.30709075927734, 89.37841796875, 93.44973754882812, 97.52106475830078, 101.59239196777344, 105.66371154785156, 109.73503875732422, 113.80636596679688, 117.877685546875, 121.94901275634766, 126.02033233642578, 130.09165954589844, 134.16297912597656, 138.23431396484375, 142.30563354492188, 146.376953125, 150.4482879638672, 154.5196075439453, 158.59092712402344, 162.66224670410156, 166.73358154296875, 170.80490112304688, 174.876220703125]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 3.0, 4.0, 2.0, 6.0, 4.0, 8.0, 9.0, 12.0, 15.0, 24.0, 13.0, 13.0, 30.0, 28.0, 30.0, 31.0, 34.0, 38.0, 34.0, 38.0, 40.0, 38.0, 55.0, 45.0, 38.0, 48.0, 35.0, 38.0, 28.0, 29.0, 35.0, 17.0, 24.0, 36.0, 21.0, 16.0, 17.0, 13.0, 14.0, 11.0, 7.0, 5.0, 4.0, 1.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.67112731933594, -46.95042419433594, -45.22972106933594, -43.50901794433594, -41.78831481933594, -40.06761169433594, -38.34690856933594, -36.62620544433594, -34.90550231933594, -33.18479919433594, -31.464096069335938, -29.743392944335938, -28.022689819335938, -26.301986694335938, -24.581283569335938, -22.860580444335938, -21.139875411987305, -19.419172286987305, -17.698469161987305, -15.977766036987305, -14.257062911987305, -12.536358833312988, -10.815655708312988, -9.094952583312988, -7.374249458312988, -5.653546333312988, -3.932842969894409, -2.21213960647583, -0.4914364814758301, 1.2292671203613281, 2.949970245361328, 4.670673370361328, 6.391376495361328, 8.112079620361328, 9.832782745361328, 11.553485870361328, 13.274188995361328, 14.994893074035645, 16.715595245361328, 18.436298370361328, 20.157001495361328, 21.877704620361328, 23.598407745361328, 25.319110870361328, 27.039813995361328, 28.760517120361328, 30.481220245361328, 32.20192337036133, 33.922630310058594, 35.643333435058594, 37.364036560058594, 39.084739685058594, 40.805442810058594, 42.526145935058594, 44.246849060058594, 45.967552185058594, 47.688255310058594, 49.408958435058594, 51.129661560058594, 52.850364685058594, 54.571067810058594, 56.291770935058594, 58.012474060058594, 59.733177185058594, 61.453880310058594]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 4.0, 1.0, 12.0, 9.0, 12.0, 21.0, 26.0, 26.0, 27.0, 34.0, 42.0, 50.0, 40.0, 57.0, 54.0, 60.0, 41.0, 55.0, 45.0, 47.0, 53.0, 38.0, 42.0, 36.0, 33.0, 28.0, 26.0, 19.0, 13.0, 13.0, 12.0, 8.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.5546875, -11.2218017578125, -10.888916015625, -10.5560302734375, -10.22314453125, -9.8902587890625, -9.557373046875, -9.2244873046875, -8.8916015625, -8.5587158203125, -8.225830078125, -7.8929443359375, -7.56005859375, -7.2271728515625, -6.894287109375, -6.5614013671875, -6.228515625, -5.8956298828125, -5.562744140625, -5.2298583984375, -4.89697265625, -4.5640869140625, -4.231201171875, -3.8983154296875, -3.5654296875, -3.2325439453125, -2.899658203125, -2.5667724609375, -2.23388671875, -1.9010009765625, -1.568115234375, -1.2352294921875, -0.90234375, -0.5694580078125, -0.236572265625, 0.0963134765625, 0.42919921875, 0.7620849609375, 1.094970703125, 1.4278564453125, 1.7607421875, 2.0936279296875, 2.426513671875, 2.7593994140625, 3.09228515625, 3.4251708984375, 3.758056640625, 4.0909423828125, 4.423828125, 4.7567138671875, 5.089599609375, 5.4224853515625, 5.75537109375, 6.0882568359375, 6.421142578125, 6.7540283203125, 7.0869140625, 7.4197998046875, 7.752685546875, 8.0855712890625, 8.41845703125, 8.7513427734375, 9.084228515625, 9.4171142578125, 9.75]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 8.0, 13.0, 32.0, 34.0, 41.0, 62.0, 105.0, 168.0, 223.0, 399.0, 669.0, 1123.0, 1915.0, 3423.0, 6355.0, 11448.0, 21975.0, 43198.0, 91308.0, 194536.0, 300244.0, 192097.0, 89655.0, 42533.0, 21388.0, 11416.0, 6041.0, 3279.0, 1964.0, 1141.0, 638.0, 391.0, 260.0, 165.0, 95.0, 60.0, 43.0, 27.0, 24.0, 16.0, 15.0, 7.0, 3.0, 8.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6640625, -1.6094818115234375, -1.554901123046875, -1.5003204345703125, -1.44573974609375, -1.3911590576171875, -1.336578369140625, -1.2819976806640625, -1.2274169921875, -1.1728363037109375, -1.118255615234375, -1.0636749267578125, -1.00909423828125, -0.9545135498046875, -0.899932861328125, -0.8453521728515625, -0.790771484375, -0.7361907958984375, -0.681610107421875, -0.6270294189453125, -0.57244873046875, -0.5178680419921875, -0.463287353515625, -0.4087066650390625, -0.3541259765625, -0.2995452880859375, -0.244964599609375, -0.1903839111328125, -0.13580322265625, -0.0812225341796875, -0.026641845703125, 0.0279388427734375, 0.08251953125, 0.1371002197265625, 0.191680908203125, 0.2462615966796875, 0.30084228515625, 0.3554229736328125, 0.410003662109375, 0.4645843505859375, 0.5191650390625, 0.5737457275390625, 0.628326416015625, 0.6829071044921875, 0.73748779296875, 0.7920684814453125, 0.846649169921875, 0.9012298583984375, 0.955810546875, 1.0103912353515625, 1.064971923828125, 1.1195526123046875, 1.17413330078125, 1.2287139892578125, 1.283294677734375, 1.3378753662109375, 1.3924560546875, 1.4470367431640625, 1.501617431640625, 1.5561981201171875, 1.61077880859375, 1.6653594970703125, 1.719940185546875, 1.7745208740234375, 1.8291015625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 2.0, 6.0, 9.0, 12.0, 11.0, 14.0, 13.0, 14.0, 14.0, 18.0, 15.0, 20.0, 32.0, 32.0, 29.0, 41.0, 43.0, 50.0, 54.0, 55.0, 1066.0, 36.0, 35.0, 32.0, 19.0, 45.0, 30.0, 42.0, 27.0, 35.0, 26.0, 20.0, 14.0, 10.0, 26.0, 15.0, 14.0, 13.0, 8.0, 6.0, 6.0, 4.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0, -4.8206787109375, -4.641357421875, -4.4620361328125, -4.28271484375, -4.1033935546875, -3.924072265625, -3.7447509765625, -3.5654296875, -3.3861083984375, -3.206787109375, -3.0274658203125, -2.84814453125, -2.6688232421875, -2.489501953125, -2.3101806640625, -2.130859375, -1.9515380859375, -1.772216796875, -1.5928955078125, -1.41357421875, -1.2342529296875, -1.054931640625, -0.8756103515625, -0.6962890625, -0.5169677734375, -0.337646484375, -0.1583251953125, 0.02099609375, 0.2003173828125, 0.379638671875, 0.5589599609375, 0.73828125, 0.9176025390625, 1.096923828125, 1.2762451171875, 1.45556640625, 1.6348876953125, 1.814208984375, 1.9935302734375, 2.1728515625, 2.3521728515625, 2.531494140625, 2.7108154296875, 2.89013671875, 3.0694580078125, 3.248779296875, 3.4281005859375, 3.607421875, 3.7867431640625, 3.966064453125, 4.1453857421875, 4.32470703125, 4.5040283203125, 4.683349609375, 4.8626708984375, 5.0419921875, 5.2213134765625, 5.400634765625, 5.5799560546875, 5.75927734375, 5.9385986328125, 6.117919921875, 6.2972412109375, 6.4765625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 3.0, 7.0, 9.0, 18.0, 9.0, 26.0, 26.0, 32.0, 55.0, 59.0, 110.0, 140.0, 230.0, 368.0, 641.0, 1192.0, 2149.0, 3876.0, 7435.0, 14397.0, 29482.0, 60961.0, 131054.0, 676123.0, 912576.0, 133519.0, 61493.0, 29955.0, 14695.0, 7575.0, 3918.0, 2075.0, 1152.0, 631.0, 387.0, 225.0, 167.0, 90.0, 74.0, 60.0, 29.0, 27.0, 17.0, 11.0, 14.0, 9.0, 5.0, 7.0, 8.0, 6.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.77392578125, -0.7497482299804688, -0.7255706787109375, -0.7013931274414062, -0.677215576171875, -0.6530380249023438, -0.6288604736328125, -0.6046829223632812, -0.58050537109375, -0.5563278198242188, -0.5321502685546875, -0.5079727172851562, -0.483795166015625, -0.45961761474609375, -0.4354400634765625, -0.41126251220703125, -0.3870849609375, -0.36290740966796875, -0.3387298583984375, -0.31455230712890625, -0.290374755859375, -0.26619720458984375, -0.2420196533203125, -0.21784210205078125, -0.19366455078125, -0.16948699951171875, -0.1453094482421875, -0.12113189697265625, -0.096954345703125, -0.07277679443359375, -0.0485992431640625, -0.02442169189453125, -0.000244140625, 0.02393341064453125, 0.0481109619140625, 0.07228851318359375, 0.096466064453125, 0.12064361572265625, 0.1448211669921875, 0.16899871826171875, 0.19317626953125, 0.21735382080078125, 0.2415313720703125, 0.26570892333984375, 0.289886474609375, 0.31406402587890625, 0.3382415771484375, 0.36241912841796875, 0.3865966796875, 0.41077423095703125, 0.4349517822265625, 0.45912933349609375, 0.483306884765625, 0.5074844360351562, 0.5316619873046875, 0.5558395385742188, 0.58001708984375, 0.6041946411132812, 0.6283721923828125, 0.6525497436523438, 0.676727294921875, 0.7009048461914062, 0.7250823974609375, 0.7492599487304688, 0.7734375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 5.0, 5.0, 1.0, 3.0, 1.0, 5.0, 7.0, 11.0, 14.0, 14.0, 18.0, 11.0, 12.0, 16.0, 15.0, 23.0, 47.0, 76.0, 142.0, 214.0, 117.0, 52.0, 33.0, 32.0, 12.0, 16.0, 15.0, 16.0, 10.0, 3.0, 14.0, 8.0, 7.0, 7.0, 6.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 6.0, 0.0, 0.0, 1.0], "bins": [-0.23095703125, -0.22475433349609375, -0.2185516357421875, -0.21234893798828125, -0.206146240234375, -0.19994354248046875, -0.1937408447265625, -0.18753814697265625, -0.18133544921875, -0.17513275146484375, -0.1689300537109375, -0.16272735595703125, -0.156524658203125, -0.15032196044921875, -0.1441192626953125, -0.13791656494140625, -0.1317138671875, -0.12551116943359375, -0.1193084716796875, -0.11310577392578125, -0.106903076171875, -0.10070037841796875, -0.0944976806640625, -0.08829498291015625, -0.08209228515625, -0.07588958740234375, -0.0696868896484375, -0.06348419189453125, -0.057281494140625, -0.05107879638671875, -0.0448760986328125, -0.03867340087890625, -0.032470703125, -0.02626800537109375, -0.0200653076171875, -0.01386260986328125, -0.007659912109375, -0.00145721435546875, 0.0047454833984375, 0.01094818115234375, 0.01715087890625, 0.02335357666015625, 0.0295562744140625, 0.03575897216796875, 0.041961669921875, 0.04816436767578125, 0.0543670654296875, 0.06056976318359375, 0.0667724609375, 0.07297515869140625, 0.0791778564453125, 0.08538055419921875, 0.091583251953125, 0.09778594970703125, 0.1039886474609375, 0.11019134521484375, 0.11639404296875, 0.12259674072265625, 0.1287994384765625, 0.13500213623046875, 0.141204833984375, 0.14740753173828125, 0.1536102294921875, 0.15981292724609375, 0.166015625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 2.0, 5.0, 5.0, 7.0, 13.0, 8.0, 7.0, 8.0, 21.0, 22.0, 29.0, 30.0, 78.0, 117.0, 401.0, 4078.0, 1003663.0, 38594.0, 933.0, 227.0, 98.0, 45.0, 22.0, 19.0, 19.0, 18.0, 12.0, 19.0, 11.0, 9.0, 3.0, 4.0, 2.0, 1.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.619140625, -3.483917236328125, -3.34869384765625, -3.213470458984375, -3.0782470703125, -2.943023681640625, -2.80780029296875, -2.672576904296875, -2.537353515625, -2.402130126953125, -2.26690673828125, -2.131683349609375, -1.9964599609375, -1.861236572265625, -1.72601318359375, -1.590789794921875, -1.45556640625, -1.320343017578125, -1.18511962890625, -1.049896240234375, -0.9146728515625, -0.779449462890625, -0.64422607421875, -0.509002685546875, -0.373779296875, -0.238555908203125, -0.10333251953125, 0.031890869140625, 0.1671142578125, 0.302337646484375, 0.43756103515625, 0.572784423828125, 0.7080078125, 0.843231201171875, 0.97845458984375, 1.113677978515625, 1.2489013671875, 1.384124755859375, 1.51934814453125, 1.654571533203125, 1.789794921875, 1.925018310546875, 2.06024169921875, 2.195465087890625, 2.3306884765625, 2.465911865234375, 2.60113525390625, 2.736358642578125, 2.87158203125, 3.006805419921875, 3.14202880859375, 3.277252197265625, 3.4124755859375, 3.547698974609375, 3.68292236328125, 3.818145751953125, 3.953369140625, 4.088592529296875, 4.22381591796875, 4.359039306640625, 4.4942626953125, 4.629486083984375, 4.76470947265625, 4.899932861328125, 5.03515625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 7.0, 9.0, 10.0, 14.0, 26.0, 61.0, 90.0, 214.0, 323.0, 117.0, 56.0, 44.0, 16.0, 4.0, 6.0, 3.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38207873702049255, -0.3506269156932831, -0.3191750943660736, -0.28772324323654175, -0.2562714219093323, -0.224819615483284, -0.19336777925491333, -0.16191595792770386, -0.13046413660049438, -0.09901231527328491, -0.06756048649549484, -0.03610865771770477, -0.0046568363904953, 0.026794984936714172, 0.05824682116508484, 0.08969864249229431, 0.12115046381950378, 0.15260228514671326, 0.18405410647392273, 0.2155059427022934, 0.24695776402950287, 0.27840960025787354, 0.309861421585083, 0.3413132429122925, 0.37276506423950195, 0.4042168855667114, 0.4356687068939209, 0.46712052822113037, 0.49857234954833984, 0.5300241708755493, 0.5614759922027588, 0.5929278135299683, 0.6243796348571777, 0.6558314561843872, 0.6872832775115967, 0.7187350988388062, 0.7501869201660156, 0.7816387414932251, 0.8130905628204346, 0.844542384147644, 0.8759942054748535, 0.907446026802063, 0.9388978481292725, 0.9703496694564819, 1.0018014907836914, 1.0332533121109009, 1.0647051334381104, 1.0961569547653198, 1.1276087760925293, 1.1590605974197388, 1.1905124187469482, 1.2219642400741577, 1.2534160614013672, 1.2848678827285767, 1.3163197040557861, 1.3477715253829956, 1.3792234659194946, 1.410675287246704, 1.4421271085739136, 1.473578929901123, 1.5050307512283325, 1.536482572555542, 1.5679343938827515, 1.599386215209961, 1.6308380365371704]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 1.0, 7.0, 1.0, 7.0, 6.0, 8.0, 10.0, 12.0, 11.0, 12.0, 20.0, 21.0, 27.0, 29.0, 32.0, 36.0, 34.0, 33.0, 40.0, 32.0, 46.0, 51.0, 34.0, 34.0, 34.0, 32.0, 30.0, 33.0, 34.0, 41.0, 44.0, 40.0, 31.0, 14.0, 19.0, 20.0, 10.0, 11.0, 12.0, 12.0, 13.0, 6.0, 5.0, 4.0, 7.0, 2.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5377938747406006, -0.5203893780708313, -0.5029848217964172, -0.48558032512664795, -0.4681757986545563, -0.4507712721824646, -0.4333667755126953, -0.41596224904060364, -0.39855772256851196, -0.3811531960964203, -0.3637486696243286, -0.3463441729545593, -0.32893964648246765, -0.311535120010376, -0.2941306233406067, -0.276726096868515, -0.25932157039642334, -0.24191704392433167, -0.22451253235340118, -0.2071080207824707, -0.18970349431037903, -0.17229896783828735, -0.15489445626735687, -0.1374899446964264, -0.12008541822433472, -0.10268089920282364, -0.08527638018131256, -0.06787186115980148, -0.050467342138290405, -0.03306282311677933, -0.01565830409526825, 0.0017462149262428284, 0.019150733947753906, 0.036555252969264984, 0.05395977199077606, 0.07136429101228714, 0.08876881003379822, 0.1061733290553093, 0.12357784807682037, 0.14098235964775085, 0.15838688611984253, 0.1757914125919342, 0.19319592416286469, 0.21060043573379517, 0.22800496220588684, 0.24540948867797852, 0.2628139853477478, 0.2802185118198395, 0.29762303829193115, 0.3150275647640228, 0.3324320912361145, 0.3498365879058838, 0.36724111437797546, 0.38464564085006714, 0.4020501375198364, 0.4194546639919281, 0.4368591904640198, 0.45426371693611145, 0.4716682434082031, 0.4890727400779724, 0.5064772367477417, 0.5238817930221558, 0.541286289691925, 0.5586908459663391, 0.5760953426361084]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 4.0, 2.0, 12.0, 9.0, 11.0, 21.0, 24.0, 27.0, 28.0, 35.0, 42.0, 46.0, 43.0, 57.0, 51.0, 62.0, 39.0, 58.0, 43.0, 48.0, 51.0, 39.0, 45.0, 35.0, 32.0, 28.0, 26.0, 21.0, 12.0, 13.0, 10.0, 10.0, 5.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.546875, -11.21435546875, -10.8818359375, -10.54931640625, -10.216796875, -9.88427734375, -9.5517578125, -9.21923828125, -8.88671875, -8.55419921875, -8.2216796875, -7.88916015625, -7.556640625, -7.22412109375, -6.8916015625, -6.55908203125, -6.2265625, -5.89404296875, -5.5615234375, -5.22900390625, -4.896484375, -4.56396484375, -4.2314453125, -3.89892578125, -3.56640625, -3.23388671875, -2.9013671875, -2.56884765625, -2.236328125, -1.90380859375, -1.5712890625, -1.23876953125, -0.90625, -0.57373046875, -0.2412109375, 0.09130859375, 0.423828125, 0.75634765625, 1.0888671875, 1.42138671875, 1.75390625, 2.08642578125, 2.4189453125, 2.75146484375, 3.083984375, 3.41650390625, 3.7490234375, 4.08154296875, 4.4140625, 4.74658203125, 5.0791015625, 5.41162109375, 5.744140625, 6.07666015625, 6.4091796875, 6.74169921875, 7.07421875, 7.40673828125, 7.7392578125, 8.07177734375, 8.404296875, 8.73681640625, 9.0693359375, 9.40185546875, 9.734375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 4.0, 13.0, 12.0, 18.0, 39.0, 46.0, 96.0, 119.0, 229.0, 370.0, 563.0, 1080.0, 1833.0, 3613.0, 7360.0, 15586.0, 34396.0, 85416.0, 245198.0, 398085.0, 151816.0, 56172.0, 23726.0, 11118.0, 5434.0, 2700.0, 1473.0, 798.0, 433.0, 295.0, 187.0, 106.0, 72.0, 44.0, 36.0, 17.0, 13.0, 9.0, 13.0, 8.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.38671875, -7.10565185546875, -6.8245849609375, -6.54351806640625, -6.262451171875, -5.98138427734375, -5.7003173828125, -5.41925048828125, -5.13818359375, -4.85711669921875, -4.5760498046875, -4.29498291015625, -4.013916015625, -3.73284912109375, -3.4517822265625, -3.17071533203125, -2.8896484375, -2.60858154296875, -2.3275146484375, -2.04644775390625, -1.765380859375, -1.48431396484375, -1.2032470703125, -0.92218017578125, -0.64111328125, -0.36004638671875, -0.0789794921875, 0.20208740234375, 0.483154296875, 0.76422119140625, 1.0452880859375, 1.32635498046875, 1.607421875, 1.88848876953125, 2.1695556640625, 2.45062255859375, 2.731689453125, 3.01275634765625, 3.2938232421875, 3.57489013671875, 3.85595703125, 4.13702392578125, 4.4180908203125, 4.69915771484375, 4.980224609375, 5.26129150390625, 5.5423583984375, 5.82342529296875, 6.1044921875, 6.38555908203125, 6.6666259765625, 6.94769287109375, 7.228759765625, 7.50982666015625, 7.7908935546875, 8.07196044921875, 8.35302734375, 8.63409423828125, 8.9151611328125, 9.19622802734375, 9.477294921875, 9.75836181640625, 10.0394287109375, 10.32049560546875, 10.6015625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 3.0, 4.0, 8.0, 7.0, 7.0, 17.0, 18.0, 20.0, 19.0, 32.0, 29.0, 36.0, 29.0, 42.0, 37.0, 48.0, 61.0, 118.0, 289.0, 1513.0, 213.0, 80.0, 67.0, 46.0, 43.0, 34.0, 34.0, 23.0, 36.0, 26.0, 19.0, 16.0, 18.0, 13.0, 14.0, 9.0, 4.0, 6.0, 1.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-30.65625, -29.787109375, -28.91796875, -28.048828125, -27.1796875, -26.310546875, -25.44140625, -24.572265625, -23.703125, -22.833984375, -21.96484375, -21.095703125, -20.2265625, -19.357421875, -18.48828125, -17.619140625, -16.75, -15.880859375, -15.01171875, -14.142578125, -13.2734375, -12.404296875, -11.53515625, -10.666015625, -9.796875, -8.927734375, -8.05859375, -7.189453125, -6.3203125, -5.451171875, -4.58203125, -3.712890625, -2.84375, -1.974609375, -1.10546875, -0.236328125, 0.6328125, 1.501953125, 2.37109375, 3.240234375, 4.109375, 4.978515625, 5.84765625, 6.716796875, 7.5859375, 8.455078125, 9.32421875, 10.193359375, 11.0625, 11.931640625, 12.80078125, 13.669921875, 14.5390625, 15.408203125, 16.27734375, 17.146484375, 18.015625, 18.884765625, 19.75390625, 20.623046875, 21.4921875, 22.361328125, 23.23046875, 24.099609375, 24.96875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 5.0, 9.0, 11.0, 16.0, 24.0, 26.0, 26.0, 35.0, 48.0, 70.0, 82.0, 117.0, 160.0, 245.0, 426.0, 1491.0, 26562.0, 3017932.0, 94564.0, 2381.0, 484.0, 267.0, 190.0, 136.0, 88.0, 80.0, 56.0, 40.0, 26.0, 30.0, 21.0, 14.0, 8.0, 9.0, 5.0, 2.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.53125, -53.59130859375, -51.6513671875, -49.71142578125, -47.771484375, -45.83154296875, -43.8916015625, -41.95166015625, -40.01171875, -38.07177734375, -36.1318359375, -34.19189453125, -32.251953125, -30.31201171875, -28.3720703125, -26.43212890625, -24.4921875, -22.55224609375, -20.6123046875, -18.67236328125, -16.732421875, -14.79248046875, -12.8525390625, -10.91259765625, -8.97265625, -7.03271484375, -5.0927734375, -3.15283203125, -1.212890625, 0.72705078125, 2.6669921875, 4.60693359375, 6.546875, 8.48681640625, 10.4267578125, 12.36669921875, 14.306640625, 16.24658203125, 18.1865234375, 20.12646484375, 22.06640625, 24.00634765625, 25.9462890625, 27.88623046875, 29.826171875, 31.76611328125, 33.7060546875, 35.64599609375, 37.5859375, 39.52587890625, 41.4658203125, 43.40576171875, 45.345703125, 47.28564453125, 49.2255859375, 51.16552734375, 53.10546875, 55.04541015625, 56.9853515625, 58.92529296875, 60.865234375, 62.80517578125, 64.7451171875, 66.68505859375, 68.625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 6.0, 25.0, 95.0, 261.0, 265.0, 204.0, 105.0, 39.0, 9.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-120.59603881835938, -117.69630432128906, -114.79656982421875, -111.89683532714844, -108.99710845947266, -106.09737396240234, -103.19763946533203, -100.29790496826172, -97.39817810058594, -94.49844360351562, -91.59870910644531, -88.698974609375, -85.79924774169922, -82.8995132446289, -79.9997787475586, -77.10004425048828, -74.20030975341797, -71.30057525634766, -68.40084075927734, -65.50111389160156, -62.60137939453125, -59.70164489746094, -56.801910400390625, -53.90217590332031, -51.002445220947266, -48.10271072387695, -45.202980041503906, -42.303245544433594, -39.40351104736328, -36.503780364990234, -33.60404586791992, -30.704313278198242, -27.80457305908203, -24.90484046936035, -22.005107879638672, -19.10537338256836, -16.20564079284668, -13.305908203125, -10.406173706054688, -7.506441116333008, -4.606708526611328, -1.7069754600524902, 1.1927576065063477, 4.092491149902344, 6.992223739624023, 9.891956329345703, 12.791690826416016, 15.691423416137695, 18.591156005859375, 21.490888595581055, 24.390621185302734, 27.290355682373047, 30.190088272094727, 33.089820861816406, 35.98955535888672, 38.88928985595703, 41.78902053833008, 44.68875503540039, 47.58848571777344, 50.48822021484375, 53.38795471191406, 56.28768539428711, 59.18741989135742, 62.08715057373047, 64.98688507080078]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 6.0, 7.0, 7.0, 8.0, 11.0, 19.0, 19.0, 25.0, 22.0, 23.0, 27.0, 26.0, 25.0, 42.0, 42.0, 41.0, 39.0, 41.0, 41.0, 30.0, 37.0, 44.0, 42.0, 45.0, 37.0, 47.0, 34.0, 35.0, 20.0, 26.0, 22.0, 20.0, 21.0, 13.0, 12.0, 14.0, 5.0, 7.0, 2.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.1614761352539, -67.1134262084961, -65.06536865234375, -63.01731872558594, -60.969268798828125, -58.92121505737305, -56.87316131591797, -54.825111389160156, -52.77705764770508, -50.72900390625, -48.68095397949219, -46.63290023803711, -44.58484649658203, -42.53679656982422, -40.48874282836914, -38.44068908691406, -36.39263916015625, -34.34458541870117, -32.29653549194336, -30.24848175048828, -28.200429916381836, -26.15237808227539, -24.104324340820312, -22.056272506713867, -20.008220672607422, -17.960168838500977, -15.912116050720215, -13.864063262939453, -11.816011428833008, -9.767959594726562, -7.719906806945801, -5.671854019165039, -3.623798370361328, -1.5757460594177246, 0.4723062515258789, 2.5203585624694824, 4.568410873413086, 6.616462707519531, 8.664515495300293, 10.712568283081055, 12.7606201171875, 14.808671951293945, 16.85672378540039, 18.90477752685547, 20.952829360961914, 23.00088119506836, 25.048934936523438, 27.096986770629883, 29.145038604736328, 31.193090438842773, 33.24114227294922, 35.2891960144043, 37.337249755859375, 39.38529968261719, 41.433353424072266, 43.481407165527344, 45.529457092285156, 47.577510833740234, 49.62556076049805, 51.673614501953125, 53.72166442871094, 55.769718170166016, 57.817771911621094, 59.865821838378906, 61.913875579833984]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 5.0, 7.0, 8.0, 4.0, 24.0, 25.0, 27.0, 25.0, 26.0, 45.0, 45.0, 40.0, 46.0, 40.0, 61.0, 51.0, 62.0, 48.0, 49.0, 36.0, 49.0, 34.0, 52.0, 24.0, 28.0, 23.0, 20.0, 22.0, 18.0, 13.0, 11.0, 8.0, 6.0, 6.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.671875, -11.3409423828125, -11.010009765625, -10.6790771484375, -10.34814453125, -10.0172119140625, -9.686279296875, -9.3553466796875, -9.0244140625, -8.6934814453125, -8.362548828125, -8.0316162109375, -7.70068359375, -7.3697509765625, -7.038818359375, -6.7078857421875, -6.376953125, -6.0460205078125, -5.715087890625, -5.3841552734375, -5.05322265625, -4.7222900390625, -4.391357421875, -4.0604248046875, -3.7294921875, -3.3985595703125, -3.067626953125, -2.7366943359375, -2.40576171875, -2.0748291015625, -1.743896484375, -1.4129638671875, -1.08203125, -0.7510986328125, -0.420166015625, -0.0892333984375, 0.24169921875, 0.5726318359375, 0.903564453125, 1.2344970703125, 1.5654296875, 1.8963623046875, 2.227294921875, 2.5582275390625, 2.88916015625, 3.2200927734375, 3.551025390625, 3.8819580078125, 4.212890625, 4.5438232421875, 4.874755859375, 5.2056884765625, 5.53662109375, 5.8675537109375, 6.198486328125, 6.5294189453125, 6.8603515625, 7.1912841796875, 7.522216796875, 7.8531494140625, 8.18408203125, 8.5150146484375, 8.845947265625, 9.1768798828125, 9.5078125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 6.0, 9.0, 7.0, 4.0, 15.0, 22.0, 24.0, 40.0, 57.0, 64.0, 114.0, 139.0, 200.0, 289.0, 469.0, 776.0, 1359.0, 2605.0, 5552.0, 13926.0, 48245.0, 392573.0, 2905117.0, 721042.0, 69981.0, 17850.0, 6872.0, 3041.0, 1455.0, 886.0, 493.0, 328.0, 223.0, 144.0, 92.0, 83.0, 53.0, 34.0, 34.0, 18.0, 12.0, 9.0, 7.0, 6.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-28.5, -27.652099609375, -26.80419921875, -25.956298828125, -25.1083984375, -24.260498046875, -23.41259765625, -22.564697265625, -21.716796875, -20.868896484375, -20.02099609375, -19.173095703125, -18.3251953125, -17.477294921875, -16.62939453125, -15.781494140625, -14.93359375, -14.085693359375, -13.23779296875, -12.389892578125, -11.5419921875, -10.694091796875, -9.84619140625, -8.998291015625, -8.150390625, -7.302490234375, -6.45458984375, -5.606689453125, -4.7587890625, -3.910888671875, -3.06298828125, -2.215087890625, -1.3671875, -0.519287109375, 0.32861328125, 1.176513671875, 2.0244140625, 2.872314453125, 3.72021484375, 4.568115234375, 5.416015625, 6.263916015625, 7.11181640625, 7.959716796875, 8.8076171875, 9.655517578125, 10.50341796875, 11.351318359375, 12.19921875, 13.047119140625, 13.89501953125, 14.742919921875, 15.5908203125, 16.438720703125, 17.28662109375, 18.134521484375, 18.982421875, 19.830322265625, 20.67822265625, 21.526123046875, 22.3740234375, 23.221923828125, 24.06982421875, 24.917724609375, 25.765625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 10.0, 5.0, 3.0, 13.0, 9.0, 10.0, 15.0, 27.0, 22.0, 33.0, 40.0, 58.0, 98.0, 101.0, 159.0, 221.0, 329.0, 388.0, 507.0, 505.0, 403.0, 317.0, 217.0, 135.0, 122.0, 84.0, 68.0, 44.0, 43.0, 21.0, 19.0, 14.0, 10.0, 11.0, 5.0, 3.0, 1.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.8125, -18.2763671875, -17.740234375, -17.2041015625, -16.66796875, -16.1318359375, -15.595703125, -15.0595703125, -14.5234375, -13.9873046875, -13.451171875, -12.9150390625, -12.37890625, -11.8427734375, -11.306640625, -10.7705078125, -10.234375, -9.6982421875, -9.162109375, -8.6259765625, -8.08984375, -7.5537109375, -7.017578125, -6.4814453125, -5.9453125, -5.4091796875, -4.873046875, -4.3369140625, -3.80078125, -3.2646484375, -2.728515625, -2.1923828125, -1.65625, -1.1201171875, -0.583984375, -0.0478515625, 0.48828125, 1.0244140625, 1.560546875, 2.0966796875, 2.6328125, 3.1689453125, 3.705078125, 4.2412109375, 4.77734375, 5.3134765625, 5.849609375, 6.3857421875, 6.921875, 7.4580078125, 7.994140625, 8.5302734375, 9.06640625, 9.6025390625, 10.138671875, 10.6748046875, 11.2109375, 11.7470703125, 12.283203125, 12.8193359375, 13.35546875, 13.8916015625, 14.427734375, 14.9638671875, 15.5]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 11.0, 18.0, 16.0, 21.0, 22.0, 33.0, 68.0, 91.0, 142.0, 187.0, 403.0, 1015.0, 3514.0, 21385.0, 513497.0, 3556511.0, 85695.0, 8276.0, 1878.0, 657.0, 305.0, 154.0, 109.0, 74.0, 44.0, 28.0, 26.0, 20.0, 23.0, 14.0, 6.0, 8.0, 5.0, 10.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.0, -70.86962890625, -68.7392578125, -66.60888671875, -64.478515625, -62.34814453125, -60.2177734375, -58.08740234375, -55.95703125, -53.82666015625, -51.6962890625, -49.56591796875, -47.435546875, -45.30517578125, -43.1748046875, -41.04443359375, -38.9140625, -36.78369140625, -34.6533203125, -32.52294921875, -30.392578125, -28.26220703125, -26.1318359375, -24.00146484375, -21.87109375, -19.74072265625, -17.6103515625, -15.47998046875, -13.349609375, -11.21923828125, -9.0888671875, -6.95849609375, -4.828125, -2.69775390625, -0.5673828125, 1.56298828125, 3.693359375, 5.82373046875, 7.9541015625, 10.08447265625, 12.21484375, 14.34521484375, 16.4755859375, 18.60595703125, 20.736328125, 22.86669921875, 24.9970703125, 27.12744140625, 29.2578125, 31.38818359375, 33.5185546875, 35.64892578125, 37.779296875, 39.90966796875, 42.0400390625, 44.17041015625, 46.30078125, 48.43115234375, 50.5615234375, 52.69189453125, 54.822265625, 56.95263671875, 59.0830078125, 61.21337890625, 63.34375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 22.0, 73.0, 208.0, 340.0, 246.0, 89.0, 24.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.43296813964844, -130.91455078125, -121.39613342285156, -111.87772369384766, -102.35930633544922, -92.84088897705078, -83.32247924804688, -73.80406188964844, -64.28564453125, -54.76722717285156, -45.24881362915039, -35.73040008544922, -26.21198272705078, -16.693565368652344, -7.175151824951172, 2.34326171875, 11.861679077148438, 21.380094528198242, 30.898509979248047, 40.41692352294922, 49.935340881347656, 59.453758239746094, 68.97216796875, 78.49058532714844, 88.00900268554688, 97.52742004394531, 107.04583740234375, 116.56424713134766, 126.0826644897461, 135.60107421875, 145.11949157714844, 154.63790893554688, 164.15634155273438, 173.6747589111328, 183.19317626953125, 192.7115936279297, 202.23001098632812, 211.7484130859375, 221.26683044433594, 230.78524780273438, 240.3036651611328, 249.82208251953125, 259.3404846191406, 268.8589172363281, 278.3773193359375, 287.895751953125, 297.4141540527344, 306.93255615234375, 316.45098876953125, 325.9693908691406, 335.4878234863281, 345.0062255859375, 354.524658203125, 364.0430603027344, 373.5614929199219, 383.07989501953125, 392.59832763671875, 402.1167297363281, 411.6351623535156, 421.153564453125, 430.6719970703125, 440.1903991699219, 449.7088317871094, 459.22723388671875, 468.7456359863281]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 6.0, 5.0, 9.0, 7.0, 10.0, 9.0, 14.0, 18.0, 14.0, 14.0, 29.0, 28.0, 21.0, 28.0, 32.0, 24.0, 36.0, 36.0, 37.0, 48.0, 44.0, 25.0, 34.0, 39.0, 38.0, 36.0, 41.0, 25.0, 34.0, 31.0, 34.0, 27.0, 22.0, 22.0, 26.0, 19.0, 15.0, 12.0, 9.0, 9.0, 7.0, 5.0, 7.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-56.384605407714844, -54.535579681396484, -52.686553955078125, -50.837528228759766, -48.988502502441406, -47.13947677612305, -45.29045104980469, -43.44142532348633, -41.59239959716797, -39.74337387084961, -37.89434814453125, -36.04532241821289, -34.19629669189453, -32.34727096557617, -30.498245239257812, -28.649219512939453, -26.800193786621094, -24.951168060302734, -23.102142333984375, -21.253116607666016, -19.404090881347656, -17.555065155029297, -15.706039428710938, -13.857013702392578, -12.007987976074219, -10.15896224975586, -8.3099365234375, -6.460910797119141, -4.611885070800781, -2.762859344482422, -0.9138336181640625, 0.9351921081542969, 2.7842178344726562, 4.633243560791016, 6.482269287109375, 8.331295013427734, 10.180320739746094, 12.029346466064453, 13.878372192382812, 15.727397918701172, 17.57642364501953, 19.42544937133789, 21.27447509765625, 23.12350082397461, 24.97252655029297, 26.821552276611328, 28.670578002929688, 30.519603729248047, 32.368629455566406, 34.217655181884766, 36.066680908203125, 37.915706634521484, 39.764732360839844, 41.6137580871582, 43.46278381347656, 45.31180953979492, 47.16083526611328, 49.00986099243164, 50.85888671875, 52.70791244506836, 54.55693817138672, 56.40596389770508, 58.25498962402344, 60.1040153503418, 61.953041076660156]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 7.0, 4.0, 13.0, 11.0, 13.0, 13.0, 29.0, 15.0, 28.0, 36.0, 34.0, 56.0, 49.0, 40.0, 52.0, 64.0, 56.0, 50.0, 49.0, 49.0, 42.0, 37.0, 44.0, 39.0, 28.0, 24.0, 21.0, 22.0, 26.0, 7.0, 11.0, 6.0, 9.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.640625, -11.2967529296875, -10.952880859375, -10.6090087890625, -10.26513671875, -9.9212646484375, -9.577392578125, -9.2335205078125, -8.8896484375, -8.5457763671875, -8.201904296875, -7.8580322265625, -7.51416015625, -7.1702880859375, -6.826416015625, -6.4825439453125, -6.138671875, -5.7947998046875, -5.450927734375, -5.1070556640625, -4.76318359375, -4.4193115234375, -4.075439453125, -3.7315673828125, -3.3876953125, -3.0438232421875, -2.699951171875, -2.3560791015625, -2.01220703125, -1.6683349609375, -1.324462890625, -0.9805908203125, -0.63671875, -0.2928466796875, 0.051025390625, 0.3948974609375, 0.73876953125, 1.0826416015625, 1.426513671875, 1.7703857421875, 2.1142578125, 2.4581298828125, 2.802001953125, 3.1458740234375, 3.48974609375, 3.8336181640625, 4.177490234375, 4.5213623046875, 4.865234375, 5.2091064453125, 5.552978515625, 5.8968505859375, 6.24072265625, 6.5845947265625, 6.928466796875, 7.2723388671875, 7.6162109375, 7.9600830078125, 8.303955078125, 8.6478271484375, 8.99169921875, 9.3355712890625, 9.679443359375, 10.0233154296875, 10.3671875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 6.0, 7.0, 9.0, 23.0, 30.0, 37.0, 80.0, 91.0, 169.0, 297.0, 476.0, 760.0, 1355.0, 2310.0, 4010.0, 7454.0, 14351.0, 28567.0, 59704.0, 134738.0, 278797.0, 271292.0, 128843.0, 57502.0, 27284.0, 13742.0, 7324.0, 3951.0, 2213.0, 1238.0, 757.0, 438.0, 228.0, 177.0, 100.0, 60.0, 47.0, 34.0, 19.0, 12.0, 9.0, 3.0, 8.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.111328125, -2.0491790771484375, -1.987030029296875, -1.9248809814453125, -1.86273193359375, -1.8005828857421875, -1.738433837890625, -1.6762847900390625, -1.6141357421875, -1.5519866943359375, -1.489837646484375, -1.4276885986328125, -1.36553955078125, -1.3033905029296875, -1.241241455078125, -1.1790924072265625, -1.116943359375, -1.0547943115234375, -0.992645263671875, -0.9304962158203125, -0.86834716796875, -0.8061981201171875, -0.744049072265625, -0.6819000244140625, -0.6197509765625, -0.5576019287109375, -0.495452880859375, -0.4333038330078125, -0.37115478515625, -0.3090057373046875, -0.246856689453125, -0.1847076416015625, -0.12255859375, -0.0604095458984375, 0.001739501953125, 0.0638885498046875, 0.12603759765625, 0.1881866455078125, 0.250335693359375, 0.3124847412109375, 0.3746337890625, 0.4367828369140625, 0.498931884765625, 0.5610809326171875, 0.62322998046875, 0.6853790283203125, 0.747528076171875, 0.8096771240234375, 0.871826171875, 0.9339752197265625, 0.996124267578125, 1.0582733154296875, 1.12042236328125, 1.1825714111328125, 1.244720458984375, 1.3068695068359375, 1.3690185546875, 1.4311676025390625, 1.493316650390625, 1.5554656982421875, 1.61761474609375, 1.6797637939453125, 1.741912841796875, 1.8040618896484375, 1.8662109375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 12.0, 9.0, 16.0, 14.0, 20.0, 15.0, 20.0, 22.0, 23.0, 26.0, 40.0, 34.0, 52.0, 51.0, 49.0, 27.0, 1074.0, 57.0, 50.0, 52.0, 35.0, 38.0, 38.0, 35.0, 30.0, 29.0, 30.0, 31.0, 15.0, 18.0, 13.0, 10.0, 11.0, 5.0, 8.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.06640625, -5.84857177734375, -5.6307373046875, -5.41290283203125, -5.195068359375, -4.97723388671875, -4.7593994140625, -4.54156494140625, -4.32373046875, -4.10589599609375, -3.8880615234375, -3.67022705078125, -3.452392578125, -3.23455810546875, -3.0167236328125, -2.79888916015625, -2.5810546875, -2.36322021484375, -2.1453857421875, -1.92755126953125, -1.709716796875, -1.49188232421875, -1.2740478515625, -1.05621337890625, -0.83837890625, -0.62054443359375, -0.4027099609375, -0.18487548828125, 0.032958984375, 0.25079345703125, 0.4686279296875, 0.68646240234375, 0.904296875, 1.12213134765625, 1.3399658203125, 1.55780029296875, 1.775634765625, 1.99346923828125, 2.2113037109375, 2.42913818359375, 2.64697265625, 2.86480712890625, 3.0826416015625, 3.30047607421875, 3.518310546875, 3.73614501953125, 3.9539794921875, 4.17181396484375, 4.3896484375, 4.60748291015625, 4.8253173828125, 5.04315185546875, 5.260986328125, 5.47882080078125, 5.6966552734375, 5.91448974609375, 6.13232421875, 6.35015869140625, 6.5679931640625, 6.78582763671875, 7.003662109375, 7.22149658203125, 7.4393310546875, 7.65716552734375, 7.875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 9.0, 7.0, 11.0, 19.0, 24.0, 21.0, 45.0, 70.0, 91.0, 100.0, 160.0, 240.0, 387.0, 550.0, 781.0, 1225.0, 1947.0, 3182.0, 5257.0, 8640.0, 14876.0, 25324.0, 45824.0, 85228.0, 168466.0, 1270359.0, 225191.0, 106976.0, 56520.0, 31131.0, 17451.0, 10316.0, 6238.0, 3810.0, 2331.0, 1413.0, 983.0, 594.0, 404.0, 286.0, 170.0, 141.0, 84.0, 69.0, 43.0, 35.0, 27.0, 22.0, 16.0, 10.0, 9.0, 3.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0], "bins": [-0.6611328125, -0.6402587890625, -0.619384765625, -0.5985107421875, -0.57763671875, -0.5567626953125, -0.535888671875, -0.5150146484375, -0.494140625, -0.4732666015625, -0.452392578125, -0.4315185546875, -0.41064453125, -0.3897705078125, -0.368896484375, -0.3480224609375, -0.3271484375, -0.3062744140625, -0.285400390625, -0.2645263671875, -0.24365234375, -0.2227783203125, -0.201904296875, -0.1810302734375, -0.16015625, -0.1392822265625, -0.118408203125, -0.0975341796875, -0.07666015625, -0.0557861328125, -0.034912109375, -0.0140380859375, 0.0068359375, 0.0277099609375, 0.048583984375, 0.0694580078125, 0.09033203125, 0.1112060546875, 0.132080078125, 0.1529541015625, 0.173828125, 0.1947021484375, 0.215576171875, 0.2364501953125, 0.25732421875, 0.2781982421875, 0.299072265625, 0.3199462890625, 0.3408203125, 0.3616943359375, 0.382568359375, 0.4034423828125, 0.42431640625, 0.4451904296875, 0.466064453125, 0.4869384765625, 0.5078125, 0.5286865234375, 0.549560546875, 0.5704345703125, 0.59130859375, 0.6121826171875, 0.633056640625, 0.6539306640625, 0.6748046875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 8.0, 2.0, 0.0, 8.0, 4.0, 8.0, 9.0, 10.0, 10.0, 15.0, 7.0, 16.0, 10.0, 17.0, 16.0, 28.0, 66.0, 109.0, 317.0, 103.0, 66.0, 22.0, 19.0, 10.0, 19.0, 11.0, 14.0, 13.0, 12.0, 11.0, 5.0, 4.0, 5.0, 2.0, 11.0, 3.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1925048828125, -0.18638229370117188, -0.18025970458984375, -0.17413711547851562, -0.1680145263671875, -0.16189193725585938, -0.15576934814453125, -0.14964675903320312, -0.143524169921875, -0.13740158081054688, -0.13127899169921875, -0.12515640258789062, -0.1190338134765625, -0.11291122436523438, -0.10678863525390625, -0.10066604614257812, -0.09454345703125, -0.08842086791992188, -0.08229827880859375, -0.07617568969726562, -0.0700531005859375, -0.06393051147460938, -0.05780792236328125, -0.051685333251953125, -0.045562744140625, -0.039440155029296875, -0.03331756591796875, -0.027194976806640625, -0.0210723876953125, -0.014949798583984375, -0.00882720947265625, -0.002704620361328125, 0.00341796875, 0.009540557861328125, 0.01566314697265625, 0.021785736083984375, 0.0279083251953125, 0.034030914306640625, 0.04015350341796875, 0.046276092529296875, 0.052398681640625, 0.058521270751953125, 0.06464385986328125, 0.07076644897460938, 0.0768890380859375, 0.08301162719726562, 0.08913421630859375, 0.09525680541992188, 0.10137939453125, 0.10750198364257812, 0.11362457275390625, 0.11974716186523438, 0.1258697509765625, 0.13199234008789062, 0.13811492919921875, 0.14423751831054688, 0.150360107421875, 0.15648269653320312, 0.16260528564453125, 0.16872787475585938, 0.1748504638671875, 0.18097305297851562, 0.18709564208984375, 0.19321823120117188, 0.1993408203125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 4.0, 4.0, 7.0, 5.0, 4.0, 5.0, 7.0, 12.0, 12.0, 15.0, 16.0, 25.0, 35.0, 31.0, 63.0, 173.0, 425.0, 6046.0, 1028305.0, 12387.0, 527.0, 167.0, 71.0, 61.0, 20.0, 23.0, 13.0, 14.0, 16.0, 11.0, 11.0, 6.0, 6.0, 5.0, 3.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28125, -4.14984130859375, -4.0184326171875, -3.88702392578125, -3.755615234375, -3.62420654296875, -3.4927978515625, -3.36138916015625, -3.22998046875, -3.09857177734375, -2.9671630859375, -2.83575439453125, -2.704345703125, -2.57293701171875, -2.4415283203125, -2.31011962890625, -2.1787109375, -2.04730224609375, -1.9158935546875, -1.78448486328125, -1.653076171875, -1.52166748046875, -1.3902587890625, -1.25885009765625, -1.12744140625, -0.99603271484375, -0.8646240234375, -0.73321533203125, -0.601806640625, -0.47039794921875, -0.3389892578125, -0.20758056640625, -0.076171875, 0.05523681640625, 0.1866455078125, 0.31805419921875, 0.449462890625, 0.58087158203125, 0.7122802734375, 0.84368896484375, 0.97509765625, 1.10650634765625, 1.2379150390625, 1.36932373046875, 1.500732421875, 1.63214111328125, 1.7635498046875, 1.89495849609375, 2.0263671875, 2.15777587890625, 2.2891845703125, 2.42059326171875, 2.552001953125, 2.68341064453125, 2.8148193359375, 2.94622802734375, 3.07763671875, 3.20904541015625, 3.3404541015625, 3.47186279296875, 3.603271484375, 3.73468017578125, 3.8660888671875, 3.99749755859375, 4.12890625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 16.0, 32.0, 78.0, 206.0, 432.0, 145.0, 49.0, 28.0, 14.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.728989601135254, -1.6871917247772217, -1.6453938484191895, -1.6035958528518677, -1.5617979764938354, -1.5200001001358032, -1.4782021045684814, -1.4364042282104492, -1.394606351852417, -1.3528084754943848, -1.3110105991363525, -1.2692126035690308, -1.2274147272109985, -1.1856168508529663, -1.1438188552856445, -1.1020209789276123, -1.06022310256958, -1.0184252262115479, -0.9766272902488708, -0.9348293542861938, -0.8930314779281616, -0.8512336015701294, -0.8094356656074524, -0.7676377296447754, -0.7258398532867432, -0.6840419769287109, -0.6422440409660339, -0.6004461050033569, -0.5586482286453247, -0.5168503522872925, -0.4750524163246155, -0.43325451016426086, -0.3914567232131958, -0.3496588170528412, -0.3078609108924866, -0.26606300473213196, -0.22426509857177734, -0.18246719241142273, -0.14066928625106812, -0.0988713800907135, -0.05707347393035889, -0.015275567770004272, 0.026522338390350342, 0.06832024455070496, 0.11011815071105957, 0.15191605687141418, 0.1937139630317688, 0.2355118691921234, 0.277309775352478, 0.31910768151283264, 0.36090558767318726, 0.40270349383354187, 0.4445013999938965, 0.4862993061542511, 0.5280972123146057, 0.5698951482772827, 0.6116930246353149, 0.6534909009933472, 0.6952888369560242, 0.7370867729187012, 0.7788846492767334, 0.8206825256347656, 0.8624804615974426, 0.9042783975601196, 0.9460762739181519]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 3.0, 5.0, 8.0, 5.0, 7.0, 10.0, 13.0, 9.0, 17.0, 15.0, 12.0, 27.0, 22.0, 29.0, 29.0, 37.0, 24.0, 36.0, 24.0, 31.0, 36.0, 48.0, 34.0, 32.0, 38.0, 29.0, 24.0, 37.0, 25.0, 34.0, 26.0, 30.0, 21.0, 40.0, 24.0, 21.0, 26.0, 19.0, 17.0, 14.0, 9.0, 9.0, 17.0, 6.0, 9.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.4947187900543213, -0.4796886742115021, -0.46465858817100525, -0.44962847232818604, -0.4345983862876892, -0.41956827044487, -0.4045381546020508, -0.38950806856155396, -0.37447795271873474, -0.3594478368759155, -0.3444177508354187, -0.3293876349925995, -0.31435754895210266, -0.29932743310928345, -0.2842973470687866, -0.2692672312259674, -0.2542371153831482, -0.23920701444149017, -0.22417691349983215, -0.20914679765701294, -0.19411669671535492, -0.1790865957736969, -0.16405649483203888, -0.14902639389038086, -0.13399630784988403, -0.11896620690822601, -0.1039360985159874, -0.08890599757432938, -0.07387588918209076, -0.05884578824043274, -0.04381568729877472, -0.028785578906536102, -0.013755470514297485, 0.0012746332213282585, 0.016304736956954002, 0.03133483976125717, 0.04636494442820549, 0.06139504909515381, 0.07642515003681183, 0.09145525842905045, 0.10648535937070847, 0.12151546031236649, 0.1365455687046051, 0.15157566964626312, 0.16660577058792114, 0.18163588643074036, 0.19666597247123718, 0.2116960883140564, 0.22672618925571442, 0.24175629019737244, 0.25678640604019165, 0.2718164920806885, 0.2868466079235077, 0.3018767237663269, 0.31690680980682373, 0.33193692564964294, 0.34696701169013977, 0.361997127532959, 0.3770272135734558, 0.392057329416275, 0.40708741545677185, 0.42211753129959106, 0.4371476173400879, 0.4521777331829071, 0.4672078490257263]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 7.0, 6.0, 11.0, 10.0, 15.0, 14.0, 28.0, 16.0, 27.0, 35.0, 37.0, 52.0, 51.0, 39.0, 51.0, 66.0, 52.0, 50.0, 50.0, 52.0, 40.0, 39.0, 42.0, 39.0, 29.0, 25.0, 20.0, 22.0, 26.0, 7.0, 11.0, 7.0, 8.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.625, -11.281494140625, -10.93798828125, -10.594482421875, -10.2509765625, -9.907470703125, -9.56396484375, -9.220458984375, -8.876953125, -8.533447265625, -8.18994140625, -7.846435546875, -7.5029296875, -7.159423828125, -6.81591796875, -6.472412109375, -6.12890625, -5.785400390625, -5.44189453125, -5.098388671875, -4.7548828125, -4.411376953125, -4.06787109375, -3.724365234375, -3.380859375, -3.037353515625, -2.69384765625, -2.350341796875, -2.0068359375, -1.663330078125, -1.31982421875, -0.976318359375, -0.6328125, -0.289306640625, 0.05419921875, 0.397705078125, 0.7412109375, 1.084716796875, 1.42822265625, 1.771728515625, 2.115234375, 2.458740234375, 2.80224609375, 3.145751953125, 3.4892578125, 3.832763671875, 4.17626953125, 4.519775390625, 4.86328125, 5.206787109375, 5.55029296875, 5.893798828125, 6.2373046875, 6.580810546875, 6.92431640625, 7.267822265625, 7.611328125, 7.954833984375, 8.29833984375, 8.641845703125, 8.9853515625, 9.328857421875, 9.67236328125, 10.015869140625, 10.359375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 20.0, 22.0, 23.0, 39.0, 59.0, 78.0, 122.0, 147.0, 234.0, 346.0, 569.0, 889.0, 1408.0, 2537.0, 4864.0, 9881.0, 24505.0, 76080.0, 317517.0, 450921.0, 102761.0, 30689.0, 11798.0, 5626.0, 2952.0, 1699.0, 969.0, 601.0, 396.0, 278.0, 150.0, 118.0, 76.0, 51.0, 31.0, 25.0, 27.0, 17.0, 8.0, 9.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-16.96875, -16.4854736328125, -16.002197265625, -15.5189208984375, -15.03564453125, -14.5523681640625, -14.069091796875, -13.5858154296875, -13.1025390625, -12.6192626953125, -12.135986328125, -11.6527099609375, -11.16943359375, -10.6861572265625, -10.202880859375, -9.7196044921875, -9.236328125, -8.7530517578125, -8.269775390625, -7.7864990234375, -7.30322265625, -6.8199462890625, -6.336669921875, -5.8533935546875, -5.3701171875, -4.8868408203125, -4.403564453125, -3.9202880859375, -3.43701171875, -2.9537353515625, -2.470458984375, -1.9871826171875, -1.50390625, -1.0206298828125, -0.537353515625, -0.0540771484375, 0.42919921875, 0.9124755859375, 1.395751953125, 1.8790283203125, 2.3623046875, 2.8455810546875, 3.328857421875, 3.8121337890625, 4.29541015625, 4.7786865234375, 5.261962890625, 5.7452392578125, 6.228515625, 6.7117919921875, 7.195068359375, 7.6783447265625, 8.16162109375, 8.6448974609375, 9.128173828125, 9.6114501953125, 10.0947265625, 10.5780029296875, 11.061279296875, 11.5445556640625, 12.02783203125, 12.5111083984375, 12.994384765625, 13.4776611328125, 13.9609375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 3.0, 9.0, 3.0, 9.0, 17.0, 10.0, 19.0, 17.0, 15.0, 22.0, 24.0, 38.0, 28.0, 26.0, 33.0, 56.0, 57.0, 67.0, 120.0, 253.0, 1482.0, 208.0, 106.0, 61.0, 50.0, 40.0, 43.0, 40.0, 23.0, 16.0, 21.0, 23.0, 10.0, 21.0, 15.0, 17.0, 9.0, 9.0, 8.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-25.75, -24.97900390625, -24.2080078125, -23.43701171875, -22.666015625, -21.89501953125, -21.1240234375, -20.35302734375, -19.58203125, -18.81103515625, -18.0400390625, -17.26904296875, -16.498046875, -15.72705078125, -14.9560546875, -14.18505859375, -13.4140625, -12.64306640625, -11.8720703125, -11.10107421875, -10.330078125, -9.55908203125, -8.7880859375, -8.01708984375, -7.24609375, -6.47509765625, -5.7041015625, -4.93310546875, -4.162109375, -3.39111328125, -2.6201171875, -1.84912109375, -1.078125, -0.30712890625, 0.4638671875, 1.23486328125, 2.005859375, 2.77685546875, 3.5478515625, 4.31884765625, 5.08984375, 5.86083984375, 6.6318359375, 7.40283203125, 8.173828125, 8.94482421875, 9.7158203125, 10.48681640625, 11.2578125, 12.02880859375, 12.7998046875, 13.57080078125, 14.341796875, 15.11279296875, 15.8837890625, 16.65478515625, 17.42578125, 18.19677734375, 18.9677734375, 19.73876953125, 20.509765625, 21.28076171875, 22.0517578125, 22.82275390625, 23.59375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 1.0, 1.0, 7.0, 12.0, 11.0, 20.0, 20.0, 23.0, 30.0, 51.0, 43.0, 59.0, 77.0, 95.0, 150.0, 195.0, 306.0, 627.0, 1840.0, 8653.0, 141329.0, 2907085.0, 75516.0, 6431.0, 1476.0, 553.0, 283.0, 191.0, 118.0, 105.0, 86.0, 61.0, 53.0, 43.0, 37.0, 22.0, 28.0, 15.0, 10.0, 6.0, 9.0, 7.0, 9.0, 2.0, 5.0, 0.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.65625, -45.17138671875, -43.6865234375, -42.20166015625, -40.716796875, -39.23193359375, -37.7470703125, -36.26220703125, -34.77734375, -33.29248046875, -31.8076171875, -30.32275390625, -28.837890625, -27.35302734375, -25.8681640625, -24.38330078125, -22.8984375, -21.41357421875, -19.9287109375, -18.44384765625, -16.958984375, -15.47412109375, -13.9892578125, -12.50439453125, -11.01953125, -9.53466796875, -8.0498046875, -6.56494140625, -5.080078125, -3.59521484375, -2.1103515625, -0.62548828125, 0.859375, 2.34423828125, 3.8291015625, 5.31396484375, 6.798828125, 8.28369140625, 9.7685546875, 11.25341796875, 12.73828125, 14.22314453125, 15.7080078125, 17.19287109375, 18.677734375, 20.16259765625, 21.6474609375, 23.13232421875, 24.6171875, 26.10205078125, 27.5869140625, 29.07177734375, 30.556640625, 32.04150390625, 33.5263671875, 35.01123046875, 36.49609375, 37.98095703125, 39.4658203125, 40.95068359375, 42.435546875, 43.92041015625, 45.4052734375, 46.89013671875, 48.375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 22.0, 347.0, 540.0, 103.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.33827209472656, -30.995132446289062, -23.651994705200195, -16.308856964111328, -8.965717315673828, -1.6225776672363281, 5.720558166503906, 13.063697814941406, 20.406837463378906, 27.749977111816406, 35.093116760253906, 42.43625259399414, 49.77939224243164, 57.12253189086914, 64.46566772460938, 71.80880737304688, 79.15194702148438, 86.49508666992188, 93.83822631835938, 101.18136596679688, 108.52450561523438, 115.86764526367188, 123.21077728271484, 130.55392456054688, 137.89706420898438, 145.24020385742188, 152.58334350585938, 159.92648315429688, 167.26962280273438, 174.61276245117188, 181.95590209960938, 189.29904174804688, 196.64218139648438, 203.98532104492188, 211.32846069335938, 218.67160034179688, 226.01473999023438, 233.35787963867188, 240.70101928710938, 248.04415893554688, 255.38729858398438, 262.7304382324219, 270.0735778808594, 277.4167175292969, 284.7598571777344, 292.1029968261719, 299.4461364746094, 306.7892761230469, 314.13238525390625, 321.47552490234375, 328.81866455078125, 336.16180419921875, 343.50494384765625, 350.84808349609375, 358.19122314453125, 365.53436279296875, 372.87750244140625, 380.22064208984375, 387.56378173828125, 394.90692138671875, 402.25006103515625, 409.59320068359375, 416.93634033203125, 424.27947998046875, 431.62261962890625]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 9.0, 3.0, 6.0, 10.0, 10.0, 14.0, 18.0, 13.0, 12.0, 30.0, 25.0, 23.0, 19.0, 26.0, 34.0, 35.0, 32.0, 26.0, 29.0, 37.0, 37.0, 43.0, 57.0, 38.0, 40.0, 36.0, 36.0, 31.0, 28.0, 35.0, 25.0, 29.0, 24.0, 14.0, 17.0, 19.0, 12.0, 7.0, 7.0, 9.0, 13.0, 9.0, 2.0, 7.0, 6.0, 3.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0], "bins": [-62.882659912109375, -61.04526901245117, -59.20787811279297, -57.37049102783203, -55.53310012817383, -53.695709228515625, -51.85831832885742, -50.02092742919922, -48.18354034423828, -46.34614944458008, -44.508758544921875, -42.67137145996094, -40.833980560302734, -38.99658966064453, -37.15919876098633, -35.321807861328125, -33.48441696166992, -31.64702606201172, -29.80963706970215, -27.972246170043945, -26.134857177734375, -24.297466278076172, -22.46007537841797, -20.622684478759766, -18.785295486450195, -16.947904586791992, -15.110515594482422, -13.273124694824219, -11.435734748840332, -9.598344802856445, -7.760953903198242, -5.9235639572143555, -4.086174011230469, -2.248783826828003, -0.4113936424255371, 1.4259967803955078, 3.2633867263793945, 5.100776672363281, 6.938167572021484, 8.775557518005371, 10.612947463989258, 12.450337409973145, 14.287727355957031, 16.125118255615234, 17.962509155273438, 19.799898147583008, 21.63728904724121, 23.47467803955078, 25.312068939208984, 27.149459838867188, 28.986848831176758, 30.82423973083496, 32.66162872314453, 34.499019622802734, 36.33641052246094, 38.17380142211914, 40.011192321777344, 41.84858322143555, 43.68597412109375, 45.52336120605469, 47.36075210571289, 49.198143005371094, 51.0355339050293, 52.8729248046875, 54.71031188964844]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 4.0, 11.0, 11.0, 12.0, 21.0, 19.0, 23.0, 24.0, 34.0, 38.0, 36.0, 45.0, 48.0, 53.0, 47.0, 58.0, 44.0, 52.0, 48.0, 46.0, 48.0, 45.0, 37.0, 25.0, 29.0, 20.0, 25.0, 25.0, 21.0, 14.0, 7.0, 4.0, 7.0, 4.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.453125, -11.09912109375, -10.7451171875, -10.39111328125, -10.037109375, -9.68310546875, -9.3291015625, -8.97509765625, -8.62109375, -8.26708984375, -7.9130859375, -7.55908203125, -7.205078125, -6.85107421875, -6.4970703125, -6.14306640625, -5.7890625, -5.43505859375, -5.0810546875, -4.72705078125, -4.373046875, -4.01904296875, -3.6650390625, -3.31103515625, -2.95703125, -2.60302734375, -2.2490234375, -1.89501953125, -1.541015625, -1.18701171875, -0.8330078125, -0.47900390625, -0.125, 0.22900390625, 0.5830078125, 0.93701171875, 1.291015625, 1.64501953125, 1.9990234375, 2.35302734375, 2.70703125, 3.06103515625, 3.4150390625, 3.76904296875, 4.123046875, 4.47705078125, 4.8310546875, 5.18505859375, 5.5390625, 5.89306640625, 6.2470703125, 6.60107421875, 6.955078125, 7.30908203125, 7.6630859375, 8.01708984375, 8.37109375, 8.72509765625, 9.0791015625, 9.43310546875, 9.787109375, 10.14111328125, 10.4951171875, 10.84912109375, 11.203125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 14.0, 10.0, 6.0, 19.0, 23.0, 34.0, 44.0, 64.0, 95.0, 162.0, 235.0, 414.0, 661.0, 1188.0, 2352.0, 5303.0, 13531.0, 53492.0, 561600.0, 3067099.0, 420491.0, 45137.0, 12368.0, 4908.0, 2136.0, 1143.0, 640.0, 378.0, 237.0, 142.0, 117.0, 76.0, 34.0, 36.0, 26.0, 26.0, 11.0, 15.0, 8.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-32.5625, -31.669189453125, -30.77587890625, -29.882568359375, -28.9892578125, -28.095947265625, -27.20263671875, -26.309326171875, -25.416015625, -24.522705078125, -23.62939453125, -22.736083984375, -21.8427734375, -20.949462890625, -20.05615234375, -19.162841796875, -18.26953125, -17.376220703125, -16.48291015625, -15.589599609375, -14.6962890625, -13.802978515625, -12.90966796875, -12.016357421875, -11.123046875, -10.229736328125, -9.33642578125, -8.443115234375, -7.5498046875, -6.656494140625, -5.76318359375, -4.869873046875, -3.9765625, -3.083251953125, -2.18994140625, -1.296630859375, -0.4033203125, 0.489990234375, 1.38330078125, 2.276611328125, 3.169921875, 4.063232421875, 4.95654296875, 5.849853515625, 6.7431640625, 7.636474609375, 8.52978515625, 9.423095703125, 10.31640625, 11.209716796875, 12.10302734375, 12.996337890625, 13.8896484375, 14.782958984375, 15.67626953125, 16.569580078125, 17.462890625, 18.356201171875, 19.24951171875, 20.142822265625, 21.0361328125, 21.929443359375, 22.82275390625, 23.716064453125, 24.609375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 3.0, 11.0, 11.0, 18.0, 18.0, 30.0, 47.0, 67.0, 92.0, 150.0, 212.0, 341.0, 508.0, 629.0, 566.0, 453.0, 284.0, 179.0, 131.0, 73.0, 72.0, 41.0, 39.0, 26.0, 19.0, 14.0, 15.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.78125, -21.137939453125, -20.49462890625, -19.851318359375, -19.2080078125, -18.564697265625, -17.92138671875, -17.278076171875, -16.634765625, -15.991455078125, -15.34814453125, -14.704833984375, -14.0615234375, -13.418212890625, -12.77490234375, -12.131591796875, -11.48828125, -10.844970703125, -10.20166015625, -9.558349609375, -8.9150390625, -8.271728515625, -7.62841796875, -6.985107421875, -6.341796875, -5.698486328125, -5.05517578125, -4.411865234375, -3.7685546875, -3.125244140625, -2.48193359375, -1.838623046875, -1.1953125, -0.552001953125, 0.09130859375, 0.734619140625, 1.3779296875, 2.021240234375, 2.66455078125, 3.307861328125, 3.951171875, 4.594482421875, 5.23779296875, 5.881103515625, 6.5244140625, 7.167724609375, 7.81103515625, 8.454345703125, 9.09765625, 9.740966796875, 10.38427734375, 11.027587890625, 11.6708984375, 12.314208984375, 12.95751953125, 13.600830078125, 14.244140625, 14.887451171875, 15.53076171875, 16.174072265625, 16.8173828125, 17.460693359375, 18.10400390625, 18.747314453125, 19.390625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 2.0, 1.0, 2.0, 7.0, 10.0, 14.0, 8.0, 11.0, 13.0, 26.0, 37.0, 51.0, 48.0, 81.0, 125.0, 193.0, 423.0, 1036.0, 3911.0, 45100.0, 3708968.0, 419162.0, 11679.0, 1977.0, 635.0, 294.0, 146.0, 90.0, 69.0, 39.0, 30.0, 30.0, 15.0, 12.0, 9.0, 10.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-80.875, -78.1572265625, -75.439453125, -72.7216796875, -70.00390625, -67.2861328125, -64.568359375, -61.8505859375, -59.1328125, -56.4150390625, -53.697265625, -50.9794921875, -48.26171875, -45.5439453125, -42.826171875, -40.1083984375, -37.390625, -34.6728515625, -31.955078125, -29.2373046875, -26.51953125, -23.8017578125, -21.083984375, -18.3662109375, -15.6484375, -12.9306640625, -10.212890625, -7.4951171875, -4.77734375, -2.0595703125, 0.658203125, 3.3759765625, 6.09375, 8.8115234375, 11.529296875, 14.2470703125, 16.96484375, 19.6826171875, 22.400390625, 25.1181640625, 27.8359375, 30.5537109375, 33.271484375, 35.9892578125, 38.70703125, 41.4248046875, 44.142578125, 46.8603515625, 49.578125, 52.2958984375, 55.013671875, 57.7314453125, 60.44921875, 63.1669921875, 65.884765625, 68.6025390625, 71.3203125, 74.0380859375, 76.755859375, 79.4736328125, 82.19140625, 84.9091796875, 87.626953125, 90.3447265625, 93.0625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 8.0, 15.0, 23.0, 36.0, 61.0, 68.0, 115.0, 168.0, 146.0, 110.0, 115.0, 50.0, 40.0, 23.0, 9.0, 14.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.791595458984375, -42.027671813964844, -38.26375198364258, -34.49983215332031, -30.73590850830078, -26.971986770629883, -23.208065032958984, -19.444143295288086, -15.680221557617188, -11.916299819946289, -8.15237808227539, -4.388456344604492, -0.6245346069335938, 3.1393871307373047, 6.903308868408203, 10.667230606079102, 14.43115234375, 18.1950740814209, 21.958995819091797, 25.722917556762695, 29.486839294433594, 33.250762939453125, 37.01468276977539, 40.778602600097656, 44.54252624511719, 48.30644989013672, 52.070369720458984, 55.83428955078125, 59.59821319580078, 63.36213684082031, 67.12605285644531, 70.88997650146484, 74.65390014648438, 78.4178237915039, 82.18174743652344, 85.94566345214844, 89.70958709716797, 93.4735107421875, 97.2374267578125, 101.00135040283203, 104.76527404785156, 108.5291976928711, 112.29312133789062, 116.05703735351562, 119.82096099853516, 123.58488464355469, 127.34880065917969, 131.11273193359375, 134.87664794921875, 138.64056396484375, 142.4044952392578, 146.1684112548828, 149.93234252929688, 153.69625854492188, 157.46017456054688, 161.22410583496094, 164.98802185058594, 168.75193786621094, 172.515869140625, 176.27978515625, 180.043701171875, 183.80763244628906, 187.57154846191406, 191.33547973632812, 195.09939575195312]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 3.0, 6.0, 6.0, 4.0, 9.0, 3.0, 16.0, 19.0, 15.0, 24.0, 28.0, 20.0, 31.0, 25.0, 32.0, 27.0, 36.0, 37.0, 46.0, 26.0, 29.0, 41.0, 35.0, 44.0, 32.0, 37.0, 40.0, 33.0, 30.0, 26.0, 27.0, 22.0, 25.0, 29.0, 20.0, 21.0, 14.0, 11.0, 14.0, 8.0, 8.0, 12.0, 6.0, 3.0, 7.0, 4.0, 4.0, 0.0, 3.0, 2.0, 3.0, 4.0], "bins": [-61.32733154296875, -59.58025360107422, -57.83317565917969, -56.08610153198242, -54.33902359008789, -52.59194564819336, -50.84486770629883, -49.09779357910156, -47.35071563720703, -45.6036376953125, -43.85655975341797, -42.1094856262207, -40.36240768432617, -38.61532974243164, -36.86825180053711, -35.121177673339844, -33.37409973144531, -31.62702178955078, -29.879945755004883, -28.13286781311035, -26.385791778564453, -24.638713836669922, -22.89163589477539, -21.144559860229492, -19.397480010986328, -17.650402069091797, -15.903326034545898, -14.156248092651367, -12.409172058105469, -10.662094116210938, -8.915017127990723, -7.167940139770508, -5.420864105224609, -3.6737871170043945, -1.9267098903656006, -0.17963266372680664, 1.5674443244934082, 3.3145217895507812, 5.061598777770996, 6.808675765991211, 8.555752754211426, 10.30282974243164, 12.049906730651855, 13.79698371887207, 15.544061660766602, 17.2911376953125, 19.03821563720703, 20.785293579101562, 22.53236961364746, 24.279447555541992, 26.02652359008789, 27.773601531982422, 29.52067756652832, 31.26775550842285, 33.01483154296875, 34.76190948486328, 36.50898742675781, 38.256065368652344, 40.003143310546875, 41.75021743774414, 43.49729537963867, 45.2443733215332, 46.991451263427734, 48.738525390625, 50.48560333251953]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 13.0, 5.0, 6.0, 11.0, 10.0, 7.0, 19.0, 21.0, 25.0, 28.0, 32.0, 41.0, 44.0, 52.0, 34.0, 53.0, 37.0, 51.0, 62.0, 46.0, 47.0, 41.0, 43.0, 35.0, 35.0, 29.0, 23.0, 31.0, 26.0, 19.0, 11.0, 10.0, 17.0, 6.0, 7.0, 5.0, 6.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.359375, -10.026611328125, -9.69384765625, -9.361083984375, -9.0283203125, -8.695556640625, -8.36279296875, -8.030029296875, -7.697265625, -7.364501953125, -7.03173828125, -6.698974609375, -6.3662109375, -6.033447265625, -5.70068359375, -5.367919921875, -5.03515625, -4.702392578125, -4.36962890625, -4.036865234375, -3.7041015625, -3.371337890625, -3.03857421875, -2.705810546875, -2.373046875, -2.040283203125, -1.70751953125, -1.374755859375, -1.0419921875, -0.709228515625, -0.37646484375, -0.043701171875, 0.2890625, 0.621826171875, 0.95458984375, 1.287353515625, 1.6201171875, 1.952880859375, 2.28564453125, 2.618408203125, 2.951171875, 3.283935546875, 3.61669921875, 3.949462890625, 4.2822265625, 4.614990234375, 4.94775390625, 5.280517578125, 5.61328125, 5.946044921875, 6.27880859375, 6.611572265625, 6.9443359375, 7.277099609375, 7.60986328125, 7.942626953125, 8.275390625, 8.608154296875, 8.94091796875, 9.273681640625, 9.6064453125, 9.939208984375, 10.27197265625, 10.604736328125, 10.9375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 5.0, 16.0, 29.0, 40.0, 67.0, 95.0, 144.0, 254.0, 377.0, 556.0, 914.0, 1409.0, 2253.0, 3540.0, 5689.0, 9337.0, 15347.0, 25341.0, 42325.0, 72734.0, 124428.0, 194141.0, 207738.0, 138787.0, 82506.0, 47810.0, 27998.0, 16993.0, 10530.0, 6277.0, 3998.0, 2535.0, 1539.0, 993.0, 612.0, 457.0, 266.0, 167.0, 121.0, 61.0, 51.0, 26.0, 19.0, 10.0, 8.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2607421875, -1.2188720703125, -1.177001953125, -1.1351318359375, -1.09326171875, -1.0513916015625, -1.009521484375, -0.9676513671875, -0.92578125, -0.8839111328125, -0.842041015625, -0.8001708984375, -0.75830078125, -0.7164306640625, -0.674560546875, -0.6326904296875, -0.5908203125, -0.5489501953125, -0.507080078125, -0.4652099609375, -0.42333984375, -0.3814697265625, -0.339599609375, -0.2977294921875, -0.255859375, -0.2139892578125, -0.172119140625, -0.1302490234375, -0.08837890625, -0.0465087890625, -0.004638671875, 0.0372314453125, 0.0791015625, 0.1209716796875, 0.162841796875, 0.2047119140625, 0.24658203125, 0.2884521484375, 0.330322265625, 0.3721923828125, 0.4140625, 0.4559326171875, 0.497802734375, 0.5396728515625, 0.58154296875, 0.6234130859375, 0.665283203125, 0.7071533203125, 0.7490234375, 0.7908935546875, 0.832763671875, 0.8746337890625, 0.91650390625, 0.9583740234375, 1.000244140625, 1.0421142578125, 1.083984375, 1.1258544921875, 1.167724609375, 1.2095947265625, 1.25146484375, 1.2933349609375, 1.335205078125, 1.3770751953125, 1.4189453125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 1.0, 2.0, 4.0, 6.0, 5.0, 9.0, 5.0, 9.0, 7.0, 20.0, 17.0, 16.0, 21.0, 20.0, 18.0, 31.0, 26.0, 38.0, 31.0, 30.0, 48.0, 21.0, 43.0, 42.0, 1062.0, 31.0, 36.0, 38.0, 40.0, 34.0, 35.0, 26.0, 40.0, 37.0, 13.0, 24.0, 22.0, 18.0, 12.0, 17.0, 7.0, 19.0, 6.0, 11.0, 4.0, 7.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-5.74609375, -5.56475830078125, -5.3834228515625, -5.20208740234375, -5.020751953125, -4.83941650390625, -4.6580810546875, -4.47674560546875, -4.29541015625, -4.11407470703125, -3.9327392578125, -3.75140380859375, -3.570068359375, -3.38873291015625, -3.2073974609375, -3.02606201171875, -2.8447265625, -2.66339111328125, -2.4820556640625, -2.30072021484375, -2.119384765625, -1.93804931640625, -1.7567138671875, -1.57537841796875, -1.39404296875, -1.21270751953125, -1.0313720703125, -0.85003662109375, -0.668701171875, -0.48736572265625, -0.3060302734375, -0.12469482421875, 0.056640625, 0.23797607421875, 0.4193115234375, 0.60064697265625, 0.781982421875, 0.96331787109375, 1.1446533203125, 1.32598876953125, 1.50732421875, 1.68865966796875, 1.8699951171875, 2.05133056640625, 2.232666015625, 2.41400146484375, 2.5953369140625, 2.77667236328125, 2.9580078125, 3.13934326171875, 3.3206787109375, 3.50201416015625, 3.683349609375, 3.86468505859375, 4.0460205078125, 4.22735595703125, 4.40869140625, 4.59002685546875, 4.7713623046875, 4.95269775390625, 5.134033203125, 5.31536865234375, 5.4967041015625, 5.67803955078125, 5.859375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 4.0, 10.0, 20.0, 28.0, 38.0, 54.0, 105.0, 163.0, 201.0, 372.0, 598.0, 1064.0, 1733.0, 2840.0, 4716.0, 8012.0, 13749.0, 23777.0, 43023.0, 80510.0, 154448.0, 1262589.0, 246168.0, 115080.0, 60007.0, 32712.0, 18722.0, 10641.0, 6215.0, 3832.0, 2194.0, 1303.0, 789.0, 523.0, 360.0, 195.0, 117.0, 75.0, 42.0, 32.0, 19.0, 22.0, 7.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.787109375, -0.765106201171875, -0.74310302734375, -0.721099853515625, -0.6990966796875, -0.677093505859375, -0.65509033203125, -0.633087158203125, -0.611083984375, -0.589080810546875, -0.56707763671875, -0.545074462890625, -0.5230712890625, -0.501068115234375, -0.47906494140625, -0.457061767578125, -0.43505859375, -0.413055419921875, -0.39105224609375, -0.369049072265625, -0.3470458984375, -0.325042724609375, -0.30303955078125, -0.281036376953125, -0.259033203125, -0.237030029296875, -0.21502685546875, -0.193023681640625, -0.1710205078125, -0.149017333984375, -0.12701416015625, -0.105010986328125, -0.0830078125, -0.061004638671875, -0.03900146484375, -0.016998291015625, 0.0050048828125, 0.027008056640625, 0.04901123046875, 0.071014404296875, 0.093017578125, 0.115020751953125, 0.13702392578125, 0.159027099609375, 0.1810302734375, 0.203033447265625, 0.22503662109375, 0.247039794921875, 0.26904296875, 0.291046142578125, 0.31304931640625, 0.335052490234375, 0.3570556640625, 0.379058837890625, 0.40106201171875, 0.423065185546875, 0.445068359375, 0.467071533203125, 0.48907470703125, 0.511077880859375, 0.5330810546875, 0.555084228515625, 0.57708740234375, 0.599090576171875, 0.62109375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 1.0, 7.0, 5.0, 4.0, 10.0, 5.0, 4.0, 7.0, 8.0, 21.0, 14.0, 15.0, 20.0, 21.0, 41.0, 49.0, 62.0, 125.0, 243.0, 93.0, 56.0, 38.0, 18.0, 19.0, 19.0, 12.0, 9.0, 11.0, 14.0, 5.0, 8.0, 10.0, 8.0, 2.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1304931640625, -0.12668991088867188, -0.12288665771484375, -0.11908340454101562, -0.1152801513671875, -0.11147689819335938, -0.10767364501953125, -0.10387039184570312, -0.100067138671875, -0.09626388549804688, -0.09246063232421875, -0.08865737915039062, -0.0848541259765625, -0.08105087280273438, -0.07724761962890625, -0.07344436645507812, -0.06964111328125, -0.06583786010742188, -0.06203460693359375, -0.058231353759765625, -0.0544281005859375, -0.050624847412109375, -0.04682159423828125, -0.043018341064453125, -0.039215087890625, -0.035411834716796875, -0.03160858154296875, -0.027805328369140625, -0.0240020751953125, -0.020198822021484375, -0.01639556884765625, -0.012592315673828125, -0.0087890625, -0.004985809326171875, -0.00118255615234375, 0.002620697021484375, 0.0064239501953125, 0.010227203369140625, 0.01403045654296875, 0.017833709716796875, 0.021636962890625, 0.025440216064453125, 0.02924346923828125, 0.033046722412109375, 0.0368499755859375, 0.040653228759765625, 0.04445648193359375, 0.048259735107421875, 0.05206298828125, 0.055866241455078125, 0.05966949462890625, 0.06347274780273438, 0.0672760009765625, 0.07107925415039062, 0.07488250732421875, 0.07868576049804688, 0.082489013671875, 0.08629226684570312, 0.09009552001953125, 0.09389877319335938, 0.0977020263671875, 0.10150527954101562, 0.10530853271484375, 0.10911178588867188, 0.1129150390625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 8.0, 11.0, 3.0, 9.0, 12.0, 9.0, 17.0, 13.0, 27.0, 38.0, 69.0, 145.0, 451.0, 8749.0, 1003198.0, 34469.0, 819.0, 214.0, 89.0, 48.0, 39.0, 19.0, 16.0, 18.0, 9.0, 3.0, 8.0, 8.0, 4.0, 6.0, 5.0, 4.0, 0.0, 6.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.67578125, -2.58551025390625, -2.4952392578125, -2.40496826171875, -2.314697265625, -2.22442626953125, -2.1341552734375, -2.04388427734375, -1.95361328125, -1.86334228515625, -1.7730712890625, -1.68280029296875, -1.592529296875, -1.50225830078125, -1.4119873046875, -1.32171630859375, -1.2314453125, -1.14117431640625, -1.0509033203125, -0.96063232421875, -0.870361328125, -0.78009033203125, -0.6898193359375, -0.59954833984375, -0.50927734375, -0.41900634765625, -0.3287353515625, -0.23846435546875, -0.148193359375, -0.05792236328125, 0.0323486328125, 0.12261962890625, 0.212890625, 0.30316162109375, 0.3934326171875, 0.48370361328125, 0.573974609375, 0.66424560546875, 0.7545166015625, 0.84478759765625, 0.93505859375, 1.02532958984375, 1.1156005859375, 1.20587158203125, 1.296142578125, 1.38641357421875, 1.4766845703125, 1.56695556640625, 1.6572265625, 1.74749755859375, 1.8377685546875, 1.92803955078125, 2.018310546875, 2.10858154296875, 2.1988525390625, 2.28912353515625, 2.37939453125, 2.46966552734375, 2.5599365234375, 2.65020751953125, 2.740478515625, 2.83074951171875, 2.9210205078125, 3.01129150390625, 3.1015625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 10.0, 17.0, 21.0, 17.0, 45.0, 81.0, 117.0, 198.0, 210.0, 90.0, 51.0, 35.0, 29.0, 23.0, 11.0, 7.0, 10.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6201918125152588, -0.5994992852210999, -0.5788067579269409, -0.558114230632782, -0.537421703338623, -0.5167291760444641, -0.4960366487503052, -0.47534412145614624, -0.4546515941619873, -0.43395906686782837, -0.41326653957366943, -0.3925740122795105, -0.37188148498535156, -0.3511889576911926, -0.3304964303970337, -0.30980390310287476, -0.2891114056110382, -0.2684188783168793, -0.24772635102272034, -0.2270338237285614, -0.20634129643440247, -0.18564876914024353, -0.1649562567472458, -0.14426372945308685, -0.12357120215892792, -0.10287867486476898, -0.08218614757061005, -0.06149362772703171, -0.04080110043287277, -0.020108573138713837, 0.000583946704864502, 0.021276473999023438, 0.04196900129318237, 0.06266152858734131, 0.08335405588150024, 0.10404657572507858, 0.12473910301923752, 0.14543163776397705, 0.1661241501569748, 0.18681667745113373, 0.20750920474529266, 0.2282017320394516, 0.24889425933361053, 0.2695867717266083, 0.2902792990207672, 0.31097182631492615, 0.3316643536090851, 0.352356880903244, 0.37304940819740295, 0.3937419354915619, 0.4144344627857208, 0.43512699007987976, 0.4558195173740387, 0.47651204466819763, 0.4972045421600342, 0.5178970694541931, 0.538589596748352, 0.559282124042511, 0.5799746513366699, 0.6006671786308289, 0.6213597059249878, 0.6420522332191467, 0.6627447605133057, 0.6834372878074646, 0.7041298151016235]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 5.0, 9.0, 0.0, 5.0, 5.0, 13.0, 10.0, 22.0, 20.0, 11.0, 18.0, 21.0, 29.0, 23.0, 22.0, 31.0, 33.0, 44.0, 43.0, 36.0, 42.0, 51.0, 40.0, 41.0, 41.0, 29.0, 37.0, 28.0, 29.0, 33.0, 27.0, 15.0, 28.0, 14.0, 34.0, 13.0, 20.0, 16.0, 13.0, 13.0, 9.0, 8.0, 6.0, 6.0, 7.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3506801724433899, -0.34051117300987244, -0.330342173576355, -0.3201731741428375, -0.31000417470932007, -0.2998351752758026, -0.28966617584228516, -0.2794971466064453, -0.26932817697525024, -0.2591591775417328, -0.24899017810821533, -0.23882117867469788, -0.22865217924118042, -0.21848317980766296, -0.20831416547298431, -0.19814516603946686, -0.1879761517047882, -0.17780715227127075, -0.1676381528377533, -0.15746915340423584, -0.14730015397071838, -0.13713115453720093, -0.12696214020252228, -0.11679314076900482, -0.10662414133548737, -0.09645514190196991, -0.08628614246845245, -0.0761171355843544, -0.06594813615083694, -0.05577913671731949, -0.045610133558511734, -0.03544113039970398, -0.025272130966186523, -0.015103129670023918, -0.004934128373861313, 0.005234872922301292, 0.015403874218463898, 0.025572873651981354, 0.03574187681078911, 0.04591087996959686, 0.05607987940311432, 0.06624887883663177, 0.07641787827014923, 0.08658688515424728, 0.09675588458776474, 0.1069248840212822, 0.11709389090538025, 0.1272628903388977, 0.13743188977241516, 0.14760088920593262, 0.15776988863945007, 0.16793888807296753, 0.17810788750648499, 0.18827688694000244, 0.1984459012746811, 0.20861490070819855, 0.218783900141716, 0.22895289957523346, 0.23912189900875092, 0.24929089844226837, 0.259459912776947, 0.2696289122104645, 0.27979791164398193, 0.2899669110774994, 0.30013591051101685]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 13.0, 5.0, 6.0, 11.0, 10.0, 6.0, 19.0, 21.0, 25.0, 29.0, 31.0, 40.0, 44.0, 51.0, 37.0, 50.0, 38.0, 51.0, 62.0, 45.0, 50.0, 40.0, 44.0, 35.0, 35.0, 29.0, 22.0, 32.0, 25.0, 19.0, 11.0, 10.0, 18.0, 5.0, 8.0, 5.0, 6.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.3671875, -10.0345458984375, -9.701904296875, -9.3692626953125, -9.03662109375, -8.7039794921875, -8.371337890625, -8.0386962890625, -7.7060546875, -7.3734130859375, -7.040771484375, -6.7081298828125, -6.37548828125, -6.0428466796875, -5.710205078125, -5.3775634765625, -5.044921875, -4.7122802734375, -4.379638671875, -4.0469970703125, -3.71435546875, -3.3817138671875, -3.049072265625, -2.7164306640625, -2.3837890625, -2.0511474609375, -1.718505859375, -1.3858642578125, -1.05322265625, -0.7205810546875, -0.387939453125, -0.0552978515625, 0.27734375, 0.6099853515625, 0.942626953125, 1.2752685546875, 1.60791015625, 1.9405517578125, 2.273193359375, 2.6058349609375, 2.9384765625, 3.2711181640625, 3.603759765625, 3.9364013671875, 4.26904296875, 4.6016845703125, 4.934326171875, 5.2669677734375, 5.599609375, 5.9322509765625, 6.264892578125, 6.5975341796875, 6.93017578125, 7.2628173828125, 7.595458984375, 7.9281005859375, 8.2607421875, 8.5933837890625, 8.926025390625, 9.2586669921875, 9.59130859375, 9.9239501953125, 10.256591796875, 10.5892333984375, 10.921875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 7.0, 11.0, 3.0, 11.0, 25.0, 28.0, 24.0, 63.0, 91.0, 150.0, 228.0, 406.0, 803.0, 1756.0, 5038.0, 17175.0, 70313.0, 368254.0, 471295.0, 82986.0, 20193.0, 5817.0, 1891.0, 851.0, 450.0, 224.0, 154.0, 93.0, 71.0, 43.0, 31.0, 15.0, 11.0, 10.0, 12.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.578125, -17.02978515625, -16.4814453125, -15.93310546875, -15.384765625, -14.83642578125, -14.2880859375, -13.73974609375, -13.19140625, -12.64306640625, -12.0947265625, -11.54638671875, -10.998046875, -10.44970703125, -9.9013671875, -9.35302734375, -8.8046875, -8.25634765625, -7.7080078125, -7.15966796875, -6.611328125, -6.06298828125, -5.5146484375, -4.96630859375, -4.41796875, -3.86962890625, -3.3212890625, -2.77294921875, -2.224609375, -1.67626953125, -1.1279296875, -0.57958984375, -0.03125, 0.51708984375, 1.0654296875, 1.61376953125, 2.162109375, 2.71044921875, 3.2587890625, 3.80712890625, 4.35546875, 4.90380859375, 5.4521484375, 6.00048828125, 6.548828125, 7.09716796875, 7.6455078125, 8.19384765625, 8.7421875, 9.29052734375, 9.8388671875, 10.38720703125, 10.935546875, 11.48388671875, 12.0322265625, 12.58056640625, 13.12890625, 13.67724609375, 14.2255859375, 14.77392578125, 15.322265625, 15.87060546875, 16.4189453125, 16.96728515625, 17.515625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 10.0, 10.0, 5.0, 9.0, 14.0, 18.0, 13.0, 16.0, 24.0, 28.0, 27.0, 32.0, 33.0, 49.0, 45.0, 62.0, 70.0, 109.0, 196.0, 1527.0, 194.0, 118.0, 68.0, 51.0, 40.0, 40.0, 24.0, 32.0, 28.0, 20.0, 28.0, 24.0, 9.0, 15.0, 18.0, 11.0, 3.0, 2.0, 7.0, 5.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.8125, -24.965576171875, -24.11865234375, -23.271728515625, -22.4248046875, -21.577880859375, -20.73095703125, -19.884033203125, -19.037109375, -18.190185546875, -17.34326171875, -16.496337890625, -15.6494140625, -14.802490234375, -13.95556640625, -13.108642578125, -12.26171875, -11.414794921875, -10.56787109375, -9.720947265625, -8.8740234375, -8.027099609375, -7.18017578125, -6.333251953125, -5.486328125, -4.639404296875, -3.79248046875, -2.945556640625, -2.0986328125, -1.251708984375, -0.40478515625, 0.442138671875, 1.2890625, 2.135986328125, 2.98291015625, 3.829833984375, 4.6767578125, 5.523681640625, 6.37060546875, 7.217529296875, 8.064453125, 8.911376953125, 9.75830078125, 10.605224609375, 11.4521484375, 12.299072265625, 13.14599609375, 13.992919921875, 14.83984375, 15.686767578125, 16.53369140625, 17.380615234375, 18.2275390625, 19.074462890625, 19.92138671875, 20.768310546875, 21.615234375, 22.462158203125, 23.30908203125, 24.156005859375, 25.0029296875, 25.849853515625, 26.69677734375, 27.543701171875, 28.390625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 5.0, 6.0, 6.0, 12.0, 14.0, 14.0, 16.0, 22.0, 24.0, 35.0, 42.0, 49.0, 66.0, 88.0, 145.0, 321.0, 629.0, 2242.0, 33011.0, 2961253.0, 141835.0, 3968.0, 851.0, 361.0, 193.0, 117.0, 85.0, 59.0, 38.0, 39.0, 35.0, 22.0, 16.0, 16.0, 10.0, 11.0, 6.0, 13.0, 7.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-68.8125, -66.767578125, -64.72265625, -62.677734375, -60.6328125, -58.587890625, -56.54296875, -54.498046875, -52.453125, -50.408203125, -48.36328125, -46.318359375, -44.2734375, -42.228515625, -40.18359375, -38.138671875, -36.09375, -34.048828125, -32.00390625, -29.958984375, -27.9140625, -25.869140625, -23.82421875, -21.779296875, -19.734375, -17.689453125, -15.64453125, -13.599609375, -11.5546875, -9.509765625, -7.46484375, -5.419921875, -3.375, -1.330078125, 0.71484375, 2.759765625, 4.8046875, 6.849609375, 8.89453125, 10.939453125, 12.984375, 15.029296875, 17.07421875, 19.119140625, 21.1640625, 23.208984375, 25.25390625, 27.298828125, 29.34375, 31.388671875, 33.43359375, 35.478515625, 37.5234375, 39.568359375, 41.61328125, 43.658203125, 45.703125, 47.748046875, 49.79296875, 51.837890625, 53.8828125, 55.927734375, 57.97265625, 60.017578125, 62.0625]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [314.0, 676.0, 28.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.072973251342773, -3.105311393737793, 9.862350463867188, 22.83001136779785, 35.79767608642578, 48.76533508300781, 61.732994079589844, 74.7006607055664, 87.66831970214844, 100.63597869873047, 113.60364532470703, 126.57130432128906, 139.53897094726562, 152.50662231445312, 165.4742889404297, 178.44195556640625, 191.4096221923828, 204.37728881835938, 217.34494018554688, 230.31260681152344, 243.2802734375, 256.2479248046875, 269.215576171875, 282.1832580566406, 295.1509094238281, 308.1185607910156, 321.08624267578125, 334.05389404296875, 347.02154541015625, 359.9892272949219, 372.9568786621094, 385.924560546875, 398.8921813964844, 411.8598327636719, 424.8275146484375, 437.795166015625, 450.7628173828125, 463.7304992675781, 476.6981506347656, 489.66583251953125, 502.63348388671875, 515.6011352539062, 528.5687866210938, 541.5364990234375, 554.504150390625, 567.4718017578125, 580.439453125, 593.4071044921875, 606.374755859375, 619.3424072265625, 632.31005859375, 645.2777099609375, 658.2454223632812, 671.2130737304688, 684.1807250976562, 697.1483764648438, 710.1160888671875, 723.083740234375, 736.0513916015625, 749.01904296875, 761.9867553710938, 774.9544067382812, 787.9220581054688, 800.8897094726562, 813.8573608398438]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 8.0, 9.0, 4.0, 4.0, 14.0, 20.0, 15.0, 11.0, 25.0, 20.0, 42.0, 22.0, 35.0, 25.0, 30.0, 43.0, 51.0, 40.0, 40.0, 47.0, 39.0, 53.0, 48.0, 38.0, 42.0, 26.0, 22.0, 25.0, 23.0, 21.0, 25.0, 15.0, 18.0, 13.0, 11.0, 9.0, 17.0, 8.0, 4.0, 10.0, 7.0, 2.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-79.46998596191406, -77.28299713134766, -75.09601593017578, -72.90902709960938, -70.7220458984375, -68.5350570678711, -66.34807586669922, -64.16108703613281, -61.97410583496094, -59.7871208190918, -57.600135803222656, -55.413150787353516, -53.226165771484375, -51.039180755615234, -48.852195739746094, -46.66520690917969, -44.47822189331055, -42.291236877441406, -40.104251861572266, -37.917266845703125, -35.730281829833984, -33.543296813964844, -31.35630989074707, -29.16932487487793, -26.98233985900879, -24.79535484313965, -22.608369827270508, -20.421382904052734, -18.234397888183594, -16.047412872314453, -13.860427856445312, -11.673442840576172, -9.486454010009766, -7.299468994140625, -5.112483501434326, -2.9254980087280273, -0.7385129928588867, 1.448472023010254, 3.635457992553711, 5.822443008422852, 8.009428024291992, 10.196413040161133, 12.383398056030273, 14.57038402557373, 16.757369995117188, 18.944355010986328, 21.13134002685547, 23.31832504272461, 25.50531005859375, 27.69229507446289, 29.87928009033203, 32.06626510620117, 34.25325012207031, 36.44023513793945, 38.627220153808594, 40.814208984375, 43.001190185546875, 45.188175201416016, 47.375160217285156, 49.5621452331543, 51.74913024902344, 53.93611526489258, 56.12310028076172, 58.310089111328125, 60.497074127197266]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 5.0, 6.0, 5.0, 10.0, 8.0, 10.0, 10.0, 16.0, 15.0, 22.0, 22.0, 31.0, 45.0, 43.0, 38.0, 33.0, 36.0, 43.0, 35.0, 41.0, 40.0, 40.0, 49.0, 49.0, 44.0, 37.0, 41.0, 28.0, 26.0, 26.0, 28.0, 21.0, 25.0, 8.0, 7.0, 14.0, 10.0, 10.0, 9.0, 2.0, 5.0, 2.0, 3.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.921875, -9.596923828125, -9.27197265625, -8.947021484375, -8.6220703125, -8.297119140625, -7.97216796875, -7.647216796875, -7.322265625, -6.997314453125, -6.67236328125, -6.347412109375, -6.0224609375, -5.697509765625, -5.37255859375, -5.047607421875, -4.72265625, -4.397705078125, -4.07275390625, -3.747802734375, -3.4228515625, -3.097900390625, -2.77294921875, -2.447998046875, -2.123046875, -1.798095703125, -1.47314453125, -1.148193359375, -0.8232421875, -0.498291015625, -0.17333984375, 0.151611328125, 0.4765625, 0.801513671875, 1.12646484375, 1.451416015625, 1.7763671875, 2.101318359375, 2.42626953125, 2.751220703125, 3.076171875, 3.401123046875, 3.72607421875, 4.051025390625, 4.3759765625, 4.700927734375, 5.02587890625, 5.350830078125, 5.67578125, 6.000732421875, 6.32568359375, 6.650634765625, 6.9755859375, 7.300537109375, 7.62548828125, 7.950439453125, 8.275390625, 8.600341796875, 8.92529296875, 9.250244140625, 9.5751953125, 9.900146484375, 10.22509765625, 10.550048828125, 10.875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 4.0, 9.0, 8.0, 11.0, 19.0, 30.0, 35.0, 38.0, 54.0, 57.0, 99.0, 148.0, 201.0, 331.0, 465.0, 733.0, 1344.0, 2169.0, 4175.0, 9154.0, 22808.0, 78390.0, 434879.0, 2062671.0, 1291541.0, 208317.0, 45828.0, 15620.0, 6867.0, 3328.0, 1875.0, 1065.0, 682.0, 395.0, 283.0, 179.0, 124.0, 93.0, 66.0, 51.0, 36.0, 35.0, 22.0, 15.0, 8.0, 8.0, 8.0, 7.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.34375, -16.719970703125, -16.09619140625, -15.472412109375, -14.8486328125, -14.224853515625, -13.60107421875, -12.977294921875, -12.353515625, -11.729736328125, -11.10595703125, -10.482177734375, -9.8583984375, -9.234619140625, -8.61083984375, -7.987060546875, -7.36328125, -6.739501953125, -6.11572265625, -5.491943359375, -4.8681640625, -4.244384765625, -3.62060546875, -2.996826171875, -2.373046875, -1.749267578125, -1.12548828125, -0.501708984375, 0.1220703125, 0.745849609375, 1.36962890625, 1.993408203125, 2.6171875, 3.240966796875, 3.86474609375, 4.488525390625, 5.1123046875, 5.736083984375, 6.35986328125, 6.983642578125, 7.607421875, 8.231201171875, 8.85498046875, 9.478759765625, 10.1025390625, 10.726318359375, 11.35009765625, 11.973876953125, 12.59765625, 13.221435546875, 13.84521484375, 14.468994140625, 15.0927734375, 15.716552734375, 16.34033203125, 16.964111328125, 17.587890625, 18.211669921875, 18.83544921875, 19.459228515625, 20.0830078125, 20.706787109375, 21.33056640625, 21.954345703125, 22.578125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 9.0, 14.0, 20.0, 31.0, 31.0, 44.0, 78.0, 95.0, 178.0, 259.0, 394.0, 594.0, 641.0, 531.0, 334.0, 253.0, 156.0, 130.0, 91.0, 57.0, 27.0, 23.0, 31.0, 14.0, 13.0, 5.0, 6.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.296875, -20.5703125, -19.84375, -19.1171875, -18.390625, -17.6640625, -16.9375, -16.2109375, -15.484375, -14.7578125, -14.03125, -13.3046875, -12.578125, -11.8515625, -11.125, -10.3984375, -9.671875, -8.9453125, -8.21875, -7.4921875, -6.765625, -6.0390625, -5.3125, -4.5859375, -3.859375, -3.1328125, -2.40625, -1.6796875, -0.953125, -0.2265625, 0.5, 1.2265625, 1.953125, 2.6796875, 3.40625, 4.1328125, 4.859375, 5.5859375, 6.3125, 7.0390625, 7.765625, 8.4921875, 9.21875, 9.9453125, 10.671875, 11.3984375, 12.125, 12.8515625, 13.578125, 14.3046875, 15.03125, 15.7578125, 16.484375, 17.2109375, 17.9375, 18.6640625, 19.390625, 20.1171875, 20.84375, 21.5703125, 22.296875, 23.0234375, 23.75, 24.4765625, 25.203125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 9.0, 9.0, 14.0, 20.0, 16.0, 22.0, 43.0, 59.0, 87.0, 164.0, 271.0, 586.0, 2133.0, 17828.0, 1101553.0, 3035342.0, 31532.0, 3182.0, 740.0, 280.0, 138.0, 82.0, 52.0, 42.0, 22.0, 19.0, 12.0, 10.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.25, -87.6787109375, -85.107421875, -82.5361328125, -79.96484375, -77.3935546875, -74.822265625, -72.2509765625, -69.6796875, -67.1083984375, -64.537109375, -61.9658203125, -59.39453125, -56.8232421875, -54.251953125, -51.6806640625, -49.109375, -46.5380859375, -43.966796875, -41.3955078125, -38.82421875, -36.2529296875, -33.681640625, -31.1103515625, -28.5390625, -25.9677734375, -23.396484375, -20.8251953125, -18.25390625, -15.6826171875, -13.111328125, -10.5400390625, -7.96875, -5.3974609375, -2.826171875, -0.2548828125, 2.31640625, 4.8876953125, 7.458984375, 10.0302734375, 12.6015625, 15.1728515625, 17.744140625, 20.3154296875, 22.88671875, 25.4580078125, 28.029296875, 30.6005859375, 33.171875, 35.7431640625, 38.314453125, 40.8857421875, 43.45703125, 46.0283203125, 48.599609375, 51.1708984375, 53.7421875, 56.3134765625, 58.884765625, 61.4560546875, 64.02734375, 66.5986328125, 69.169921875, 71.7412109375, 74.3125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 11.0, 36.0, 76.0, 160.0, 268.0, 260.0, 129.0, 46.0, 16.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-294.4894104003906, -287.7291564941406, -280.96893310546875, -274.20867919921875, -267.44842529296875, -260.68817138671875, -253.9279327392578, -247.16769409179688, -240.40744018554688, -233.64718627929688, -226.88694763183594, -220.126708984375, -213.366455078125, -206.606201171875, -199.84596252441406, -193.08572387695312, -186.32546997070312, -179.56521606445312, -172.8049774169922, -166.04473876953125, -159.28448486328125, -152.52423095703125, -145.7639923095703, -139.00375366210938, -132.24349975585938, -125.4832534790039, -118.72300720214844, -111.96276092529297, -105.2025146484375, -98.44226837158203, -91.68202209472656, -84.9217758178711, -78.16154479980469, -71.40129852294922, -64.64105224609375, -57.88080596923828, -51.12055969238281, -44.360313415527344, -37.600067138671875, -30.839820861816406, -24.079574584960938, -17.31932830810547, -10.55908203125, -3.7988357543945312, 2.9614105224609375, 9.721656799316406, 16.481903076171875, 23.242149353027344, 30.002395629882812, 36.76264190673828, 43.52288818359375, 50.28313446044922, 57.04338073730469, 63.803627014160156, 70.56387329101562, 77.3241195678711, 84.08436584472656, 90.84461212158203, 97.6048583984375, 104.36510467529297, 111.12535095214844, 117.8855972290039, 124.64584350585938, 131.40609741210938, 138.1663360595703]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 3.0, 5.0, 7.0, 6.0, 7.0, 8.0, 17.0, 19.0, 16.0, 29.0, 24.0, 26.0, 36.0, 35.0, 24.0, 36.0, 51.0, 37.0, 38.0, 53.0, 46.0, 47.0, 49.0, 39.0, 43.0, 34.0, 41.0, 37.0, 36.0, 28.0, 26.0, 16.0, 23.0, 15.0, 11.0, 11.0, 8.0, 6.0, 5.0, 5.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.77525329589844, -69.49578857421875, -67.21632385253906, -64.93685913085938, -62.65739059448242, -60.377925872802734, -58.09845733642578, -55.818992614746094, -53.539527893066406, -51.26006317138672, -48.98059844970703, -46.70112991333008, -44.42166519165039, -42.1422004699707, -39.86273193359375, -37.58326721191406, -35.303802490234375, -33.02433776855469, -30.744871139526367, -28.465404510498047, -26.18593978881836, -23.906475067138672, -21.62700843811035, -19.34754180908203, -17.068077087402344, -14.78861141204834, -12.509145736694336, -10.229680061340332, -7.950214385986328, -5.670748710632324, -3.3912830352783203, -1.1118173599243164, 1.1676406860351562, 3.44710636138916, 5.726572036743164, 8.006037712097168, 10.285503387451172, 12.564969062805176, 14.84443473815918, 17.1239013671875, 19.403366088867188, 21.682830810546875, 23.962297439575195, 26.241764068603516, 28.521228790283203, 30.80069351196289, 33.080162048339844, 35.35962677001953, 37.63909149169922, 39.918556213378906, 42.198020935058594, 44.47748947143555, 46.756954193115234, 49.03641891479492, 51.315887451171875, 53.59535217285156, 55.87481689453125, 58.15428161621094, 60.433746337890625, 62.71321487426758, 64.99267578125, 67.27214813232422, 69.5516128540039, 71.8310775756836, 74.11054229736328]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 12.0, 5.0, 7.0, 11.0, 8.0, 17.0, 19.0, 36.0, 29.0, 32.0, 27.0, 43.0, 37.0, 37.0, 46.0, 53.0, 43.0, 54.0, 55.0, 50.0, 37.0, 42.0, 45.0, 27.0, 34.0, 27.0, 27.0, 20.0, 17.0, 16.0, 18.0, 12.0, 14.0, 2.0, 8.0, 11.0, 4.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0703125, -9.7401123046875, -9.409912109375, -9.0797119140625, -8.74951171875, -8.4193115234375, -8.089111328125, -7.7589111328125, -7.4287109375, -7.0985107421875, -6.768310546875, -6.4381103515625, -6.10791015625, -5.7777099609375, -5.447509765625, -5.1173095703125, -4.787109375, -4.4569091796875, -4.126708984375, -3.7965087890625, -3.46630859375, -3.1361083984375, -2.805908203125, -2.4757080078125, -2.1455078125, -1.8153076171875, -1.485107421875, -1.1549072265625, -0.82470703125, -0.4945068359375, -0.164306640625, 0.1658935546875, 0.49609375, 0.8262939453125, 1.156494140625, 1.4866943359375, 1.81689453125, 2.1470947265625, 2.477294921875, 2.8074951171875, 3.1376953125, 3.4678955078125, 3.798095703125, 4.1282958984375, 4.45849609375, 4.7886962890625, 5.118896484375, 5.4490966796875, 5.779296875, 6.1094970703125, 6.439697265625, 6.7698974609375, 7.10009765625, 7.4302978515625, 7.760498046875, 8.0906982421875, 8.4208984375, 8.7510986328125, 9.081298828125, 9.4114990234375, 9.74169921875, 10.0718994140625, 10.402099609375, 10.7322998046875, 11.0625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 4.0, 8.0, 11.0, 18.0, 27.0, 39.0, 75.0, 107.0, 154.0, 235.0, 357.0, 556.0, 830.0, 1279.0, 1955.0, 3077.0, 4758.0, 7493.0, 11534.0, 19209.0, 32398.0, 56959.0, 103772.0, 185598.0, 242630.0, 162172.0, 89497.0, 49067.0, 28638.0, 17010.0, 10334.0, 6569.0, 4344.0, 2744.0, 1761.0, 1150.0, 745.0, 500.0, 308.0, 236.0, 137.0, 83.0, 67.0, 48.0, 15.0, 15.0, 12.0, 9.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.3408203125, -1.299407958984375, -1.25799560546875, -1.216583251953125, -1.1751708984375, -1.133758544921875, -1.09234619140625, -1.050933837890625, -1.009521484375, -0.968109130859375, -0.92669677734375, -0.885284423828125, -0.8438720703125, -0.802459716796875, -0.76104736328125, -0.719635009765625, -0.67822265625, -0.636810302734375, -0.59539794921875, -0.553985595703125, -0.5125732421875, -0.471160888671875, -0.42974853515625, -0.388336181640625, -0.346923828125, -0.305511474609375, -0.26409912109375, -0.222686767578125, -0.1812744140625, -0.139862060546875, -0.09844970703125, -0.057037353515625, -0.015625, 0.025787353515625, 0.06719970703125, 0.108612060546875, 0.1500244140625, 0.191436767578125, 0.23284912109375, 0.274261474609375, 0.315673828125, 0.357086181640625, 0.39849853515625, 0.439910888671875, 0.4813232421875, 0.522735595703125, 0.56414794921875, 0.605560302734375, 0.64697265625, 0.688385009765625, 0.72979736328125, 0.771209716796875, 0.8126220703125, 0.854034423828125, 0.89544677734375, 0.936859130859375, 0.978271484375, 1.019683837890625, 1.06109619140625, 1.102508544921875, 1.1439208984375, 1.185333251953125, 1.22674560546875, 1.268157958984375, 1.3095703125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 7.0, 5.0, 14.0, 5.0, 12.0, 14.0, 9.0, 12.0, 15.0, 14.0, 33.0, 24.0, 28.0, 35.0, 30.0, 31.0, 40.0, 41.0, 36.0, 32.0, 47.0, 1061.0, 39.0, 44.0, 37.0, 37.0, 33.0, 23.0, 23.0, 20.0, 22.0, 21.0, 23.0, 19.0, 22.0, 19.0, 18.0, 14.0, 12.0, 8.0, 10.0, 12.0, 7.0, 3.0, 2.0, 1.0, 7.0, 2.0, 3.0, 2.0], "bins": [-6.45703125, -6.273681640625, -6.09033203125, -5.906982421875, -5.7236328125, -5.540283203125, -5.35693359375, -5.173583984375, -4.990234375, -4.806884765625, -4.62353515625, -4.440185546875, -4.2568359375, -4.073486328125, -3.89013671875, -3.706787109375, -3.5234375, -3.340087890625, -3.15673828125, -2.973388671875, -2.7900390625, -2.606689453125, -2.42333984375, -2.239990234375, -2.056640625, -1.873291015625, -1.68994140625, -1.506591796875, -1.3232421875, -1.139892578125, -0.95654296875, -0.773193359375, -0.58984375, -0.406494140625, -0.22314453125, -0.039794921875, 0.1435546875, 0.326904296875, 0.51025390625, 0.693603515625, 0.876953125, 1.060302734375, 1.24365234375, 1.427001953125, 1.6103515625, 1.793701171875, 1.97705078125, 2.160400390625, 2.34375, 2.527099609375, 2.71044921875, 2.893798828125, 3.0771484375, 3.260498046875, 3.44384765625, 3.627197265625, 3.810546875, 3.993896484375, 4.17724609375, 4.360595703125, 4.5439453125, 4.727294921875, 4.91064453125, 5.093994140625, 5.27734375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 5.0, 7.0, 11.0, 14.0, 30.0, 34.0, 63.0, 94.0, 138.0, 191.0, 275.0, 354.0, 603.0, 834.0, 1203.0, 1760.0, 2670.0, 3870.0, 5670.0, 8662.0, 12724.0, 19382.0, 29212.0, 45574.0, 72935.0, 117420.0, 266904.0, 1144568.0, 132226.0, 81705.0, 51188.0, 32720.0, 21045.0, 13928.0, 9453.0, 6352.0, 4302.0, 2914.0, 2031.0, 1272.0, 846.0, 595.0, 461.0, 310.0, 185.0, 144.0, 89.0, 51.0, 41.0, 20.0, 22.0, 16.0, 6.0, 4.0, 3.0, 4.0, 3.0], "bins": [-0.52392578125, -0.5085716247558594, -0.49321746826171875, -0.4778633117675781, -0.4625091552734375, -0.4471549987792969, -0.43180084228515625, -0.4164466857910156, -0.401092529296875, -0.3857383728027344, -0.37038421630859375, -0.3550300598144531, -0.3396759033203125, -0.3243217468261719, -0.30896759033203125, -0.2936134338378906, -0.27825927734375, -0.2629051208496094, -0.24755096435546875, -0.23219680786132812, -0.2168426513671875, -0.20148849487304688, -0.18613433837890625, -0.17078018188476562, -0.155426025390625, -0.14007186889648438, -0.12471771240234375, -0.10936355590820312, -0.0940093994140625, -0.07865524291992188, -0.06330108642578125, -0.047946929931640625, -0.0325927734375, -0.017238616943359375, -0.00188446044921875, 0.013469696044921875, 0.0288238525390625, 0.044178009033203125, 0.05953216552734375, 0.07488632202148438, 0.090240478515625, 0.10559463500976562, 0.12094879150390625, 0.13630294799804688, 0.1516571044921875, 0.16701126098632812, 0.18236541748046875, 0.19771957397460938, 0.21307373046875, 0.22842788696289062, 0.24378204345703125, 0.2591361999511719, 0.2744903564453125, 0.2898445129394531, 0.30519866943359375, 0.3205528259277344, 0.335906982421875, 0.3512611389160156, 0.36661529541015625, 0.3819694519042969, 0.3973236083984375, 0.4126777648925781, 0.42803192138671875, 0.4433860778808594, 0.458740234375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 1.0, 3.0, 3.0, 5.0, 8.0, 13.0, 13.0, 11.0, 9.0, 24.0, 14.0, 26.0, 32.0, 41.0, 42.0, 79.0, 277.0, 105.0, 74.0, 37.0, 25.0, 33.0, 21.0, 19.0, 9.0, 8.0, 12.0, 9.0, 9.0, 5.0, 11.0, 1.0, 2.0, 1.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.07940673828125, -0.07704448699951172, -0.07468223571777344, -0.07231998443603516, -0.06995773315429688, -0.0675954818725586, -0.06523323059082031, -0.06287097930908203, -0.06050872802734375, -0.05814647674560547, -0.05578422546386719, -0.053421974182128906, -0.051059722900390625, -0.048697471618652344, -0.04633522033691406, -0.04397296905517578, -0.0416107177734375, -0.03924846649169922, -0.03688621520996094, -0.034523963928222656, -0.032161712646484375, -0.029799461364746094, -0.027437210083007812, -0.02507495880126953, -0.02271270751953125, -0.02035045623779297, -0.017988204956054688, -0.015625953674316406, -0.013263702392578125, -0.010901451110839844, -0.008539199829101562, -0.006176948547363281, -0.003814697265625, -0.0014524459838867188, 0.0009098052978515625, 0.0032720565795898438, 0.005634307861328125, 0.007996559143066406, 0.010358810424804688, 0.012721061706542969, 0.01508331298828125, 0.01744556427001953, 0.019807815551757812, 0.022170066833496094, 0.024532318115234375, 0.026894569396972656, 0.029256820678710938, 0.03161907196044922, 0.0339813232421875, 0.03634357452392578, 0.03870582580566406, 0.041068077087402344, 0.043430328369140625, 0.045792579650878906, 0.04815483093261719, 0.05051708221435547, 0.05287933349609375, 0.05524158477783203, 0.05760383605957031, 0.059966087341308594, 0.062328338623046875, 0.06469058990478516, 0.06705284118652344, 0.06941509246826172, 0.07177734375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 9.0, 8.0, 9.0, 15.0, 8.0, 21.0, 19.0, 40.0, 78.0, 109.0, 210.0, 961.0, 233955.0, 811245.0, 1263.0, 222.0, 113.0, 74.0, 50.0, 25.0, 18.0, 14.0, 15.0, 13.0, 11.0, 3.0, 5.0, 7.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.91015625, -1.85235595703125, -1.7945556640625, -1.73675537109375, -1.678955078125, -1.62115478515625, -1.5633544921875, -1.50555419921875, -1.44775390625, -1.38995361328125, -1.3321533203125, -1.27435302734375, -1.216552734375, -1.15875244140625, -1.1009521484375, -1.04315185546875, -0.9853515625, -0.92755126953125, -0.8697509765625, -0.81195068359375, -0.754150390625, -0.69635009765625, -0.6385498046875, -0.58074951171875, -0.52294921875, -0.46514892578125, -0.4073486328125, -0.34954833984375, -0.291748046875, -0.23394775390625, -0.1761474609375, -0.11834716796875, -0.060546875, -0.00274658203125, 0.0550537109375, 0.11285400390625, 0.170654296875, 0.22845458984375, 0.2862548828125, 0.34405517578125, 0.40185546875, 0.45965576171875, 0.5174560546875, 0.57525634765625, 0.633056640625, 0.69085693359375, 0.7486572265625, 0.80645751953125, 0.8642578125, 0.92205810546875, 0.9798583984375, 1.03765869140625, 1.095458984375, 1.15325927734375, 1.2110595703125, 1.26885986328125, 1.32666015625, 1.38446044921875, 1.4422607421875, 1.50006103515625, 1.557861328125, 1.61566162109375, 1.6734619140625, 1.73126220703125, 1.7890625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 12.0, 28.0, 39.0, 157.0, 394.0, 224.0, 86.0, 42.0, 14.0, 8.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42340564727783203, -0.4086211025714874, -0.39383652806282043, -0.37905198335647583, -0.3642674386501312, -0.3494828939437866, -0.33469831943511963, -0.319913774728775, -0.3051292300224304, -0.2903446853160858, -0.2755601108074188, -0.2607755661010742, -0.24599102139472961, -0.23120646178722382, -0.21642190217971802, -0.2016373574733734, -0.18685279786586761, -0.17206823825836182, -0.1572836935520172, -0.1424991339445114, -0.1277145892381668, -0.11293002963066101, -0.09814547747373581, -0.08336092531681061, -0.0685763731598854, -0.053791821002960205, -0.039007268846035004, -0.024222712963819504, -0.009438160806894302, 0.0053463950753211975, 0.0201309472322464, 0.0349154993891716, 0.0497000515460968, 0.064484603703022, 0.0792691558599472, 0.094053715467453, 0.10883826017379761, 0.1236228197813034, 0.1384073793888092, 0.1531919240951538, 0.1679764688014984, 0.1827610284090042, 0.19754557311534882, 0.21233013272285461, 0.22711467742919922, 0.24189923703670502, 0.2566837966442108, 0.2714683413505554, 0.2862529158592224, 0.301037460565567, 0.315822035074234, 0.3306065797805786, 0.3453911244869232, 0.3601756691932678, 0.3749602437019348, 0.3897447884082794, 0.404529333114624, 0.41931387782096863, 0.4340984523296356, 0.4488829970359802, 0.46366754174232483, 0.47845208644866943, 0.4932366609573364, 0.5080212354660034, 0.5228057503700256]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 7.0, 3.0, 6.0, 7.0, 6.0, 12.0, 8.0, 5.0, 7.0, 12.0, 16.0, 12.0, 16.0, 20.0, 23.0, 16.0, 33.0, 21.0, 22.0, 33.0, 37.0, 36.0, 39.0, 42.0, 32.0, 40.0, 25.0, 39.0, 38.0, 40.0, 44.0, 33.0, 33.0, 26.0, 20.0, 20.0, 15.0, 26.0, 19.0, 18.0, 14.0, 16.0, 14.0, 15.0, 7.0, 14.0, 2.0, 9.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11607164144515991, -0.11205572634935379, -0.10803981125354767, -0.10402388870716095, -0.10000797361135483, -0.0959920585155487, -0.09197613596916199, -0.08796022087335587, -0.08394430577754974, -0.07992839068174362, -0.0759124755859375, -0.07189655303955078, -0.06788063794374466, -0.06386472284793854, -0.05984880402684212, -0.0558328852057457, -0.051816970109939575, -0.04780105501413345, -0.04378513619303703, -0.03976921737194061, -0.03575330227613449, -0.03173738718032837, -0.02772146835923195, -0.023705551400780678, -0.019689634442329407, -0.015673717483878136, -0.011657800525426865, -0.007641883566975594, -0.0036259666085243225, 0.00038995034992694855, 0.00440586730837822, 0.00842178426682949, 0.012437701225280762, 0.016453618183732033, 0.020469535142183304, 0.024485452100634575, 0.028501369059085846, 0.03251728415489197, 0.03653320297598839, 0.04054912179708481, 0.04456503689289093, 0.04858095198869705, 0.05259687080979347, 0.05661278963088989, 0.060628704726696014, 0.06464461982250214, 0.06866054236888885, 0.07267645746469498, 0.0766923725605011, 0.08070828765630722, 0.08472420275211334, 0.08874012529850006, 0.09275604039430618, 0.0967719554901123, 0.10078787803649902, 0.10480379313230515, 0.10881970822811127, 0.11283562332391739, 0.11685153841972351, 0.12086746096611023, 0.12488337606191635, 0.12889929115772247, 0.1329152137041092, 0.13693112134933472, 0.14094704389572144]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 12.0, 5.0, 7.0, 11.0, 8.0, 16.0, 20.0, 35.0, 30.0, 32.0, 26.0, 44.0, 36.0, 38.0, 46.0, 51.0, 45.0, 54.0, 55.0, 48.0, 39.0, 42.0, 44.0, 28.0, 33.0, 27.0, 26.0, 21.0, 18.0, 16.0, 17.0, 13.0, 12.0, 4.0, 8.0, 10.0, 5.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0703125, -9.740234375, -9.41015625, -9.080078125, -8.75, -8.419921875, -8.08984375, -7.759765625, -7.4296875, -7.099609375, -6.76953125, -6.439453125, -6.109375, -5.779296875, -5.44921875, -5.119140625, -4.7890625, -4.458984375, -4.12890625, -3.798828125, -3.46875, -3.138671875, -2.80859375, -2.478515625, -2.1484375, -1.818359375, -1.48828125, -1.158203125, -0.828125, -0.498046875, -0.16796875, 0.162109375, 0.4921875, 0.822265625, 1.15234375, 1.482421875, 1.8125, 2.142578125, 2.47265625, 2.802734375, 3.1328125, 3.462890625, 3.79296875, 4.123046875, 4.453125, 4.783203125, 5.11328125, 5.443359375, 5.7734375, 6.103515625, 6.43359375, 6.763671875, 7.09375, 7.423828125, 7.75390625, 8.083984375, 8.4140625, 8.744140625, 9.07421875, 9.404296875, 9.734375, 10.064453125, 10.39453125, 10.724609375, 11.0546875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 9.0, 7.0, 15.0, 12.0, 16.0, 19.0, 40.0, 66.0, 102.0, 157.0, 274.0, 387.0, 716.0, 1168.0, 2156.0, 3960.0, 7185.0, 14186.0, 27716.0, 56594.0, 125656.0, 303426.0, 282340.0, 115265.0, 52310.0, 26168.0, 13097.0, 6908.0, 3726.0, 2004.0, 1098.0, 668.0, 387.0, 259.0, 145.0, 90.0, 71.0, 52.0, 20.0, 25.0, 16.0, 16.0, 6.0, 7.0, 5.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-11.015625, -10.691162109375, -10.36669921875, -10.042236328125, -9.7177734375, -9.393310546875, -9.06884765625, -8.744384765625, -8.419921875, -8.095458984375, -7.77099609375, -7.446533203125, -7.1220703125, -6.797607421875, -6.47314453125, -6.148681640625, -5.82421875, -5.499755859375, -5.17529296875, -4.850830078125, -4.5263671875, -4.201904296875, -3.87744140625, -3.552978515625, -3.228515625, -2.904052734375, -2.57958984375, -2.255126953125, -1.9306640625, -1.606201171875, -1.28173828125, -0.957275390625, -0.6328125, -0.308349609375, 0.01611328125, 0.340576171875, 0.6650390625, 0.989501953125, 1.31396484375, 1.638427734375, 1.962890625, 2.287353515625, 2.61181640625, 2.936279296875, 3.2607421875, 3.585205078125, 3.90966796875, 4.234130859375, 4.55859375, 4.883056640625, 5.20751953125, 5.531982421875, 5.8564453125, 6.180908203125, 6.50537109375, 6.829833984375, 7.154296875, 7.478759765625, 7.80322265625, 8.127685546875, 8.4521484375, 8.776611328125, 9.10107421875, 9.425537109375, 9.75]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 1.0, 2.0, 7.0, 5.0, 11.0, 18.0, 16.0, 21.0, 11.0, 19.0, 26.0, 21.0, 26.0, 26.0, 35.0, 38.0, 46.0, 53.0, 71.0, 89.0, 197.0, 1406.0, 282.0, 115.0, 69.0, 61.0, 54.0, 40.0, 47.0, 40.0, 27.0, 29.0, 17.0, 24.0, 20.0, 14.0, 20.0, 10.0, 7.0, 6.0, 7.0, 4.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.515625, -24.686279296875, -23.85693359375, -23.027587890625, -22.1982421875, -21.368896484375, -20.53955078125, -19.710205078125, -18.880859375, -18.051513671875, -17.22216796875, -16.392822265625, -15.5634765625, -14.734130859375, -13.90478515625, -13.075439453125, -12.24609375, -11.416748046875, -10.58740234375, -9.758056640625, -8.9287109375, -8.099365234375, -7.27001953125, -6.440673828125, -5.611328125, -4.781982421875, -3.95263671875, -3.123291015625, -2.2939453125, -1.464599609375, -0.63525390625, 0.194091796875, 1.0234375, 1.852783203125, 2.68212890625, 3.511474609375, 4.3408203125, 5.170166015625, 5.99951171875, 6.828857421875, 7.658203125, 8.487548828125, 9.31689453125, 10.146240234375, 10.9755859375, 11.804931640625, 12.63427734375, 13.463623046875, 14.29296875, 15.122314453125, 15.95166015625, 16.781005859375, 17.6103515625, 18.439697265625, 19.26904296875, 20.098388671875, 20.927734375, 21.757080078125, 22.58642578125, 23.415771484375, 24.2451171875, 25.074462890625, 25.90380859375, 26.733154296875, 27.5625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 4.0, 5.0, 12.0, 9.0, 14.0, 11.0, 15.0, 33.0, 29.0, 47.0, 50.0, 62.0, 90.0, 125.0, 190.0, 295.0, 588.0, 1322.0, 4921.0, 35379.0, 829135.0, 2199224.0, 63565.0, 7178.0, 1672.0, 617.0, 346.0, 195.0, 133.0, 103.0, 72.0, 66.0, 42.0, 26.0, 24.0, 26.0, 20.0, 16.0, 8.0, 12.0, 7.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.0625, -40.82958984375, -39.5966796875, -38.36376953125, -37.130859375, -35.89794921875, -34.6650390625, -33.43212890625, -32.19921875, -30.96630859375, -29.7333984375, -28.50048828125, -27.267578125, -26.03466796875, -24.8017578125, -23.56884765625, -22.3359375, -21.10302734375, -19.8701171875, -18.63720703125, -17.404296875, -16.17138671875, -14.9384765625, -13.70556640625, -12.47265625, -11.23974609375, -10.0068359375, -8.77392578125, -7.541015625, -6.30810546875, -5.0751953125, -3.84228515625, -2.609375, -1.37646484375, -0.1435546875, 1.08935546875, 2.322265625, 3.55517578125, 4.7880859375, 6.02099609375, 7.25390625, 8.48681640625, 9.7197265625, 10.95263671875, 12.185546875, 13.41845703125, 14.6513671875, 15.88427734375, 17.1171875, 18.35009765625, 19.5830078125, 20.81591796875, 22.048828125, 23.28173828125, 24.5146484375, 25.74755859375, 26.98046875, 28.21337890625, 29.4462890625, 30.67919921875, 31.912109375, 33.14501953125, 34.3779296875, 35.61083984375, 36.84375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 233.0, 750.0, 31.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.6969985961914, -75.49006652832031, -61.283138275146484, -47.076210021972656, -32.86927795410156, -18.66234588623047, -4.455421447753906, 9.751510620117188, 23.95844268798828, 38.165374755859375, 52.3723030090332, 66.57923126220703, 80.78616333007812, 94.99309539794922, 109.20001983642578, 123.40695190429688, 137.6138916015625, 151.82081604003906, 166.0277557373047, 180.23468017578125, 194.44161987304688, 208.64854431152344, 222.85546875, 237.06240844726562, 251.26931762695312, 265.47625732421875, 279.68316650390625, 293.8901062011719, 308.0970458984375, 322.303955078125, 336.5108947753906, 350.71783447265625, 364.92474365234375, 379.1316833496094, 393.3385925292969, 407.5455322265625, 421.7524719238281, 435.95941162109375, 450.16632080078125, 464.3732604980469, 478.5802001953125, 492.7871398925781, 506.9940490722656, 521.2009887695312, 535.4078979492188, 549.6148681640625, 563.82177734375, 578.0286865234375, 592.235595703125, 606.4425048828125, 620.6494750976562, 634.8563842773438, 649.0632934570312, 663.270263671875, 677.4771728515625, 691.68408203125, 705.8910522460938, 720.0979614257812, 734.304931640625, 748.5118408203125, 762.71875, 776.9257202148438, 791.1326293945312, 805.3395385742188, 819.5465087890625]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 6.0, 8.0, 4.0, 5.0, 8.0, 9.0, 9.0, 11.0, 16.0, 14.0, 17.0, 24.0, 23.0, 34.0, 27.0, 35.0, 29.0, 49.0, 41.0, 34.0, 37.0, 49.0, 55.0, 53.0, 51.0, 42.0, 26.0, 30.0, 37.0, 28.0, 26.0, 28.0, 23.0, 18.0, 15.0, 12.0, 15.0, 12.0, 15.0, 8.0, 4.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-85.1396484375, -82.82827758789062, -80.51690673828125, -78.2055435180664, -75.89417266845703, -73.58280181884766, -71.27143859863281, -68.96006774902344, -66.64869689941406, -64.33732604980469, -62.02595901489258, -59.71459197998047, -57.403221130371094, -55.09185028076172, -52.78048324584961, -50.4691162109375, -48.157745361328125, -45.84637451171875, -43.53500747680664, -41.22364044189453, -38.912269592285156, -36.60089874267578, -34.28953170776367, -31.97816276550293, -29.666793823242188, -27.355424880981445, -25.044055938720703, -22.73268699645996, -20.42131805419922, -18.109949111938477, -15.798580169677734, -13.487211227416992, -11.17584228515625, -8.864473342895508, -6.553104400634766, -4.241735458374023, -1.9303665161132812, 0.38100242614746094, 2.692371368408203, 5.003740310668945, 7.3151092529296875, 9.62647819519043, 11.937847137451172, 14.249216079711914, 16.560585021972656, 18.8719539642334, 21.18332290649414, 23.494691848754883, 25.806060791015625, 28.117429733276367, 30.42879867553711, 32.74016571044922, 35.051536560058594, 37.36290740966797, 39.67427444458008, 41.98564147949219, 44.29701232910156, 46.60838317871094, 48.91975021362305, 51.231117248535156, 53.54248809814453, 55.853858947753906, 58.165225982666016, 60.476593017578125, 62.7879638671875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 4.0, 6.0, 5.0, 11.0, 9.0, 11.0, 17.0, 19.0, 22.0, 26.0, 41.0, 33.0, 47.0, 34.0, 47.0, 45.0, 47.0, 49.0, 49.0, 46.0, 43.0, 40.0, 48.0, 36.0, 38.0, 34.0, 30.0, 20.0, 26.0, 21.0, 18.0, 16.0, 10.0, 6.0, 10.0, 9.0, 10.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.265625, -9.9200439453125, -9.574462890625, -9.2288818359375, -8.88330078125, -8.5377197265625, -8.192138671875, -7.8465576171875, -7.5009765625, -7.1553955078125, -6.809814453125, -6.4642333984375, -6.11865234375, -5.7730712890625, -5.427490234375, -5.0819091796875, -4.736328125, -4.3907470703125, -4.045166015625, -3.6995849609375, -3.35400390625, -3.0084228515625, -2.662841796875, -2.3172607421875, -1.9716796875, -1.6260986328125, -1.280517578125, -0.9349365234375, -0.58935546875, -0.2437744140625, 0.101806640625, 0.4473876953125, 0.79296875, 1.1385498046875, 1.484130859375, 1.8297119140625, 2.17529296875, 2.5208740234375, 2.866455078125, 3.2120361328125, 3.5576171875, 3.9031982421875, 4.248779296875, 4.5943603515625, 4.93994140625, 5.2855224609375, 5.631103515625, 5.9766845703125, 6.322265625, 6.6678466796875, 7.013427734375, 7.3590087890625, 7.70458984375, 8.0501708984375, 8.395751953125, 8.7413330078125, 9.0869140625, 9.4324951171875, 9.778076171875, 10.1236572265625, 10.46923828125, 10.8148193359375, 11.160400390625, 11.5059814453125, 11.8515625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 11.0, 12.0, 19.0, 23.0, 29.0, 58.0, 55.0, 106.0, 174.0, 296.0, 447.0, 837.0, 1403.0, 2532.0, 5227.0, 11761.0, 34074.0, 205853.0, 2468379.0, 1317400.0, 103420.0, 23752.0, 9277.0, 4233.0, 2185.0, 1103.0, 614.0, 358.0, 229.0, 133.0, 97.0, 45.0, 39.0, 19.0, 18.0, 16.0, 17.0, 9.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-28.203125, -27.344482421875, -26.48583984375, -25.627197265625, -24.7685546875, -23.909912109375, -23.05126953125, -22.192626953125, -21.333984375, -20.475341796875, -19.61669921875, -18.758056640625, -17.8994140625, -17.040771484375, -16.18212890625, -15.323486328125, -14.46484375, -13.606201171875, -12.74755859375, -11.888916015625, -11.0302734375, -10.171630859375, -9.31298828125, -8.454345703125, -7.595703125, -6.737060546875, -5.87841796875, -5.019775390625, -4.1611328125, -3.302490234375, -2.44384765625, -1.585205078125, -0.7265625, 0.132080078125, 0.99072265625, 1.849365234375, 2.7080078125, 3.566650390625, 4.42529296875, 5.283935546875, 6.142578125, 7.001220703125, 7.85986328125, 8.718505859375, 9.5771484375, 10.435791015625, 11.29443359375, 12.153076171875, 13.01171875, 13.870361328125, 14.72900390625, 15.587646484375, 16.4462890625, 17.304931640625, 18.16357421875, 19.022216796875, 19.880859375, 20.739501953125, 21.59814453125, 22.456787109375, 23.3154296875, 24.174072265625, 25.03271484375, 25.891357421875, 26.75]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 8.0, 9.0, 10.0, 12.0, 18.0, 20.0, 33.0, 48.0, 65.0, 85.0, 149.0, 201.0, 388.0, 523.0, 732.0, 564.0, 370.0, 266.0, 156.0, 130.0, 86.0, 56.0, 43.0, 25.0, 21.0, 14.0, 10.0, 11.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.34375, -19.6787109375, -19.013671875, -18.3486328125, -17.68359375, -17.0185546875, -16.353515625, -15.6884765625, -15.0234375, -14.3583984375, -13.693359375, -13.0283203125, -12.36328125, -11.6982421875, -11.033203125, -10.3681640625, -9.703125, -9.0380859375, -8.373046875, -7.7080078125, -7.04296875, -6.3779296875, -5.712890625, -5.0478515625, -4.3828125, -3.7177734375, -3.052734375, -2.3876953125, -1.72265625, -1.0576171875, -0.392578125, 0.2724609375, 0.9375, 1.6025390625, 2.267578125, 2.9326171875, 3.59765625, 4.2626953125, 4.927734375, 5.5927734375, 6.2578125, 6.9228515625, 7.587890625, 8.2529296875, 8.91796875, 9.5830078125, 10.248046875, 10.9130859375, 11.578125, 12.2431640625, 12.908203125, 13.5732421875, 14.23828125, 14.9033203125, 15.568359375, 16.2333984375, 16.8984375, 17.5634765625, 18.228515625, 18.8935546875, 19.55859375, 20.2236328125, 20.888671875, 21.5537109375, 22.21875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 12.0, 7.0, 9.0, 15.0, 32.0, 40.0, 65.0, 101.0, 183.0, 284.0, 614.0, 1558.0, 6273.0, 44772.0, 2374826.0, 1718984.0, 38201.0, 5580.0, 1514.0, 519.0, 281.0, 147.0, 89.0, 50.0, 31.0, 26.0, 20.0, 15.0, 11.0, 6.0, 2.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-70.375, -68.240234375, -66.10546875, -63.970703125, -61.8359375, -59.701171875, -57.56640625, -55.431640625, -53.296875, -51.162109375, -49.02734375, -46.892578125, -44.7578125, -42.623046875, -40.48828125, -38.353515625, -36.21875, -34.083984375, -31.94921875, -29.814453125, -27.6796875, -25.544921875, -23.41015625, -21.275390625, -19.140625, -17.005859375, -14.87109375, -12.736328125, -10.6015625, -8.466796875, -6.33203125, -4.197265625, -2.0625, 0.072265625, 2.20703125, 4.341796875, 6.4765625, 8.611328125, 10.74609375, 12.880859375, 15.015625, 17.150390625, 19.28515625, 21.419921875, 23.5546875, 25.689453125, 27.82421875, 29.958984375, 32.09375, 34.228515625, 36.36328125, 38.498046875, 40.6328125, 42.767578125, 44.90234375, 47.037109375, 49.171875, 51.306640625, 53.44140625, 55.576171875, 57.7109375, 59.845703125, 61.98046875, 64.115234375, 66.25]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 9.0, 26.0, 62.0, 134.0, 202.0, 237.0, 166.0, 101.0, 53.0, 18.0, 6.0, 1.0, 1.0, 0.0, 2.0], "bins": [-302.11712646484375, -296.54266357421875, -290.9681701660156, -285.3937072753906, -279.8192443847656, -274.2447509765625, -268.6702880859375, -263.0958251953125, -257.5213317871094, -251.9468536376953, -246.3723907470703, -240.79791259765625, -235.2234344482422, -229.6489715576172, -224.07449340820312, -218.50003051757812, -212.92556762695312, -207.35108947753906, -201.77662658691406, -196.2021484375, -190.62767028808594, -185.05320739746094, -179.47872924804688, -173.90426635742188, -168.32977294921875, -162.7552947998047, -157.1808319091797, -151.60635375976562, -146.03187561035156, -140.45741271972656, -134.8829345703125, -129.3084716796875, -123.73399353027344, -118.1595230102539, -112.58504486083984, -107.01057434082031, -101.43610382080078, -95.86163330078125, -90.28715515136719, -84.71268463134766, -79.13821411132812, -73.5637435913086, -67.98926544189453, -62.414794921875, -56.84032440185547, -51.26585006713867, -45.691375732421875, -40.116905212402344, -34.54242706298828, -28.967954635620117, -23.393482208251953, -17.819007873535156, -12.244535446166992, -6.670063018798828, -1.0955886840820312, 4.4788818359375, 10.053356170654297, 15.627828598022461, 21.202301025390625, 26.776775360107422, 32.35124969482422, 37.92572021484375, 43.50019454956055, 49.07466506958008, 54.649139404296875]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 8.0, 7.0, 5.0, 10.0, 23.0, 15.0, 15.0, 25.0, 21.0, 24.0, 21.0, 30.0, 21.0, 40.0, 41.0, 39.0, 29.0, 40.0, 39.0, 58.0, 30.0, 37.0, 33.0, 39.0, 35.0, 30.0, 48.0, 31.0, 35.0, 29.0, 20.0, 17.0, 15.0, 14.0, 7.0, 12.0, 10.0, 6.0, 13.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-53.73297882080078, -52.03872299194336, -50.34446334838867, -48.65020751953125, -46.95594787597656, -45.26169204711914, -43.56743621826172, -41.87317657470703, -40.17892074584961, -38.48466491699219, -36.7904052734375, -35.09614944458008, -33.40188980102539, -31.70763397216797, -30.013376235961914, -28.31911849975586, -26.624860763549805, -24.93060302734375, -23.236345291137695, -21.54208755493164, -19.84783172607422, -18.153573989868164, -16.45931625366211, -14.765059471130371, -13.070801734924316, -11.376543998718262, -9.682287216186523, -7.988029479980469, -6.293772220611572, -4.599514961242676, -2.905257225036621, -1.2110004425048828, 0.4832572937011719, 2.1775145530700684, 3.871772050857544, 5.5660295486450195, 7.260286808013916, 8.954544067382812, 10.648801803588867, 12.343058586120605, 14.03731632232666, 15.731574058532715, 17.425830841064453, 19.120088577270508, 20.814346313476562, 22.508602142333984, 24.202861785888672, 25.897117614746094, 27.59137535095215, 29.285633087158203, 30.979890823364258, 32.67414855957031, 34.368404388427734, 36.062660217285156, 37.756919860839844, 39.451175689697266, 41.14543533325195, 42.839691162109375, 44.53395080566406, 46.228206634521484, 47.92246627807617, 49.616722106933594, 51.31098175048828, 53.0052375793457, 54.699493408203125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 2.0, 5.0, 2.0, 7.0, 6.0, 8.0, 8.0, 11.0, 20.0, 15.0, 23.0, 36.0, 38.0, 32.0, 37.0, 30.0, 49.0, 48.0, 41.0, 34.0, 43.0, 48.0, 43.0, 50.0, 39.0, 39.0, 33.0, 45.0, 32.0, 23.0, 33.0, 18.0, 17.0, 11.0, 18.0, 9.0, 10.0, 9.0, 10.0, 5.0, 8.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3515625, -10.007568359375, -9.66357421875, -9.319580078125, -8.9755859375, -8.631591796875, -8.28759765625, -7.943603515625, -7.599609375, -7.255615234375, -6.91162109375, -6.567626953125, -6.2236328125, -5.879638671875, -5.53564453125, -5.191650390625, -4.84765625, -4.503662109375, -4.15966796875, -3.815673828125, -3.4716796875, -3.127685546875, -2.78369140625, -2.439697265625, -2.095703125, -1.751708984375, -1.40771484375, -1.063720703125, -0.7197265625, -0.375732421875, -0.03173828125, 0.312255859375, 0.65625, 1.000244140625, 1.34423828125, 1.688232421875, 2.0322265625, 2.376220703125, 2.72021484375, 3.064208984375, 3.408203125, 3.752197265625, 4.09619140625, 4.440185546875, 4.7841796875, 5.128173828125, 5.47216796875, 5.816162109375, 6.16015625, 6.504150390625, 6.84814453125, 7.192138671875, 7.5361328125, 7.880126953125, 8.22412109375, 8.568115234375, 8.912109375, 9.256103515625, 9.60009765625, 9.944091796875, 10.2880859375, 10.632080078125, 10.97607421875, 11.320068359375, 11.6640625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 5.0, 9.0, 13.0, 15.0, 42.0, 59.0, 74.0, 138.0, 198.0, 306.0, 523.0, 744.0, 1381.0, 2260.0, 3879.0, 6645.0, 11851.0, 21639.0, 40271.0, 78787.0, 156452.0, 268054.0, 216997.0, 112964.0, 57193.0, 30124.0, 16176.0, 9027.0, 5067.0, 3068.0, 1800.0, 1104.0, 624.0, 401.0, 235.0, 146.0, 107.0, 71.0, 36.0, 19.0, 18.0, 15.0, 3.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-1.7998046875, -1.7480316162109375, -1.696258544921875, -1.6444854736328125, -1.59271240234375, -1.5409393310546875, -1.489166259765625, -1.4373931884765625, -1.3856201171875, -1.3338470458984375, -1.282073974609375, -1.2303009033203125, -1.17852783203125, -1.1267547607421875, -1.074981689453125, -1.0232086181640625, -0.971435546875, -0.9196624755859375, -0.867889404296875, -0.8161163330078125, -0.76434326171875, -0.7125701904296875, -0.660797119140625, -0.6090240478515625, -0.5572509765625, -0.5054779052734375, -0.453704833984375, -0.4019317626953125, -0.35015869140625, -0.2983856201171875, -0.246612548828125, -0.1948394775390625, -0.14306640625, -0.0912933349609375, -0.039520263671875, 0.0122528076171875, 0.06402587890625, 0.1157989501953125, 0.167572021484375, 0.2193450927734375, 0.2711181640625, 0.3228912353515625, 0.374664306640625, 0.4264373779296875, 0.47821044921875, 0.5299835205078125, 0.581756591796875, 0.6335296630859375, 0.685302734375, 0.7370758056640625, 0.788848876953125, 0.8406219482421875, 0.89239501953125, 0.9441680908203125, 0.995941162109375, 1.0477142333984375, 1.0994873046875, 1.1512603759765625, 1.203033447265625, 1.2548065185546875, 1.30657958984375, 1.3583526611328125, 1.410125732421875, 1.4618988037109375, 1.513671875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 3.0, 7.0, 8.0, 10.0, 13.0, 12.0, 21.0, 24.0, 29.0, 24.0, 28.0, 31.0, 41.0, 36.0, 43.0, 42.0, 41.0, 37.0, 1072.0, 51.0, 47.0, 46.0, 45.0, 44.0, 39.0, 38.0, 22.0, 29.0, 23.0, 23.0, 23.0, 19.0, 20.0, 6.0, 6.0, 5.0, 5.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0], "bins": [-8.5703125, -8.3492431640625, -8.128173828125, -7.9071044921875, -7.68603515625, -7.4649658203125, -7.243896484375, -7.0228271484375, -6.8017578125, -6.5806884765625, -6.359619140625, -6.1385498046875, -5.91748046875, -5.6964111328125, -5.475341796875, -5.2542724609375, -5.033203125, -4.8121337890625, -4.591064453125, -4.3699951171875, -4.14892578125, -3.9278564453125, -3.706787109375, -3.4857177734375, -3.2646484375, -3.0435791015625, -2.822509765625, -2.6014404296875, -2.38037109375, -2.1593017578125, -1.938232421875, -1.7171630859375, -1.49609375, -1.2750244140625, -1.053955078125, -0.8328857421875, -0.61181640625, -0.3907470703125, -0.169677734375, 0.0513916015625, 0.2724609375, 0.4935302734375, 0.714599609375, 0.9356689453125, 1.15673828125, 1.3778076171875, 1.598876953125, 1.8199462890625, 2.041015625, 2.2620849609375, 2.483154296875, 2.7042236328125, 2.92529296875, 3.1463623046875, 3.367431640625, 3.5885009765625, 3.8095703125, 4.0306396484375, 4.251708984375, 4.4727783203125, 4.69384765625, 4.9149169921875, 5.135986328125, 5.3570556640625, 5.578125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 9.0, 10.0, 12.0, 24.0, 23.0, 49.0, 78.0, 120.0, 182.0, 285.0, 396.0, 605.0, 979.0, 1510.0, 2268.0, 3605.0, 5612.0, 8933.0, 14644.0, 24475.0, 41054.0, 71419.0, 123357.0, 279157.0, 1177236.0, 141214.0, 80973.0, 46700.0, 27522.0, 16727.0, 10186.0, 6373.0, 4116.0, 2551.0, 1613.0, 1057.0, 697.0, 472.0, 313.0, 206.0, 124.0, 73.0, 60.0, 37.0, 26.0, 21.0, 8.0, 6.0, 8.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5703125, -0.5519866943359375, -0.533660888671875, -0.5153350830078125, -0.49700927734375, -0.4786834716796875, -0.460357666015625, -0.4420318603515625, -0.4237060546875, -0.4053802490234375, -0.387054443359375, -0.3687286376953125, -0.35040283203125, -0.3320770263671875, -0.313751220703125, -0.2954254150390625, -0.277099609375, -0.2587738037109375, -0.240447998046875, -0.2221221923828125, -0.20379638671875, -0.1854705810546875, -0.167144775390625, -0.1488189697265625, -0.1304931640625, -0.1121673583984375, -0.093841552734375, -0.0755157470703125, -0.05718994140625, -0.0388641357421875, -0.020538330078125, -0.0022125244140625, 0.01611328125, 0.0344390869140625, 0.052764892578125, 0.0710906982421875, 0.08941650390625, 0.1077423095703125, 0.126068115234375, 0.1443939208984375, 0.1627197265625, 0.1810455322265625, 0.199371337890625, 0.2176971435546875, 0.23602294921875, 0.2543487548828125, 0.272674560546875, 0.2910003662109375, 0.309326171875, 0.3276519775390625, 0.345977783203125, 0.3643035888671875, 0.38262939453125, 0.4009552001953125, 0.419281005859375, 0.4376068115234375, 0.4559326171875, 0.4742584228515625, 0.492584228515625, 0.5109100341796875, 0.52923583984375, 0.5475616455078125, 0.565887451171875, 0.5842132568359375, 0.6025390625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 4.0, 6.0, 5.0, 6.0, 10.0, 12.0, 12.0, 20.0, 34.0, 34.0, 45.0, 57.0, 81.0, 171.0, 176.0, 89.0, 54.0, 43.0, 23.0, 19.0, 19.0, 10.0, 15.0, 11.0, 9.0, 6.0, 4.0, 2.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0726318359375, -0.07012653350830078, -0.06762123107910156, -0.06511592864990234, -0.06261062622070312, -0.060105323791503906, -0.05760002136230469, -0.05509471893310547, -0.05258941650390625, -0.05008411407470703, -0.04757881164550781, -0.045073509216308594, -0.042568206787109375, -0.040062904357910156, -0.03755760192871094, -0.03505229949951172, -0.0325469970703125, -0.03004169464111328, -0.027536392211914062, -0.025031089782714844, -0.022525787353515625, -0.020020484924316406, -0.017515182495117188, -0.015009880065917969, -0.01250457763671875, -0.009999275207519531, -0.0074939727783203125, -0.004988670349121094, -0.002483367919921875, 2.193450927734375e-05, 0.0025272369384765625, 0.005032539367675781, 0.007537841796875, 0.010043144226074219, 0.012548446655273438, 0.015053749084472656, 0.017559051513671875, 0.020064353942871094, 0.022569656372070312, 0.02507495880126953, 0.02758026123046875, 0.03008556365966797, 0.03259086608886719, 0.035096168518066406, 0.037601470947265625, 0.040106773376464844, 0.04261207580566406, 0.04511737823486328, 0.0476226806640625, 0.05012798309326172, 0.05263328552246094, 0.055138587951660156, 0.057643890380859375, 0.060149192810058594, 0.06265449523925781, 0.06515979766845703, 0.06766510009765625, 0.07017040252685547, 0.07267570495605469, 0.0751810073852539, 0.07768630981445312, 0.08019161224365234, 0.08269691467285156, 0.08520221710205078, 0.08770751953125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 3.0, 9.0, 4.0, 9.0, 10.0, 20.0, 16.0, 22.0, 37.0, 44.0, 97.0, 275.0, 1311.0, 669432.0, 375449.0, 1227.0, 264.0, 100.0, 72.0, 43.0, 25.0, 16.0, 16.0, 10.0, 10.0, 3.0, 6.0, 3.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.08984375, -2.0301055908203125, -1.970367431640625, -1.9106292724609375, -1.85089111328125, -1.7911529541015625, -1.731414794921875, -1.6716766357421875, -1.6119384765625, -1.5522003173828125, -1.492462158203125, -1.4327239990234375, -1.37298583984375, -1.3132476806640625, -1.253509521484375, -1.1937713623046875, -1.134033203125, -1.0742950439453125, -1.014556884765625, -0.9548187255859375, -0.89508056640625, -0.8353424072265625, -0.775604248046875, -0.7158660888671875, -0.6561279296875, -0.5963897705078125, -0.536651611328125, -0.4769134521484375, -0.41717529296875, -0.3574371337890625, -0.297698974609375, -0.2379608154296875, -0.17822265625, -0.1184844970703125, -0.058746337890625, 0.0009918212890625, 0.06072998046875, 0.1204681396484375, 0.180206298828125, 0.2399444580078125, 0.2996826171875, 0.3594207763671875, 0.419158935546875, 0.4788970947265625, 0.53863525390625, 0.5983734130859375, 0.658111572265625, 0.7178497314453125, 0.777587890625, 0.8373260498046875, 0.897064208984375, 0.9568023681640625, 1.01654052734375, 1.0762786865234375, 1.136016845703125, 1.1957550048828125, 1.2554931640625, 1.3152313232421875, 1.374969482421875, 1.4347076416015625, 1.49444580078125, 1.5541839599609375, 1.613922119140625, 1.6736602783203125, 1.7333984375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 6.0, 15.0, 16.0, 30.0, 50.0, 118.0, 218.0, 244.0, 140.0, 76.0, 28.0, 20.0, 19.0, 11.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.41359221935272217, -0.40500080585479736, -0.39640936255455017, -0.38781794905662537, -0.3792265057563782, -0.37063509225845337, -0.36204367876052856, -0.35345223546028137, -0.34486082196235657, -0.33626940846443176, -0.32767796516418457, -0.31908655166625977, -0.3104951083660126, -0.30190369486808777, -0.2933122515678406, -0.28472083806991577, -0.27612942457199097, -0.26753801107406616, -0.25894656777381897, -0.25035515427589417, -0.24176372587680817, -0.23317229747772217, -0.22458086907863617, -0.21598944067955017, -0.20739799737930298, -0.19880656898021698, -0.19021514058113098, -0.18162372708320618, -0.17303229868412018, -0.16444087028503418, -0.15584944188594818, -0.14725801348686218, -0.13866659998893738, -0.13007517158985138, -0.12148375064134598, -0.11289232224225998, -0.10430090129375458, -0.09570947289466858, -0.08711804449558258, -0.07852661609649658, -0.06993519514799118, -0.06134377047419548, -0.05275234580039978, -0.04416091740131378, -0.03556949272751808, -0.02697806805372238, -0.018386639654636383, -0.009795214980840683, -0.001203790307044983, 0.007387635298073292, 0.015979060903191566, 0.024570487439632416, 0.033161912113428116, 0.041753336787223816, 0.050344765186309814, 0.058936189860105515, 0.06752761453390121, 0.07611904293298721, 0.08471046388149261, 0.09330189228057861, 0.10189332067966461, 0.11048474162817001, 0.11907617002725601, 0.1276675909757614, 0.1362590193748474]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 10.0, 12.0, 12.0, 9.0, 17.0, 16.0, 19.0, 31.0, 24.0, 33.0, 42.0, 27.0, 43.0, 39.0, 36.0, 41.0, 47.0, 43.0, 35.0, 42.0, 39.0, 45.0, 29.0, 39.0, 36.0, 40.0, 36.0, 23.0, 27.0, 22.0, 12.0, 14.0, 8.0, 15.0, 4.0, 9.0, 1.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04847234487533569, -0.04685968533158302, -0.04524702578783035, -0.043634362518787384, -0.042021702975034714, -0.04040904343128204, -0.038796380162239075, -0.037183720618486404, -0.035571061074733734, -0.033958401530981064, -0.032345741987228394, -0.030733078718185425, -0.029120419174432755, -0.027507759630680084, -0.025895098224282265, -0.024282436817884445, -0.022669777274131775, -0.021057117730379105, -0.019444456323981285, -0.017831794917583466, -0.016219135373830795, -0.01460647489875555, -0.012993814423680305, -0.01138115394860506, -0.009768493473529816, -0.00815583299845457, -0.006543172523379326, -0.004930512048304081, -0.003317851573228836, -0.0017051910981535912, -9.253062307834625e-05, 0.0015201298519968987, 0.0031327903270721436, 0.0047454508021473885, 0.006358111277222633, 0.007970771752297878, 0.009583432227373123, 0.011196092702448368, 0.012808753177523613, 0.014421413652598858, 0.016034074127674103, 0.017646733671426773, 0.019259395077824593, 0.020872056484222412, 0.022484716027975082, 0.024097375571727753, 0.025710036978125572, 0.02732269838452339, 0.028935357928276062, 0.030548017472028732, 0.0321606770157814, 0.03377334028482437, 0.03538599982857704, 0.03699865937232971, 0.03861132264137268, 0.04022398218512535, 0.04183664172887802, 0.04344930127263069, 0.04506196081638336, 0.04667462408542633, 0.048287283629179, 0.04989994317293167, 0.05151260644197464, 0.05312526598572731, 0.05473792552947998]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 2.0, 5.0, 2.0, 7.0, 6.0, 8.0, 9.0, 10.0, 20.0, 15.0, 23.0, 36.0, 38.0, 32.0, 37.0, 30.0, 49.0, 48.0, 40.0, 35.0, 43.0, 47.0, 44.0, 50.0, 38.0, 40.0, 33.0, 46.0, 31.0, 23.0, 33.0, 18.0, 17.0, 11.0, 18.0, 9.0, 10.0, 9.0, 10.0, 5.0, 8.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3515625, -10.007568359375, -9.66357421875, -9.319580078125, -8.9755859375, -8.631591796875, -8.28759765625, -7.943603515625, -7.599609375, -7.255615234375, -6.91162109375, -6.567626953125, -6.2236328125, -5.879638671875, -5.53564453125, -5.191650390625, -4.84765625, -4.503662109375, -4.15966796875, -3.815673828125, -3.4716796875, -3.127685546875, -2.78369140625, -2.439697265625, -2.095703125, -1.751708984375, -1.40771484375, -1.063720703125, -0.7197265625, -0.375732421875, -0.03173828125, 0.312255859375, 0.65625, 1.000244140625, 1.34423828125, 1.688232421875, 2.0322265625, 2.376220703125, 2.72021484375, 3.064208984375, 3.408203125, 3.752197265625, 4.09619140625, 4.440185546875, 4.7841796875, 5.128173828125, 5.47216796875, 5.816162109375, 6.16015625, 6.504150390625, 6.84814453125, 7.192138671875, 7.5361328125, 7.880126953125, 8.22412109375, 8.568115234375, 8.912109375, 9.256103515625, 9.60009765625, 9.944091796875, 10.2880859375, 10.632080078125, 10.97607421875, 11.320068359375, 11.6640625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 0.0, 4.0, 3.0, 8.0, 6.0, 6.0, 18.0, 28.0, 33.0, 47.0, 48.0, 85.0, 127.0, 211.0, 359.0, 718.0, 1743.0, 4553.0, 12624.0, 39029.0, 218856.0, 625656.0, 104870.0, 25259.0, 8477.0, 3194.0, 1230.0, 556.0, 271.0, 177.0, 97.0, 64.0, 47.0, 36.0, 24.0, 27.0, 13.0, 8.0, 9.0, 12.0, 10.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.234375, -17.652099609375, -17.06982421875, -16.487548828125, -15.9052734375, -15.322998046875, -14.74072265625, -14.158447265625, -13.576171875, -12.993896484375, -12.41162109375, -11.829345703125, -11.2470703125, -10.664794921875, -10.08251953125, -9.500244140625, -8.91796875, -8.335693359375, -7.75341796875, -7.171142578125, -6.5888671875, -6.006591796875, -5.42431640625, -4.842041015625, -4.259765625, -3.677490234375, -3.09521484375, -2.512939453125, -1.9306640625, -1.348388671875, -0.76611328125, -0.183837890625, 0.3984375, 0.980712890625, 1.56298828125, 2.145263671875, 2.7275390625, 3.309814453125, 3.89208984375, 4.474365234375, 5.056640625, 5.638916015625, 6.22119140625, 6.803466796875, 7.3857421875, 7.968017578125, 8.55029296875, 9.132568359375, 9.71484375, 10.297119140625, 10.87939453125, 11.461669921875, 12.0439453125, 12.626220703125, 13.20849609375, 13.790771484375, 14.373046875, 14.955322265625, 15.53759765625, 16.119873046875, 16.7021484375, 17.284423828125, 17.86669921875, 18.448974609375, 19.03125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 8.0, 6.0, 10.0, 11.0, 16.0, 23.0, 15.0, 22.0, 34.0, 37.0, 52.0, 48.0, 57.0, 68.0, 102.0, 250.0, 1640.0, 178.0, 77.0, 47.0, 50.0, 44.0, 40.0, 41.0, 35.0, 20.0, 25.0, 24.0, 13.0, 17.0, 7.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.375, -36.2861328125, -35.197265625, -34.1083984375, -33.01953125, -31.9306640625, -30.841796875, -29.7529296875, -28.6640625, -27.5751953125, -26.486328125, -25.3974609375, -24.30859375, -23.2197265625, -22.130859375, -21.0419921875, -19.953125, -18.8642578125, -17.775390625, -16.6865234375, -15.59765625, -14.5087890625, -13.419921875, -12.3310546875, -11.2421875, -10.1533203125, -9.064453125, -7.9755859375, -6.88671875, -5.7978515625, -4.708984375, -3.6201171875, -2.53125, -1.4423828125, -0.353515625, 0.7353515625, 1.82421875, 2.9130859375, 4.001953125, 5.0908203125, 6.1796875, 7.2685546875, 8.357421875, 9.4462890625, 10.53515625, 11.6240234375, 12.712890625, 13.8017578125, 14.890625, 15.9794921875, 17.068359375, 18.1572265625, 19.24609375, 20.3349609375, 21.423828125, 22.5126953125, 23.6015625, 24.6904296875, 25.779296875, 26.8681640625, 27.95703125, 29.0458984375, 30.134765625, 31.2236328125, 32.3125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 6.0, 4.0, 8.0, 8.0, 18.0, 15.0, 26.0, 19.0, 35.0, 51.0, 66.0, 75.0, 101.0, 156.0, 280.0, 752.0, 7606.0, 2558736.0, 572288.0, 4070.0, 604.0, 246.0, 145.0, 117.0, 79.0, 42.0, 34.0, 24.0, 20.0, 24.0, 14.0, 8.0, 7.0, 8.0, 6.0, 3.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.5, -60.41015625, -58.3203125, -56.23046875, -54.140625, -52.05078125, -49.9609375, -47.87109375, -45.78125, -43.69140625, -41.6015625, -39.51171875, -37.421875, -35.33203125, -33.2421875, -31.15234375, -29.0625, -26.97265625, -24.8828125, -22.79296875, -20.703125, -18.61328125, -16.5234375, -14.43359375, -12.34375, -10.25390625, -8.1640625, -6.07421875, -3.984375, -1.89453125, 0.1953125, 2.28515625, 4.375, 6.46484375, 8.5546875, 10.64453125, 12.734375, 14.82421875, 16.9140625, 19.00390625, 21.09375, 23.18359375, 25.2734375, 27.36328125, 29.453125, 31.54296875, 33.6328125, 35.72265625, 37.8125, 39.90234375, 41.9921875, 44.08203125, 46.171875, 48.26171875, 50.3515625, 52.44140625, 54.53125, 56.62109375, 58.7109375, 60.80078125, 62.890625, 64.98046875, 67.0703125, 69.16015625, 71.25]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 10.0, 19.0, 37.0, 74.0, 101.0, 171.0, 174.0, 157.0, 127.0, 80.0, 38.0, 16.0, 7.0, 2.0, 2.0, 1.0, 1.0], "bins": [-87.00146484375, -85.37763214111328, -83.75379943847656, -82.12996673583984, -80.50613403320312, -78.8823013305664, -77.25846862792969, -75.63463592529297, -74.01080322265625, -72.38697052001953, -70.76313781738281, -69.1393051147461, -67.51547241210938, -65.89163970947266, -64.26780700683594, -62.64397430419922, -61.020145416259766, -59.39631271362305, -57.77248001098633, -56.14864730834961, -54.52481460571289, -52.90098190307617, -51.27715301513672, -49.6533203125, -48.02948760986328, -46.40565490722656, -44.781822204589844, -43.157989501953125, -41.534156799316406, -39.91032409667969, -38.28649139404297, -36.66265869140625, -35.03882598876953, -33.41499328613281, -31.791160583496094, -30.167327880859375, -28.543495178222656, -26.919662475585938, -25.29583168029785, -23.671998977661133, -22.048168182373047, -20.424335479736328, -18.80050277709961, -17.17667007446289, -15.552838325500488, -13.92900562286377, -12.305173873901367, -10.681341171264648, -9.05750846862793, -7.433675765991211, -5.80984354019165, -4.18601131439209, -2.562178611755371, -0.9383459091186523, 0.68548583984375, 2.3093185424804688, 3.9331512451171875, 5.556983947753906, 7.180816173553467, 8.804648399353027, 10.428481101989746, 12.052313804626465, 13.676145553588867, 15.299978256225586, 16.923810958862305]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 1.0, 7.0, 4.0, 7.0, 15.0, 9.0, 14.0, 20.0, 27.0, 22.0, 21.0, 36.0, 32.0, 44.0, 44.0, 35.0, 39.0, 51.0, 42.0, 52.0, 50.0, 48.0, 41.0, 33.0, 31.0, 49.0, 26.0, 32.0, 24.0, 25.0, 22.0, 20.0, 17.0, 13.0, 11.0, 12.0, 7.0, 6.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-85.67095184326172, -83.22492218017578, -80.77889251708984, -78.3328628540039, -75.88683319091797, -73.44080352783203, -70.9947738647461, -68.54875183105469, -66.10272216796875, -63.65669250488281, -61.210662841796875, -58.76463317871094, -56.318603515625, -53.87257385253906, -51.42654800415039, -48.98051834106445, -46.53448486328125, -44.08845520019531, -41.642425537109375, -39.19639587402344, -36.7503662109375, -34.30433654785156, -31.85831069946289, -29.412281036376953, -26.966251373291016, -24.520221710205078, -22.07419204711914, -19.628164291381836, -17.1821346282959, -14.736104965209961, -12.29007625579834, -9.844047546386719, -7.3980255126953125, -4.951996326446533, -2.505967140197754, -0.05993795394897461, 2.3860912322998047, 4.832120895385742, 7.278149604797363, 9.724178314208984, 12.170207977294922, 14.61623764038086, 17.062267303466797, 19.5082950592041, 21.95432472229004, 24.400354385375977, 26.84638214111328, 29.29241180419922, 31.738441467285156, 34.184471130371094, 36.63050079345703, 39.07653045654297, 41.522560119628906, 43.968589782714844, 46.414615631103516, 48.86064529418945, 51.30667495727539, 53.75270462036133, 56.198734283447266, 58.6447639465332, 61.090789794921875, 63.53681945800781, 65.98284912109375, 68.42887878417969, 70.87490844726562]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 1.0, 9.0, 6.0, 7.0, 15.0, 15.0, 13.0, 24.0, 28.0, 23.0, 40.0, 38.0, 37.0, 40.0, 47.0, 45.0, 37.0, 44.0, 45.0, 50.0, 45.0, 50.0, 35.0, 33.0, 37.0, 45.0, 24.0, 29.0, 24.0, 20.0, 14.0, 11.0, 13.0, 10.0, 10.0, 9.0, 8.0, 7.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.921142578125, -9.56103515625, -9.200927734375, -8.8408203125, -8.480712890625, -8.12060546875, -7.760498046875, -7.400390625, -7.040283203125, -6.68017578125, -6.320068359375, -5.9599609375, -5.599853515625, -5.23974609375, -4.879638671875, -4.51953125, -4.159423828125, -3.79931640625, -3.439208984375, -3.0791015625, -2.718994140625, -2.35888671875, -1.998779296875, -1.638671875, -1.278564453125, -0.91845703125, -0.558349609375, -0.1982421875, 0.161865234375, 0.52197265625, 0.882080078125, 1.2421875, 1.602294921875, 1.96240234375, 2.322509765625, 2.6826171875, 3.042724609375, 3.40283203125, 3.762939453125, 4.123046875, 4.483154296875, 4.84326171875, 5.203369140625, 5.5634765625, 5.923583984375, 6.28369140625, 6.643798828125, 7.00390625, 7.364013671875, 7.72412109375, 8.084228515625, 8.4443359375, 8.804443359375, 9.16455078125, 9.524658203125, 9.884765625, 10.244873046875, 10.60498046875, 10.965087890625, 11.3251953125, 11.685302734375, 12.04541015625, 12.405517578125, 12.765625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 4.0, 11.0, 13.0, 23.0, 21.0, 36.0, 43.0, 69.0, 77.0, 123.0, 158.0, 235.0, 337.0, 538.0, 894.0, 1392.0, 2472.0, 4430.0, 9010.0, 21658.0, 68412.0, 422355.0, 2514122.0, 969261.0, 121580.0, 31329.0, 12231.0, 5858.0, 2988.0, 1739.0, 980.0, 586.0, 365.0, 287.0, 173.0, 133.0, 85.0, 56.0, 60.0, 46.0, 23.0, 15.0, 13.0, 12.0, 4.0, 4.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.59375, -22.84912109375, -22.1044921875, -21.35986328125, -20.615234375, -19.87060546875, -19.1259765625, -18.38134765625, -17.63671875, -16.89208984375, -16.1474609375, -15.40283203125, -14.658203125, -13.91357421875, -13.1689453125, -12.42431640625, -11.6796875, -10.93505859375, -10.1904296875, -9.44580078125, -8.701171875, -7.95654296875, -7.2119140625, -6.46728515625, -5.72265625, -4.97802734375, -4.2333984375, -3.48876953125, -2.744140625, -1.99951171875, -1.2548828125, -0.51025390625, 0.234375, 0.97900390625, 1.7236328125, 2.46826171875, 3.212890625, 3.95751953125, 4.7021484375, 5.44677734375, 6.19140625, 6.93603515625, 7.6806640625, 8.42529296875, 9.169921875, 9.91455078125, 10.6591796875, 11.40380859375, 12.1484375, 12.89306640625, 13.6376953125, 14.38232421875, 15.126953125, 15.87158203125, 16.6162109375, 17.36083984375, 18.10546875, 18.85009765625, 19.5947265625, 20.33935546875, 21.083984375, 21.82861328125, 22.5732421875, 23.31787109375, 24.0625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 3.0, 7.0, 19.0, 15.0, 19.0, 28.0, 36.0, 62.0, 71.0, 133.0, 162.0, 257.0, 383.0, 616.0, 641.0, 505.0, 368.0, 222.0, 175.0, 103.0, 57.0, 57.0, 43.0, 37.0, 9.0, 21.0, 10.0, 5.0, 5.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.5625, -19.86181640625, -19.1611328125, -18.46044921875, -17.759765625, -17.05908203125, -16.3583984375, -15.65771484375, -14.95703125, -14.25634765625, -13.5556640625, -12.85498046875, -12.154296875, -11.45361328125, -10.7529296875, -10.05224609375, -9.3515625, -8.65087890625, -7.9501953125, -7.24951171875, -6.548828125, -5.84814453125, -5.1474609375, -4.44677734375, -3.74609375, -3.04541015625, -2.3447265625, -1.64404296875, -0.943359375, -0.24267578125, 0.4580078125, 1.15869140625, 1.859375, 2.56005859375, 3.2607421875, 3.96142578125, 4.662109375, 5.36279296875, 6.0634765625, 6.76416015625, 7.46484375, 8.16552734375, 8.8662109375, 9.56689453125, 10.267578125, 10.96826171875, 11.6689453125, 12.36962890625, 13.0703125, 13.77099609375, 14.4716796875, 15.17236328125, 15.873046875, 16.57373046875, 17.2744140625, 17.97509765625, 18.67578125, 19.37646484375, 20.0771484375, 20.77783203125, 21.478515625, 22.17919921875, 22.8798828125, 23.58056640625, 24.28125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 8.0, 18.0, 16.0, 27.0, 35.0, 62.0, 109.0, 181.0, 330.0, 804.0, 2254.0, 8438.0, 51495.0, 934284.0, 3059076.0, 116380.0, 15119.0, 3452.0, 1115.0, 514.0, 226.0, 132.0, 77.0, 43.0, 35.0, 23.0, 10.0, 8.0, 5.0, 0.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.65625, -52.9033203125, -51.150390625, -49.3974609375, -47.64453125, -45.8916015625, -44.138671875, -42.3857421875, -40.6328125, -38.8798828125, -37.126953125, -35.3740234375, -33.62109375, -31.8681640625, -30.115234375, -28.3623046875, -26.609375, -24.8564453125, -23.103515625, -21.3505859375, -19.59765625, -17.8447265625, -16.091796875, -14.3388671875, -12.5859375, -10.8330078125, -9.080078125, -7.3271484375, -5.57421875, -3.8212890625, -2.068359375, -0.3154296875, 1.4375, 3.1904296875, 4.943359375, 6.6962890625, 8.44921875, 10.2021484375, 11.955078125, 13.7080078125, 15.4609375, 17.2138671875, 18.966796875, 20.7197265625, 22.47265625, 24.2255859375, 25.978515625, 27.7314453125, 29.484375, 31.2373046875, 32.990234375, 34.7431640625, 36.49609375, 38.2490234375, 40.001953125, 41.7548828125, 43.5078125, 45.2607421875, 47.013671875, 48.7666015625, 50.51953125, 52.2724609375, 54.025390625, 55.7783203125, 57.53125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 12.0, 19.0, 27.0, 32.0, 37.0, 54.0, 88.0, 118.0, 101.0, 140.0, 90.0, 91.0, 60.0, 47.0, 39.0, 14.0, 19.0, 7.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.418426513671875, -53.722652435302734, -51.02688217163086, -48.33110809326172, -45.635337829589844, -42.9395637512207, -40.24378967285156, -37.54801940917969, -34.85224533081055, -32.156471252441406, -29.46070098876953, -26.76492691040039, -24.069154739379883, -21.373382568359375, -18.677608489990234, -15.981836318969727, -13.286064147949219, -10.590291976928711, -7.894518852233887, -5.1987457275390625, -2.5029735565185547, 0.19279861450195312, 2.8885726928710938, 5.584344863891602, 8.28011703491211, 10.975889205932617, 13.671662330627441, 16.367435455322266, 19.063207626342773, 21.75897979736328, 24.454753875732422, 27.15052604675293, 29.846290588378906, 32.54206466674805, 35.23783493041992, 37.93360900878906, 40.62937927246094, 43.32515335083008, 46.02092742919922, 48.716697692871094, 51.412471771240234, 54.108245849609375, 56.80401611328125, 59.49979019165039, 62.19556427001953, 64.8913345336914, 67.58711242675781, 70.28288269042969, 72.97865295410156, 75.67442321777344, 78.37020111083984, 81.06597137451172, 83.7617416381836, 86.45751953125, 89.15328979492188, 91.84906005859375, 94.54483032226562, 97.2406005859375, 99.9363784790039, 102.63214874267578, 105.32791900634766, 108.02369689941406, 110.71946716308594, 113.41523742675781, 116.11101531982422]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 5.0, 6.0, 2.0, 13.0, 5.0, 6.0, 7.0, 12.0, 16.0, 12.0, 18.0, 25.0, 23.0, 26.0, 34.0, 34.0, 39.0, 28.0, 36.0, 37.0, 34.0, 41.0, 35.0, 33.0, 38.0, 34.0, 40.0, 38.0, 32.0, 30.0, 35.0, 28.0, 27.0, 26.0, 24.0, 17.0, 15.0, 12.0, 13.0, 14.0, 12.0, 5.0, 8.0, 7.0, 4.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-56.64322280883789, -54.900875091552734, -53.158531188964844, -51.41618347167969, -49.67383575439453, -47.93149185180664, -46.189144134521484, -44.446800231933594, -42.70445251464844, -40.96210479736328, -39.21976089477539, -37.477413177490234, -35.73506546020508, -33.99272155761719, -32.25037384033203, -30.508028030395508, -28.76568031311035, -27.023334503173828, -25.280986785888672, -23.53864097595215, -21.796295166015625, -20.05394744873047, -18.311601638793945, -16.569255828857422, -14.826909065246582, -13.084562301635742, -11.342216491699219, -9.599869728088379, -7.857523441314697, -6.115177154541016, -4.372830390930176, -2.6304845809936523, -0.8881378173828125, 0.8542085886001587, 2.59655499458313, 4.338901519775391, 6.081247806549072, 7.823594093322754, 9.565940856933594, 11.308286666870117, 13.050633430480957, 14.792980194091797, 16.53532600402832, 18.277671813964844, 20.02001953125, 21.762365341186523, 23.504711151123047, 25.247058868408203, 26.989404678344727, 28.73175048828125, 30.474098205566406, 32.21644592285156, 33.95878982543945, 35.70113754272461, 37.4434814453125, 39.185829162597656, 40.92817687988281, 42.67052459716797, 44.41286849975586, 46.155216217041016, 47.89756393432617, 49.63990783691406, 51.38225555419922, 53.124603271484375, 54.866947174072266]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 2.0, 1.0, 3.0, 3.0, 8.0, 12.0, 17.0, 15.0, 20.0, 25.0, 23.0, 26.0, 29.0, 37.0, 27.0, 37.0, 41.0, 48.0, 49.0, 47.0, 47.0, 47.0, 39.0, 40.0, 35.0, 38.0, 31.0, 34.0, 34.0, 33.0, 32.0, 19.0, 13.0, 18.0, 11.0, 14.0, 8.0, 4.0, 4.0, 5.0, 7.0, 2.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.25, -9.891845703125, -9.53369140625, -9.175537109375, -8.8173828125, -8.459228515625, -8.10107421875, -7.742919921875, -7.384765625, -7.026611328125, -6.66845703125, -6.310302734375, -5.9521484375, -5.593994140625, -5.23583984375, -4.877685546875, -4.51953125, -4.161376953125, -3.80322265625, -3.445068359375, -3.0869140625, -2.728759765625, -2.37060546875, -2.012451171875, -1.654296875, -1.296142578125, -0.93798828125, -0.579833984375, -0.2216796875, 0.136474609375, 0.49462890625, 0.852783203125, 1.2109375, 1.569091796875, 1.92724609375, 2.285400390625, 2.6435546875, 3.001708984375, 3.35986328125, 3.718017578125, 4.076171875, 4.434326171875, 4.79248046875, 5.150634765625, 5.5087890625, 5.866943359375, 6.22509765625, 6.583251953125, 6.94140625, 7.299560546875, 7.65771484375, 8.015869140625, 8.3740234375, 8.732177734375, 9.09033203125, 9.448486328125, 9.806640625, 10.164794921875, 10.52294921875, 10.881103515625, 11.2392578125, 11.597412109375, 11.95556640625, 12.313720703125, 12.671875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 9.0, 11.0, 7.0, 21.0, 36.0, 38.0, 70.0, 80.0, 146.0, 184.0, 299.0, 443.0, 671.0, 1009.0, 1453.0, 2172.0, 3381.0, 5147.0, 7899.0, 12169.0, 18843.0, 29963.0, 47657.0, 78685.0, 127542.0, 189557.0, 187648.0, 126044.0, 77004.0, 47429.0, 29483.0, 18620.0, 11908.0, 7763.0, 5018.0, 3393.0, 2209.0, 1459.0, 992.0, 676.0, 443.0, 315.0, 233.0, 129.0, 88.0, 63.0, 39.0, 37.0, 25.0, 10.0, 15.0, 9.0, 9.0, 4.0, 4.0, 1.0, 1.0], "bins": [-1.19140625, -1.1552886962890625, -1.119171142578125, -1.0830535888671875, -1.04693603515625, -1.0108184814453125, -0.974700927734375, -0.9385833740234375, -0.9024658203125, -0.8663482666015625, -0.830230712890625, -0.7941131591796875, -0.75799560546875, -0.7218780517578125, -0.685760498046875, -0.6496429443359375, -0.613525390625, -0.5774078369140625, -0.541290283203125, -0.5051727294921875, -0.46905517578125, -0.4329376220703125, -0.396820068359375, -0.3607025146484375, -0.3245849609375, -0.2884674072265625, -0.252349853515625, -0.2162322998046875, -0.18011474609375, -0.1439971923828125, -0.107879638671875, -0.0717620849609375, -0.03564453125, 0.0004730224609375, 0.036590576171875, 0.0727081298828125, 0.10882568359375, 0.1449432373046875, 0.181060791015625, 0.2171783447265625, 0.2532958984375, 0.2894134521484375, 0.325531005859375, 0.3616485595703125, 0.39776611328125, 0.4338836669921875, 0.470001220703125, 0.5061187744140625, 0.542236328125, 0.5783538818359375, 0.614471435546875, 0.6505889892578125, 0.68670654296875, 0.7228240966796875, 0.758941650390625, 0.7950592041015625, 0.8311767578125, 0.8672943115234375, 0.903411865234375, 0.9395294189453125, 0.97564697265625, 1.0117645263671875, 1.047882080078125, 1.0839996337890625, 1.1201171875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 9.0, 11.0, 7.0, 15.0, 13.0, 18.0, 15.0, 24.0, 25.0, 26.0, 25.0, 35.0, 43.0, 37.0, 34.0, 40.0, 30.0, 45.0, 1071.0, 34.0, 43.0, 39.0, 43.0, 28.0, 23.0, 42.0, 38.0, 25.0, 27.0, 34.0, 14.0, 10.0, 13.0, 15.0, 7.0, 8.0, 9.0, 6.0, 7.0, 7.0, 2.0, 6.0, 2.0, 4.0, 0.0, 2.0, 3.0], "bins": [-7.921875, -7.69769287109375, -7.4735107421875, -7.24932861328125, -7.025146484375, -6.80096435546875, -6.5767822265625, -6.35260009765625, -6.12841796875, -5.90423583984375, -5.6800537109375, -5.45587158203125, -5.231689453125, -5.00750732421875, -4.7833251953125, -4.55914306640625, -4.3349609375, -4.11077880859375, -3.8865966796875, -3.66241455078125, -3.438232421875, -3.21405029296875, -2.9898681640625, -2.76568603515625, -2.54150390625, -2.31732177734375, -2.0931396484375, -1.86895751953125, -1.644775390625, -1.42059326171875, -1.1964111328125, -0.97222900390625, -0.748046875, -0.52386474609375, -0.2996826171875, -0.07550048828125, 0.148681640625, 0.37286376953125, 0.5970458984375, 0.82122802734375, 1.04541015625, 1.26959228515625, 1.4937744140625, 1.71795654296875, 1.942138671875, 2.16632080078125, 2.3905029296875, 2.61468505859375, 2.8388671875, 3.06304931640625, 3.2872314453125, 3.51141357421875, 3.735595703125, 3.95977783203125, 4.1839599609375, 4.40814208984375, 4.63232421875, 4.85650634765625, 5.0806884765625, 5.30487060546875, 5.529052734375, 5.75323486328125, 5.9774169921875, 6.20159912109375, 6.42578125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 6.0, 9.0, 9.0, 22.0, 25.0, 40.0, 65.0, 108.0, 160.0, 237.0, 394.0, 707.0, 1108.0, 1806.0, 2926.0, 5047.0, 8819.0, 15262.0, 27020.0, 48143.0, 90037.0, 172275.0, 1290967.0, 200516.0, 104172.0, 55402.0, 30677.0, 17216.0, 9734.0, 5696.0, 3419.0, 1964.0, 1200.0, 755.0, 442.0, 267.0, 162.0, 119.0, 71.0, 42.0, 45.0, 13.0, 7.0, 10.0, 8.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74267578125, -0.7199020385742188, -0.6971282958984375, -0.6743545532226562, -0.651580810546875, -0.6288070678710938, -0.6060333251953125, -0.5832595825195312, -0.56048583984375, -0.5377120971679688, -0.5149383544921875, -0.49216461181640625, -0.469390869140625, -0.44661712646484375, -0.4238433837890625, -0.40106964111328125, -0.3782958984375, -0.35552215576171875, -0.3327484130859375, -0.30997467041015625, -0.287200927734375, -0.26442718505859375, -0.2416534423828125, -0.21887969970703125, -0.19610595703125, -0.17333221435546875, -0.1505584716796875, -0.12778472900390625, -0.105010986328125, -0.08223724365234375, -0.0594635009765625, -0.03668975830078125, -0.013916015625, 0.00885772705078125, 0.0316314697265625, 0.05440521240234375, 0.077178955078125, 0.09995269775390625, 0.1227264404296875, 0.14550018310546875, 0.16827392578125, 0.19104766845703125, 0.2138214111328125, 0.23659515380859375, 0.259368896484375, 0.28214263916015625, 0.3049163818359375, 0.32769012451171875, 0.3504638671875, 0.37323760986328125, 0.3960113525390625, 0.41878509521484375, 0.441558837890625, 0.46433258056640625, 0.4871063232421875, 0.5098800659179688, 0.53265380859375, 0.5554275512695312, 0.5782012939453125, 0.6009750366210938, 0.623748779296875, 0.6465225219726562, 0.6692962646484375, 0.6920700073242188, 0.71484375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 9.0, 8.0, 14.0, 22.0, 22.0, 21.0, 34.0, 49.0, 75.0, 108.0, 171.0, 134.0, 85.0, 70.0, 36.0, 30.0, 31.0, 17.0, 10.0, 10.0, 6.0, 4.0, 8.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0902099609375, -0.08727645874023438, -0.08434295654296875, -0.08140945434570312, -0.0784759521484375, -0.07554244995117188, -0.07260894775390625, -0.06967544555664062, -0.066741943359375, -0.06380844116210938, -0.06087493896484375, -0.057941436767578125, -0.0550079345703125, -0.052074432373046875, -0.04914093017578125, -0.046207427978515625, -0.04327392578125, -0.040340423583984375, -0.03740692138671875, -0.034473419189453125, -0.0315399169921875, -0.028606414794921875, -0.02567291259765625, -0.022739410400390625, -0.019805908203125, -0.016872406005859375, -0.01393890380859375, -0.011005401611328125, -0.0080718994140625, -0.005138397216796875, -0.00220489501953125, 0.000728607177734375, 0.003662109375, 0.006595611572265625, 0.00952911376953125, 0.012462615966796875, 0.0153961181640625, 0.018329620361328125, 0.02126312255859375, 0.024196624755859375, 0.027130126953125, 0.030063629150390625, 0.03299713134765625, 0.035930633544921875, 0.0388641357421875, 0.041797637939453125, 0.04473114013671875, 0.047664642333984375, 0.05059814453125, 0.053531646728515625, 0.05646514892578125, 0.059398651123046875, 0.0623321533203125, 0.06526565551757812, 0.06819915771484375, 0.07113265991210938, 0.074066162109375, 0.07699966430664062, 0.07993316650390625, 0.08286666870117188, 0.0858001708984375, 0.08873367309570312, 0.09166717529296875, 0.09460067749023438, 0.0975341796875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 5.0, 6.0, 6.0, 1.0, 3.0, 10.0, 8.0, 10.0, 20.0, 28.0, 37.0, 61.0, 68.0, 168.0, 510.0, 31795.0, 1013508.0, 1721.0, 264.0, 110.0, 62.0, 34.0, 26.0, 28.0, 20.0, 12.0, 10.0, 8.0, 2.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.0951690673828125, -2.030181884765625, -1.9651947021484375, -1.90020751953125, -1.8352203369140625, -1.770233154296875, -1.7052459716796875, -1.6402587890625, -1.5752716064453125, -1.510284423828125, -1.4452972412109375, -1.38031005859375, -1.3153228759765625, -1.250335693359375, -1.1853485107421875, -1.120361328125, -1.0553741455078125, -0.990386962890625, -0.9253997802734375, -0.86041259765625, -0.7954254150390625, -0.730438232421875, -0.6654510498046875, -0.6004638671875, -0.5354766845703125, -0.470489501953125, -0.4055023193359375, -0.34051513671875, -0.2755279541015625, -0.210540771484375, -0.1455535888671875, -0.08056640625, -0.0155792236328125, 0.049407958984375, 0.1143951416015625, 0.17938232421875, 0.2443695068359375, 0.309356689453125, 0.3743438720703125, 0.4393310546875, 0.5043182373046875, 0.569305419921875, 0.6342926025390625, 0.69927978515625, 0.7642669677734375, 0.829254150390625, 0.8942413330078125, 0.959228515625, 1.0242156982421875, 1.089202880859375, 1.1541900634765625, 1.21917724609375, 1.2841644287109375, 1.349151611328125, 1.4141387939453125, 1.4791259765625, 1.5441131591796875, 1.609100341796875, 1.6740875244140625, 1.73907470703125, 1.8040618896484375, 1.869049072265625, 1.9340362548828125, 1.9990234375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 9.0, 21.0, 115.0, 623.0, 197.0, 33.0, 11.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.697900652885437, -0.6706209182739258, -0.6433412432670593, -0.6160615086555481, -0.5887818336486816, -0.5615020990371704, -0.5342223644256592, -0.5069426894187927, -0.4796629548072815, -0.45238324999809265, -0.4251035451889038, -0.3978238105773926, -0.37054410576820374, -0.3432644009590149, -0.31598469614982605, -0.2887049913406372, -0.26142528653144836, -0.23414558172225952, -0.20686586201190948, -0.17958615720272064, -0.1523064374923706, -0.12502673268318176, -0.09774702787399292, -0.07046730816364288, -0.04318760335445404, -0.01590789295732975, 0.01137181743979454, 0.03865152597427368, 0.06593123823404312, 0.09321095049381256, 0.1204906553030014, 0.14777037501335144, 0.17505007982254028, 0.20232978463172913, 0.22960950434207916, 0.2568892240524292, 0.28416892886161804, 0.3114486336708069, 0.3387283384799957, 0.36600804328918457, 0.3932877779006958, 0.42056748270988464, 0.4478471875190735, 0.4751269221305847, 0.5024065971374512, 0.5296863317489624, 0.5569660663604736, 0.5842457413673401, 0.6115254163742065, 0.6388051509857178, 0.6660848259925842, 0.6933645606040955, 0.7206442356109619, 0.7479239702224731, 0.7752037048339844, 0.8024833798408508, 0.8297631144523621, 0.8570428490638733, 0.8843225240707397, 0.911602258682251, 0.9388819336891174, 0.9661616683006287, 0.9934413433074951, 1.0207210779190063, 1.0480008125305176]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 10.0, 5.0, 10.0, 9.0, 12.0, 20.0, 18.0, 19.0, 19.0, 23.0, 30.0, 32.0, 32.0, 40.0, 35.0, 41.0, 33.0, 41.0, 50.0, 36.0, 41.0, 47.0, 30.0, 37.0, 33.0, 42.0, 27.0, 27.0, 31.0, 26.0, 22.0, 23.0, 16.0, 14.0, 14.0, 12.0, 13.0, 6.0, 4.0, 5.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.16932815313339233, -0.16395199298858643, -0.1585758477449417, -0.1531996876001358, -0.1478235423564911, -0.14244738221168518, -0.13707122206687927, -0.13169507682323456, -0.12631893157958984, -0.12094277888536453, -0.11556662619113922, -0.11019046604633331, -0.1048143208026886, -0.09943816065788269, -0.09406200796365738, -0.08868585526943207, -0.08330969512462616, -0.07793354243040085, -0.07255738973617554, -0.06718122959136963, -0.061805080622434616, -0.056428927928209305, -0.051052771508693695, -0.045676618814468384, -0.04030046612024307, -0.03492431342601776, -0.0295481588691473, -0.02417200431227684, -0.01879585161805153, -0.013419698923826218, -0.008043542504310608, -0.0026673898100852966, 0.0027087628841400146, 0.0080849165096879, 0.013461070135235786, 0.018837224692106247, 0.024213377386331558, 0.02958953008055687, 0.03496568650007248, 0.04034183919429779, 0.0457179918885231, 0.05109414458274841, 0.056470297276973724, 0.061846453696489334, 0.06722261011600494, 0.07259875535964966, 0.07797491550445557, 0.08335106819868088, 0.08872722089290619, 0.0941033735871315, 0.09947952628135681, 0.10485568642616272, 0.11023183166980743, 0.11560799181461334, 0.12098414450883865, 0.12636029720306396, 0.13173645734786987, 0.13711261749267578, 0.1424887627363205, 0.1478649228811264, 0.15324106812477112, 0.15861722826957703, 0.16399338841438293, 0.16936953365802765, 0.17474567890167236]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 2.0, 1.0, 3.0, 3.0, 8.0, 12.0, 17.0, 14.0, 21.0, 25.0, 23.0, 26.0, 29.0, 37.0, 27.0, 37.0, 42.0, 47.0, 49.0, 47.0, 47.0, 47.0, 39.0, 42.0, 34.0, 37.0, 31.0, 34.0, 35.0, 32.0, 32.0, 19.0, 12.0, 20.0, 10.0, 14.0, 8.0, 4.0, 4.0, 5.0, 7.0, 2.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.25, -9.891845703125, -9.53369140625, -9.175537109375, -8.8173828125, -8.459228515625, -8.10107421875, -7.742919921875, -7.384765625, -7.026611328125, -6.66845703125, -6.310302734375, -5.9521484375, -5.593994140625, -5.23583984375, -4.877685546875, -4.51953125, -4.161376953125, -3.80322265625, -3.445068359375, -3.0869140625, -2.728759765625, -2.37060546875, -2.012451171875, -1.654296875, -1.296142578125, -0.93798828125, -0.579833984375, -0.2216796875, 0.136474609375, 0.49462890625, 0.852783203125, 1.2109375, 1.569091796875, 1.92724609375, 2.285400390625, 2.6435546875, 3.001708984375, 3.35986328125, 3.718017578125, 4.076171875, 4.434326171875, 4.79248046875, 5.150634765625, 5.5087890625, 5.866943359375, 6.22509765625, 6.583251953125, 6.94140625, 7.299560546875, 7.65771484375, 8.015869140625, 8.3740234375, 8.732177734375, 9.09033203125, 9.448486328125, 9.806640625, 10.164794921875, 10.52294921875, 10.881103515625, 11.2392578125, 11.597412109375, 11.95556640625, 12.313720703125, 12.671875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 5.0, 0.0, 3.0, 6.0, 9.0, 10.0, 15.0, 12.0, 26.0, 24.0, 30.0, 29.0, 65.0, 92.0, 144.0, 180.0, 248.0, 381.0, 643.0, 1070.0, 1875.0, 3712.0, 7196.0, 15750.0, 38700.0, 139572.0, 631213.0, 137793.0, 38570.0, 15430.0, 7284.0, 3598.0, 1914.0, 1094.0, 610.0, 397.0, 246.0, 158.0, 111.0, 89.0, 71.0, 46.0, 30.0, 28.0, 22.0, 16.0, 9.0, 10.0, 5.0, 11.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.1875, -18.51416015625, -17.8408203125, -17.16748046875, -16.494140625, -15.82080078125, -15.1474609375, -14.47412109375, -13.80078125, -13.12744140625, -12.4541015625, -11.78076171875, -11.107421875, -10.43408203125, -9.7607421875, -9.08740234375, -8.4140625, -7.74072265625, -7.0673828125, -6.39404296875, -5.720703125, -5.04736328125, -4.3740234375, -3.70068359375, -3.02734375, -2.35400390625, -1.6806640625, -1.00732421875, -0.333984375, 0.33935546875, 1.0126953125, 1.68603515625, 2.359375, 3.03271484375, 3.7060546875, 4.37939453125, 5.052734375, 5.72607421875, 6.3994140625, 7.07275390625, 7.74609375, 8.41943359375, 9.0927734375, 9.76611328125, 10.439453125, 11.11279296875, 11.7861328125, 12.45947265625, 13.1328125, 13.80615234375, 14.4794921875, 15.15283203125, 15.826171875, 16.49951171875, 17.1728515625, 17.84619140625, 18.51953125, 19.19287109375, 19.8662109375, 20.53955078125, 21.212890625, 21.88623046875, 22.5595703125, 23.23291015625, 23.90625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 4.0, 11.0, 8.0, 12.0, 18.0, 32.0, 25.0, 17.0, 27.0, 35.0, 36.0, 48.0, 51.0, 53.0, 71.0, 108.0, 191.0, 1528.0, 231.0, 98.0, 80.0, 52.0, 52.0, 31.0, 37.0, 37.0, 29.0, 22.0, 14.0, 20.0, 21.0, 10.0, 9.0, 8.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.484375, -25.487060546875, -24.48974609375, -23.492431640625, -22.4951171875, -21.497802734375, -20.50048828125, -19.503173828125, -18.505859375, -17.508544921875, -16.51123046875, -15.513916015625, -14.5166015625, -13.519287109375, -12.52197265625, -11.524658203125, -10.52734375, -9.530029296875, -8.53271484375, -7.535400390625, -6.5380859375, -5.540771484375, -4.54345703125, -3.546142578125, -2.548828125, -1.551513671875, -0.55419921875, 0.443115234375, 1.4404296875, 2.437744140625, 3.43505859375, 4.432373046875, 5.4296875, 6.427001953125, 7.42431640625, 8.421630859375, 9.4189453125, 10.416259765625, 11.41357421875, 12.410888671875, 13.408203125, 14.405517578125, 15.40283203125, 16.400146484375, 17.3974609375, 18.394775390625, 19.39208984375, 20.389404296875, 21.38671875, 22.384033203125, 23.38134765625, 24.378662109375, 25.3759765625, 26.373291015625, 27.37060546875, 28.367919921875, 29.365234375, 30.362548828125, 31.35986328125, 32.357177734375, 33.3544921875, 34.351806640625, 35.34912109375, 36.346435546875, 37.34375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 7.0, 9.0, 10.0, 7.0, 18.0, 26.0, 22.0, 29.0, 32.0, 55.0, 67.0, 80.0, 129.0, 205.0, 430.0, 1334.0, 6521.0, 74687.0, 2899231.0, 150075.0, 9672.0, 1666.0, 568.0, 257.0, 153.0, 103.0, 74.0, 43.0, 35.0, 39.0, 22.0, 30.0, 24.0, 11.0, 11.0, 9.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-76.5, -74.51806640625, -72.5361328125, -70.55419921875, -68.572265625, -66.59033203125, -64.6083984375, -62.62646484375, -60.64453125, -58.66259765625, -56.6806640625, -54.69873046875, -52.716796875, -50.73486328125, -48.7529296875, -46.77099609375, -44.7890625, -42.80712890625, -40.8251953125, -38.84326171875, -36.861328125, -34.87939453125, -32.8974609375, -30.91552734375, -28.93359375, -26.95166015625, -24.9697265625, -22.98779296875, -21.005859375, -19.02392578125, -17.0419921875, -15.06005859375, -13.078125, -11.09619140625, -9.1142578125, -7.13232421875, -5.150390625, -3.16845703125, -1.1865234375, 0.79541015625, 2.77734375, 4.75927734375, 6.7412109375, 8.72314453125, 10.705078125, 12.68701171875, 14.6689453125, 16.65087890625, 18.6328125, 20.61474609375, 22.5966796875, 24.57861328125, 26.560546875, 28.54248046875, 30.5244140625, 32.50634765625, 34.48828125, 36.47021484375, 38.4521484375, 40.43408203125, 42.416015625, 44.39794921875, 46.3798828125, 48.36181640625, 50.34375]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 3.0, 7.0, 12.0, 26.0, 46.0, 70.0, 128.0, 146.0, 160.0, 142.0, 98.0, 84.0, 34.0, 30.0, 8.0, 3.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.074270248413086, -21.95652961730957, -19.838788986206055, -17.721050262451172, -15.60330867767334, -13.485568046569824, -11.367828369140625, -9.25008773803711, -7.132347106933594, -5.014606475830078, -2.8968663215637207, -0.7791261672973633, 1.3386144638061523, 3.456355094909668, 5.574094772338867, 7.691835403442383, 9.809576034545898, 11.927316665649414, 14.04505729675293, 16.162796020507812, 18.280536651611328, 20.398277282714844, 22.51601791381836, 24.633758544921875, 26.75149917602539, 28.869239807128906, 30.986980438232422, 33.10472106933594, 35.22246170043945, 37.34020233154297, 39.45793914794922, 41.57568359375, 43.69342803955078, 45.8111686706543, 47.92890930175781, 50.04664993286133, 52.164390563964844, 54.28213119506836, 56.399871826171875, 58.517608642578125, 60.635353088378906, 62.75309371948242, 64.87083435058594, 66.98857116699219, 69.10631561279297, 71.22405242919922, 73.341796875, 75.45953369140625, 77.5772705078125, 79.69500732421875, 81.81275177001953, 83.93048858642578, 86.04823303222656, 88.16596984863281, 90.2837142944336, 92.40145111083984, 94.51919555664062, 96.63693237304688, 98.75467681884766, 100.8724136352539, 102.99015808105469, 105.10789489746094, 107.22563934326172, 109.34337615966797, 111.46112060546875]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 3.0, 7.0, 9.0, 14.0, 5.0, 15.0, 17.0, 16.0, 16.0, 16.0, 24.0, 22.0, 21.0, 24.0, 28.0, 28.0, 32.0, 44.0, 48.0, 39.0, 33.0, 35.0, 35.0, 38.0, 39.0, 38.0, 39.0, 33.0, 32.0, 25.0, 18.0, 36.0, 25.0, 18.0, 20.0, 13.0, 17.0, 9.0, 16.0, 9.0, 9.0, 7.0, 6.0, 1.0, 4.0, 5.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-66.19977569580078, -64.14521789550781, -62.09065628051758, -60.03609848022461, -57.981536865234375, -55.926979064941406, -53.87242126464844, -51.8178596496582, -49.76329803466797, -47.708740234375, -45.654178619384766, -43.5996208190918, -41.54505920410156, -39.490501403808594, -37.435943603515625, -35.38138198852539, -33.32682418823242, -31.27226448059082, -29.21770477294922, -27.16314697265625, -25.108585357666016, -23.054027557373047, -20.999467849731445, -18.944908142089844, -16.890348434448242, -14.83578872680664, -12.781229019165039, -10.726670265197754, -8.672110557556152, -6.617550849914551, -4.562992095947266, -2.508432388305664, -0.4538726806640625, 1.60068678855896, 3.6552462577819824, 5.709805488586426, 7.764365196228027, 9.818924903869629, 11.873483657836914, 13.928043365478516, 15.982603073120117, 18.03716278076172, 20.09172248840332, 22.146282196044922, 24.20083999633789, 26.255401611328125, 28.309959411621094, 30.364519119262695, 32.4190788269043, 34.473636627197266, 36.5281982421875, 38.58275604248047, 40.6373176574707, 42.69187545776367, 44.746437072753906, 46.800994873046875, 48.855552673339844, 50.91011047363281, 52.96467208862305, 55.019229888916016, 57.07379150390625, 59.12834930419922, 61.18290710449219, 63.23746871948242, 65.29203033447266]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 4.0, 8.0, 7.0, 15.0, 19.0, 22.0, 29.0, 27.0, 26.0, 30.0, 33.0, 46.0, 49.0, 48.0, 50.0, 57.0, 56.0, 46.0, 36.0, 43.0, 38.0, 43.0, 36.0, 40.0, 30.0, 30.0, 25.0, 22.0, 16.0, 15.0, 16.0, 11.0, 4.0, 5.0, 1.0, 4.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7578125, -11.3485107421875, -10.939208984375, -10.5299072265625, -10.12060546875, -9.7113037109375, -9.302001953125, -8.8927001953125, -8.4833984375, -8.0740966796875, -7.664794921875, -7.2554931640625, -6.84619140625, -6.4368896484375, -6.027587890625, -5.6182861328125, -5.208984375, -4.7996826171875, -4.390380859375, -3.9810791015625, -3.57177734375, -3.1624755859375, -2.753173828125, -2.3438720703125, -1.9345703125, -1.5252685546875, -1.115966796875, -0.7066650390625, -0.29736328125, 0.1119384765625, 0.521240234375, 0.9305419921875, 1.33984375, 1.7491455078125, 2.158447265625, 2.5677490234375, 2.97705078125, 3.3863525390625, 3.795654296875, 4.2049560546875, 4.6142578125, 5.0235595703125, 5.432861328125, 5.8421630859375, 6.25146484375, 6.6607666015625, 7.070068359375, 7.4793701171875, 7.888671875, 8.2979736328125, 8.707275390625, 9.1165771484375, 9.52587890625, 9.9351806640625, 10.344482421875, 10.7537841796875, 11.1630859375, 11.5723876953125, 11.981689453125, 12.3909912109375, 12.80029296875, 13.2095947265625, 13.618896484375, 14.0281982421875, 14.4375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 7.0, 10.0, 13.0, 9.0, 13.0, 30.0, 26.0, 32.0, 50.0, 72.0, 116.0, 127.0, 160.0, 256.0, 375.0, 462.0, 692.0, 1078.0, 1681.0, 2673.0, 4525.0, 8557.0, 17715.0, 46034.0, 194257.0, 1301374.0, 2120788.0, 371487.0, 71360.0, 24274.0, 10913.0, 5758.0, 3296.0, 2000.0, 1294.0, 875.0, 622.0, 361.0, 276.0, 195.0, 123.0, 102.0, 56.0, 51.0, 40.0, 28.0, 13.0, 5.0, 7.0, 5.0, 8.0, 3.0, 1.0, 0.0, 1.0], "bins": [-23.109375, -22.452392578125, -21.79541015625, -21.138427734375, -20.4814453125, -19.824462890625, -19.16748046875, -18.510498046875, -17.853515625, -17.196533203125, -16.53955078125, -15.882568359375, -15.2255859375, -14.568603515625, -13.91162109375, -13.254638671875, -12.59765625, -11.940673828125, -11.28369140625, -10.626708984375, -9.9697265625, -9.312744140625, -8.65576171875, -7.998779296875, -7.341796875, -6.684814453125, -6.02783203125, -5.370849609375, -4.7138671875, -4.056884765625, -3.39990234375, -2.742919921875, -2.0859375, -1.428955078125, -0.77197265625, -0.114990234375, 0.5419921875, 1.198974609375, 1.85595703125, 2.512939453125, 3.169921875, 3.826904296875, 4.48388671875, 5.140869140625, 5.7978515625, 6.454833984375, 7.11181640625, 7.768798828125, 8.42578125, 9.082763671875, 9.73974609375, 10.396728515625, 11.0537109375, 11.710693359375, 12.36767578125, 13.024658203125, 13.681640625, 14.338623046875, 14.99560546875, 15.652587890625, 16.3095703125, 16.966552734375, 17.62353515625, 18.280517578125, 18.9375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 5.0, 6.0, 5.0, 13.0, 16.0, 17.0, 21.0, 29.0, 39.0, 42.0, 72.0, 104.0, 132.0, 230.0, 303.0, 418.0, 554.0, 578.0, 436.0, 290.0, 219.0, 145.0, 98.0, 71.0, 60.0, 33.0, 30.0, 15.0, 20.0, 21.0, 11.0, 8.0, 5.0, 4.0, 9.0, 1.0, 1.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.265625, -17.65673828125, -17.0478515625, -16.43896484375, -15.830078125, -15.22119140625, -14.6123046875, -14.00341796875, -13.39453125, -12.78564453125, -12.1767578125, -11.56787109375, -10.958984375, -10.35009765625, -9.7412109375, -9.13232421875, -8.5234375, -7.91455078125, -7.3056640625, -6.69677734375, -6.087890625, -5.47900390625, -4.8701171875, -4.26123046875, -3.65234375, -3.04345703125, -2.4345703125, -1.82568359375, -1.216796875, -0.60791015625, 0.0009765625, 0.60986328125, 1.21875, 1.82763671875, 2.4365234375, 3.04541015625, 3.654296875, 4.26318359375, 4.8720703125, 5.48095703125, 6.08984375, 6.69873046875, 7.3076171875, 7.91650390625, 8.525390625, 9.13427734375, 9.7431640625, 10.35205078125, 10.9609375, 11.56982421875, 12.1787109375, 12.78759765625, 13.396484375, 14.00537109375, 14.6142578125, 15.22314453125, 15.83203125, 16.44091796875, 17.0498046875, 17.65869140625, 18.267578125, 18.87646484375, 19.4853515625, 20.09423828125, 20.703125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 3.0, 5.0, 5.0, 7.0, 5.0, 11.0, 16.0, 24.0, 27.0, 32.0, 46.0, 81.0, 145.0, 273.0, 547.0, 1276.0, 3420.0, 11598.0, 54582.0, 674876.0, 3240245.0, 171096.0, 25628.0, 6313.0, 2196.0, 877.0, 419.0, 215.0, 99.0, 61.0, 37.0, 29.0, 19.0, 14.0, 19.0, 10.0, 6.0, 6.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.65625, -51.07373046875, -49.4912109375, -47.90869140625, -46.326171875, -44.74365234375, -43.1611328125, -41.57861328125, -39.99609375, -38.41357421875, -36.8310546875, -35.24853515625, -33.666015625, -32.08349609375, -30.5009765625, -28.91845703125, -27.3359375, -25.75341796875, -24.1708984375, -22.58837890625, -21.005859375, -19.42333984375, -17.8408203125, -16.25830078125, -14.67578125, -13.09326171875, -11.5107421875, -9.92822265625, -8.345703125, -6.76318359375, -5.1806640625, -3.59814453125, -2.015625, -0.43310546875, 1.1494140625, 2.73193359375, 4.314453125, 5.89697265625, 7.4794921875, 9.06201171875, 10.64453125, 12.22705078125, 13.8095703125, 15.39208984375, 16.974609375, 18.55712890625, 20.1396484375, 21.72216796875, 23.3046875, 24.88720703125, 26.4697265625, 28.05224609375, 29.634765625, 31.21728515625, 32.7998046875, 34.38232421875, 35.96484375, 37.54736328125, 39.1298828125, 40.71240234375, 42.294921875, 43.87744140625, 45.4599609375, 47.04248046875, 48.625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 10.0, 10.0, 19.0, 46.0, 92.0, 155.0, 199.0, 177.0, 122.0, 97.0, 47.0, 21.0, 6.0, 8.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-218.65194702148438, -213.535888671875, -208.41983032226562, -203.30377197265625, -198.18771362304688, -193.0716552734375, -187.95559692382812, -182.83953857421875, -177.72348022460938, -172.607421875, -167.49136352539062, -162.37530517578125, -157.25924682617188, -152.1431884765625, -147.02713012695312, -141.91107177734375, -136.79501342773438, -131.678955078125, -126.56289672851562, -121.44683837890625, -116.33078002929688, -111.2147216796875, -106.09866333007812, -100.98260498046875, -95.86656188964844, -90.75050354003906, -85.63444519042969, -80.51838684082031, -75.40232849121094, -70.28627014160156, -65.17021179199219, -60.05415725708008, -54.938087463378906, -49.82202911376953, -44.705970764160156, -39.58991241455078, -34.473854064941406, -29.357797622680664, -24.241741180419922, -19.125682830810547, -14.009624481201172, -8.893566131591797, -3.7775087356567383, 1.3385486602783203, 6.454607009887695, 11.57066535949707, 16.686721801757812, 21.802780151367188, 26.918838500976562, 32.03489685058594, 37.15095520019531, 42.26701354980469, 47.38307189941406, 52.49913024902344, 57.61518478393555, 62.73124313354492, 67.84730529785156, 72.96336364746094, 78.07942199707031, 83.19548034667969, 88.31153869628906, 93.42759704589844, 98.54365539550781, 103.65971374511719, 108.77576446533203]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 3.0, 10.0, 10.0, 7.0, 13.0, 19.0, 21.0, 12.0, 22.0, 24.0, 22.0, 31.0, 23.0, 19.0, 31.0, 33.0, 43.0, 42.0, 27.0, 32.0, 44.0, 44.0, 36.0, 30.0, 29.0, 54.0, 43.0, 38.0, 33.0, 19.0, 32.0, 21.0, 16.0, 20.0, 16.0, 14.0, 13.0, 9.0, 15.0, 8.0, 6.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-58.485225677490234, -56.39339828491211, -54.30157470703125, -52.209747314453125, -50.117919921875, -48.026092529296875, -45.93426513671875, -43.84244155883789, -41.750614166259766, -39.65878677368164, -37.56696319580078, -35.475135803222656, -33.38330841064453, -31.291481018066406, -29.199655532836914, -27.107830047607422, -25.016002655029297, -22.924175262451172, -20.83234977722168, -18.740524291992188, -16.648696899414062, -14.556870460510254, -12.465044021606445, -10.373217582702637, -8.281391143798828, -6.1895647048950195, -4.097738265991211, -2.0059118270874023, 0.08591461181640625, 2.177741050720215, 4.269567489624023, 6.361393928527832, 8.453216552734375, 10.545042991638184, 12.636869430541992, 14.7286958694458, 16.82052230834961, 18.912349700927734, 21.004175186157227, 23.09600067138672, 25.187828063964844, 27.27965545654297, 29.37148094177246, 31.463306427001953, 33.55513381958008, 35.6469612121582, 37.73878479003906, 39.83061218261719, 41.92243957519531, 44.01426696777344, 46.10609436035156, 48.19791793823242, 50.28974533081055, 52.38157272338867, 54.47339630126953, 56.565223693847656, 58.65705108642578, 60.748878479003906, 62.84070587158203, 64.93253326416016, 67.02435302734375, 69.11618041992188, 71.2080078125, 73.29983520507812, 75.39166259765625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 8.0, 12.0, 10.0, 12.0, 13.0, 20.0, 27.0, 20.0, 32.0, 39.0, 25.0, 48.0, 39.0, 31.0, 38.0, 43.0, 40.0, 44.0, 60.0, 45.0, 49.0, 44.0, 42.0, 36.0, 28.0, 37.0, 25.0, 16.0, 12.0, 18.0, 18.0, 12.0, 12.0, 9.0, 9.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9765625, -10.5765380859375, -10.176513671875, -9.7764892578125, -9.37646484375, -8.9764404296875, -8.576416015625, -8.1763916015625, -7.7763671875, -7.3763427734375, -6.976318359375, -6.5762939453125, -6.17626953125, -5.7762451171875, -5.376220703125, -4.9761962890625, -4.576171875, -4.1761474609375, -3.776123046875, -3.3760986328125, -2.97607421875, -2.5760498046875, -2.176025390625, -1.7760009765625, -1.3759765625, -0.9759521484375, -0.575927734375, -0.1759033203125, 0.22412109375, 0.6241455078125, 1.024169921875, 1.4241943359375, 1.82421875, 2.2242431640625, 2.624267578125, 3.0242919921875, 3.42431640625, 3.8243408203125, 4.224365234375, 4.6243896484375, 5.0244140625, 5.4244384765625, 5.824462890625, 6.2244873046875, 6.62451171875, 7.0245361328125, 7.424560546875, 7.8245849609375, 8.224609375, 8.6246337890625, 9.024658203125, 9.4246826171875, 9.82470703125, 10.2247314453125, 10.624755859375, 11.0247802734375, 11.4248046875, 11.8248291015625, 12.224853515625, 12.6248779296875, 13.02490234375, 13.4249267578125, 13.824951171875, 14.2249755859375, 14.625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 12.0, 10.0, 13.0, 22.0, 34.0, 62.0, 94.0, 123.0, 182.0, 299.0, 465.0, 754.0, 1168.0, 1744.0, 2748.0, 4466.0, 7058.0, 11926.0, 19515.0, 32792.0, 55381.0, 97167.0, 169219.0, 233223.0, 171083.0, 98477.0, 56215.0, 33118.0, 19590.0, 12025.0, 7345.0, 4481.0, 2758.0, 1767.0, 1135.0, 737.0, 454.0, 318.0, 220.0, 145.0, 77.0, 36.0, 35.0, 37.0, 9.0, 6.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0], "bins": [-1.4765625, -1.43377685546875, -1.3909912109375, -1.34820556640625, -1.305419921875, -1.26263427734375, -1.2198486328125, -1.17706298828125, -1.13427734375, -1.09149169921875, -1.0487060546875, -1.00592041015625, -0.963134765625, -0.92034912109375, -0.8775634765625, -0.83477783203125, -0.7919921875, -0.74920654296875, -0.7064208984375, -0.66363525390625, -0.620849609375, -0.57806396484375, -0.5352783203125, -0.49249267578125, -0.44970703125, -0.40692138671875, -0.3641357421875, -0.32135009765625, -0.278564453125, -0.23577880859375, -0.1929931640625, -0.15020751953125, -0.107421875, -0.06463623046875, -0.0218505859375, 0.02093505859375, 0.063720703125, 0.10650634765625, 0.1492919921875, 0.19207763671875, 0.23486328125, 0.27764892578125, 0.3204345703125, 0.36322021484375, 0.406005859375, 0.44879150390625, 0.4915771484375, 0.53436279296875, 0.5771484375, 0.61993408203125, 0.6627197265625, 0.70550537109375, 0.748291015625, 0.79107666015625, 0.8338623046875, 0.87664794921875, 0.91943359375, 0.96221923828125, 1.0050048828125, 1.04779052734375, 1.090576171875, 1.13336181640625, 1.1761474609375, 1.21893310546875, 1.26171875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 5.0, 4.0, 9.0, 12.0, 13.0, 21.0, 13.0, 16.0, 19.0, 19.0, 35.0, 27.0, 27.0, 35.0, 24.0, 39.0, 45.0, 38.0, 32.0, 37.0, 1056.0, 50.0, 40.0, 51.0, 36.0, 28.0, 27.0, 36.0, 25.0, 28.0, 18.0, 19.0, 22.0, 25.0, 16.0, 12.0, 20.0, 9.0, 9.0, 6.0, 4.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.95703125, -6.728271484375, -6.49951171875, -6.270751953125, -6.0419921875, -5.813232421875, -5.58447265625, -5.355712890625, -5.126953125, -4.898193359375, -4.66943359375, -4.440673828125, -4.2119140625, -3.983154296875, -3.75439453125, -3.525634765625, -3.296875, -3.068115234375, -2.83935546875, -2.610595703125, -2.3818359375, -2.153076171875, -1.92431640625, -1.695556640625, -1.466796875, -1.238037109375, -1.00927734375, -0.780517578125, -0.5517578125, -0.322998046875, -0.09423828125, 0.134521484375, 0.36328125, 0.592041015625, 0.82080078125, 1.049560546875, 1.2783203125, 1.507080078125, 1.73583984375, 1.964599609375, 2.193359375, 2.422119140625, 2.65087890625, 2.879638671875, 3.1083984375, 3.337158203125, 3.56591796875, 3.794677734375, 4.0234375, 4.252197265625, 4.48095703125, 4.709716796875, 4.9384765625, 5.167236328125, 5.39599609375, 5.624755859375, 5.853515625, 6.082275390625, 6.31103515625, 6.539794921875, 6.7685546875, 6.997314453125, 7.22607421875, 7.454833984375, 7.68359375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 7.0, 13.0, 21.0, 39.0, 47.0, 68.0, 86.0, 143.0, 200.0, 310.0, 435.0, 619.0, 865.0, 1205.0, 1835.0, 2687.0, 3874.0, 5899.0, 8602.0, 12932.0, 19654.0, 30532.0, 47807.0, 75894.0, 120209.0, 282108.0, 1111028.0, 133961.0, 83877.0, 52976.0, 33905.0, 21652.0, 14356.0, 9460.0, 6208.0, 4257.0, 2943.0, 1945.0, 1363.0, 971.0, 680.0, 465.0, 311.0, 220.0, 142.0, 101.0, 70.0, 60.0, 38.0, 15.0, 17.0, 14.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.56640625, -0.5493011474609375, -0.532196044921875, -0.5150909423828125, -0.49798583984375, -0.4808807373046875, -0.463775634765625, -0.4466705322265625, -0.4295654296875, -0.4124603271484375, -0.395355224609375, -0.3782501220703125, -0.36114501953125, -0.3440399169921875, -0.326934814453125, -0.3098297119140625, -0.292724609375, -0.2756195068359375, -0.258514404296875, -0.2414093017578125, -0.22430419921875, -0.2071990966796875, -0.190093994140625, -0.1729888916015625, -0.1558837890625, -0.1387786865234375, -0.121673583984375, -0.1045684814453125, -0.08746337890625, -0.0703582763671875, -0.053253173828125, -0.0361480712890625, -0.01904296875, -0.0019378662109375, 0.015167236328125, 0.0322723388671875, 0.04937744140625, 0.0664825439453125, 0.083587646484375, 0.1006927490234375, 0.1177978515625, 0.1349029541015625, 0.152008056640625, 0.1691131591796875, 0.18621826171875, 0.2033233642578125, 0.220428466796875, 0.2375335693359375, 0.254638671875, 0.2717437744140625, 0.288848876953125, 0.3059539794921875, 0.32305908203125, 0.3401641845703125, 0.357269287109375, 0.3743743896484375, 0.3914794921875, 0.4085845947265625, 0.425689697265625, 0.4427947998046875, 0.45989990234375, 0.4770050048828125, 0.494110107421875, 0.5112152099609375, 0.5283203125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 3.0, 7.0, 17.0, 5.0, 14.0, 19.0, 21.0, 27.0, 37.0, 48.0, 129.0, 285.0, 141.0, 37.0, 35.0, 23.0, 27.0, 14.0, 12.0, 13.0, 11.0, 12.0, 6.0, 0.0, 4.0, 7.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1016845703125, -0.09874248504638672, -0.09580039978027344, -0.09285831451416016, -0.08991622924804688, -0.0869741439819336, -0.08403205871582031, -0.08108997344970703, -0.07814788818359375, -0.07520580291748047, -0.07226371765136719, -0.0693216323852539, -0.06637954711914062, -0.06343746185302734, -0.06049537658691406, -0.05755329132080078, -0.0546112060546875, -0.05166912078857422, -0.04872703552246094, -0.045784950256347656, -0.042842864990234375, -0.039900779724121094, -0.03695869445800781, -0.03401660919189453, -0.03107452392578125, -0.02813243865966797, -0.025190353393554688, -0.022248268127441406, -0.019306182861328125, -0.016364097595214844, -0.013422012329101562, -0.010479927062988281, -0.007537841796875, -0.004595756530761719, -0.0016536712646484375, 0.0012884140014648438, 0.004230499267578125, 0.007172584533691406, 0.010114669799804688, 0.013056755065917969, 0.01599884033203125, 0.01894092559814453, 0.021883010864257812, 0.024825096130371094, 0.027767181396484375, 0.030709266662597656, 0.03365135192871094, 0.03659343719482422, 0.0395355224609375, 0.04247760772705078, 0.04541969299316406, 0.048361778259277344, 0.051303863525390625, 0.054245948791503906, 0.05718803405761719, 0.06013011932373047, 0.06307220458984375, 0.06601428985595703, 0.06895637512207031, 0.0718984603881836, 0.07484054565429688, 0.07778263092041016, 0.08072471618652344, 0.08366680145263672, 0.08660888671875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 7.0, 6.0, 3.0, 4.0, 10.0, 13.0, 20.0, 20.0, 19.0, 24.0, 33.0, 70.0, 164.0, 592.0, 15490.0, 1021452.0, 9782.0, 498.0, 124.0, 57.0, 32.0, 28.0, 17.0, 14.0, 18.0, 9.0, 2.0, 6.0, 6.0, 4.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.08984375, -2.01885986328125, -1.9478759765625, -1.87689208984375, -1.805908203125, -1.73492431640625, -1.6639404296875, -1.59295654296875, -1.52197265625, -1.45098876953125, -1.3800048828125, -1.30902099609375, -1.238037109375, -1.16705322265625, -1.0960693359375, -1.02508544921875, -0.9541015625, -0.88311767578125, -0.8121337890625, -0.74114990234375, -0.670166015625, -0.59918212890625, -0.5281982421875, -0.45721435546875, -0.38623046875, -0.31524658203125, -0.2442626953125, -0.17327880859375, -0.102294921875, -0.03131103515625, 0.0396728515625, 0.11065673828125, 0.181640625, 0.25262451171875, 0.3236083984375, 0.39459228515625, 0.465576171875, 0.53656005859375, 0.6075439453125, 0.67852783203125, 0.74951171875, 0.82049560546875, 0.8914794921875, 0.96246337890625, 1.033447265625, 1.10443115234375, 1.1754150390625, 1.24639892578125, 1.3173828125, 1.38836669921875, 1.4593505859375, 1.53033447265625, 1.601318359375, 1.67230224609375, 1.7432861328125, 1.81427001953125, 1.88525390625, 1.95623779296875, 2.0272216796875, 2.09820556640625, 2.169189453125, 2.24017333984375, 2.3111572265625, 2.38214111328125, 2.453125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 7.0, 20.0, 52.0, 101.0, 289.0, 297.0, 128.0, 63.0, 23.0, 8.0, 11.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2532458007335663, -0.23838427662849426, -0.22352273762226105, -0.20866119861602783, -0.1937996745109558, -0.1789381504058838, -0.16407661139965057, -0.14921507239341736, -0.13435354828834534, -0.11949201673269272, -0.1046304851770401, -0.08976895362138748, -0.07490742206573486, -0.060045890510082245, -0.045184358954429626, -0.030322827398777008, -0.01546129584312439, -0.0005997642874717712, 0.014261767268180847, 0.029123298823833466, 0.043984830379486084, 0.0588463619351387, 0.07370789349079132, 0.08856942504644394, 0.10343095660209656, 0.11829248815774918, 0.1331540197134018, 0.148015558719635, 0.16287708282470703, 0.17773860692977905, 0.19260014593601227, 0.20746168494224548, 0.22232317924499512, 0.23718470335006714, 0.25204622745513916, 0.26690778136253357, 0.2817693054676056, 0.2966308295726776, 0.311492383480072, 0.32635390758514404, 0.34121543169021606, 0.3560769557952881, 0.3709384799003601, 0.3858000338077545, 0.40066155791282654, 0.41552308201789856, 0.43038463592529297, 0.445246160030365, 0.460107684135437, 0.47496920824050903, 0.48983073234558105, 0.5046922564506531, 0.5195537805557251, 0.5344153642654419, 0.5492768883705139, 0.5641384124755859, 0.578999936580658, 0.59386146068573, 0.608722984790802, 0.623584508895874, 0.6384460926055908, 0.6533076167106628, 0.6681691408157349, 0.6830306649208069, 0.6978921890258789]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 6.0, 6.0, 10.0, 9.0, 13.0, 10.0, 13.0, 14.0, 21.0, 18.0, 29.0, 26.0, 30.0, 31.0, 25.0, 46.0, 39.0, 48.0, 45.0, 30.0, 32.0, 31.0, 50.0, 57.0, 34.0, 42.0, 41.0, 37.0, 29.0, 22.0, 19.0, 19.0, 17.0, 15.0, 14.0, 17.0, 18.0, 10.0, 6.0, 7.0, 6.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.17142736911773682, -0.16631774604320526, -0.1612081080675125, -0.15609848499298096, -0.1509888470172882, -0.14587922394275665, -0.1407695859670639, -0.13565996289253235, -0.1305503249168396, -0.12544070184230804, -0.1203310638666153, -0.11522143334150314, -0.11011180281639099, -0.10500217974185944, -0.09989254921674728, -0.09478291869163513, -0.08967329561710358, -0.08456366509199142, -0.07945403456687927, -0.07434440404176712, -0.06923477351665497, -0.06412515044212341, -0.05901551991701126, -0.05390588939189911, -0.04879625886678696, -0.043686628341674805, -0.03857699781656265, -0.0334673710167408, -0.028357740491628647, -0.023248109966516495, -0.018138481304049492, -0.013028852641582489, -0.007919222116470337, -0.0028095925226807594, 0.002300037071108818, 0.0074096666648983955, 0.012519296258687973, 0.017628926783800125, 0.022738555446267128, 0.02784818410873413, 0.03295781463384628, 0.038067445158958435, 0.04317707568407059, 0.04828670248389244, 0.05339633300900459, 0.058505963534116745, 0.0636155903339386, 0.06872522085905075, 0.0738348513841629, 0.07894448190927505, 0.08405411243438721, 0.08916374295949936, 0.09427337348461151, 0.09938299655914307, 0.10449262708425522, 0.10960225760936737, 0.11471188813447952, 0.11982151865959167, 0.12493114918470383, 0.13004077970981598, 0.13515040278434753, 0.14026004076004028, 0.14536966383457184, 0.1504792869091034, 0.15558892488479614]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 7.0, 12.0, 10.0, 12.0, 13.0, 20.0, 27.0, 20.0, 34.0, 37.0, 26.0, 47.0, 39.0, 32.0, 36.0, 45.0, 39.0, 44.0, 60.0, 45.0, 50.0, 43.0, 43.0, 36.0, 27.0, 37.0, 25.0, 16.0, 12.0, 18.0, 18.0, 12.0, 11.0, 11.0, 8.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.96875, -10.56884765625, -10.1689453125, -9.76904296875, -9.369140625, -8.96923828125, -8.5693359375, -8.16943359375, -7.76953125, -7.36962890625, -6.9697265625, -6.56982421875, -6.169921875, -5.77001953125, -5.3701171875, -4.97021484375, -4.5703125, -4.17041015625, -3.7705078125, -3.37060546875, -2.970703125, -2.57080078125, -2.1708984375, -1.77099609375, -1.37109375, -0.97119140625, -0.5712890625, -0.17138671875, 0.228515625, 0.62841796875, 1.0283203125, 1.42822265625, 1.828125, 2.22802734375, 2.6279296875, 3.02783203125, 3.427734375, 3.82763671875, 4.2275390625, 4.62744140625, 5.02734375, 5.42724609375, 5.8271484375, 6.22705078125, 6.626953125, 7.02685546875, 7.4267578125, 7.82666015625, 8.2265625, 8.62646484375, 9.0263671875, 9.42626953125, 9.826171875, 10.22607421875, 10.6259765625, 11.02587890625, 11.42578125, 11.82568359375, 12.2255859375, 12.62548828125, 13.025390625, 13.42529296875, 13.8251953125, 14.22509765625, 14.625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 10.0, 13.0, 14.0, 24.0, 47.0, 58.0, 72.0, 118.0, 180.0, 285.0, 402.0, 550.0, 823.0, 1225.0, 1921.0, 2973.0, 4602.0, 7481.0, 12223.0, 21825.0, 40416.0, 80334.0, 177162.0, 338302.0, 179681.0, 81396.0, 41284.0, 21522.0, 12629.0, 7482.0, 4766.0, 2896.0, 1900.0, 1340.0, 848.0, 549.0, 365.0, 271.0, 179.0, 120.0, 86.0, 55.0, 36.0, 30.0, 20.0, 18.0, 9.0, 3.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.75, -13.29931640625, -12.8486328125, -12.39794921875, -11.947265625, -11.49658203125, -11.0458984375, -10.59521484375, -10.14453125, -9.69384765625, -9.2431640625, -8.79248046875, -8.341796875, -7.89111328125, -7.4404296875, -6.98974609375, -6.5390625, -6.08837890625, -5.6376953125, -5.18701171875, -4.736328125, -4.28564453125, -3.8349609375, -3.38427734375, -2.93359375, -2.48291015625, -2.0322265625, -1.58154296875, -1.130859375, -0.68017578125, -0.2294921875, 0.22119140625, 0.671875, 1.12255859375, 1.5732421875, 2.02392578125, 2.474609375, 2.92529296875, 3.3759765625, 3.82666015625, 4.27734375, 4.72802734375, 5.1787109375, 5.62939453125, 6.080078125, 6.53076171875, 6.9814453125, 7.43212890625, 7.8828125, 8.33349609375, 8.7841796875, 9.23486328125, 9.685546875, 10.13623046875, 10.5869140625, 11.03759765625, 11.48828125, 11.93896484375, 12.3896484375, 12.84033203125, 13.291015625, 13.74169921875, 14.1923828125, 14.64306640625, 15.09375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 2.0, 5.0, 7.0, 4.0, 13.0, 12.0, 9.0, 12.0, 11.0, 14.0, 24.0, 16.0, 32.0, 30.0, 35.0, 52.0, 37.0, 52.0, 60.0, 62.0, 129.0, 252.0, 1375.0, 238.0, 109.0, 73.0, 63.0, 41.0, 47.0, 39.0, 31.0, 23.0, 20.0, 14.0, 17.0, 19.0, 15.0, 12.0, 6.0, 8.0, 7.0, 11.0, 6.0, 0.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.71875, -25.810302734375, -24.90185546875, -23.993408203125, -23.0849609375, -22.176513671875, -21.26806640625, -20.359619140625, -19.451171875, -18.542724609375, -17.63427734375, -16.725830078125, -15.8173828125, -14.908935546875, -14.00048828125, -13.092041015625, -12.18359375, -11.275146484375, -10.36669921875, -9.458251953125, -8.5498046875, -7.641357421875, -6.73291015625, -5.824462890625, -4.916015625, -4.007568359375, -3.09912109375, -2.190673828125, -1.2822265625, -0.373779296875, 0.53466796875, 1.443115234375, 2.3515625, 3.260009765625, 4.16845703125, 5.076904296875, 5.9853515625, 6.893798828125, 7.80224609375, 8.710693359375, 9.619140625, 10.527587890625, 11.43603515625, 12.344482421875, 13.2529296875, 14.161376953125, 15.06982421875, 15.978271484375, 16.88671875, 17.795166015625, 18.70361328125, 19.612060546875, 20.5205078125, 21.428955078125, 22.33740234375, 23.245849609375, 24.154296875, 25.062744140625, 25.97119140625, 26.879638671875, 27.7880859375, 28.696533203125, 29.60498046875, 30.513427734375, 31.421875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 11.0, 22.0, 24.0, 37.0, 59.0, 81.0, 134.0, 187.0, 408.0, 875.0, 2839.0, 11760.0, 64051.0, 1147007.0, 1818166.0, 80581.0, 13997.0, 3256.0, 1088.0, 448.0, 250.0, 130.0, 89.0, 68.0, 48.0, 29.0, 22.0, 14.0, 9.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.5625, -37.2353515625, -35.908203125, -34.5810546875, -33.25390625, -31.9267578125, -30.599609375, -29.2724609375, -27.9453125, -26.6181640625, -25.291015625, -23.9638671875, -22.63671875, -21.3095703125, -19.982421875, -18.6552734375, -17.328125, -16.0009765625, -14.673828125, -13.3466796875, -12.01953125, -10.6923828125, -9.365234375, -8.0380859375, -6.7109375, -5.3837890625, -4.056640625, -2.7294921875, -1.40234375, -0.0751953125, 1.251953125, 2.5791015625, 3.90625, 5.2333984375, 6.560546875, 7.8876953125, 9.21484375, 10.5419921875, 11.869140625, 13.1962890625, 14.5234375, 15.8505859375, 17.177734375, 18.5048828125, 19.83203125, 21.1591796875, 22.486328125, 23.8134765625, 25.140625, 26.4677734375, 27.794921875, 29.1220703125, 30.44921875, 31.7763671875, 33.103515625, 34.4306640625, 35.7578125, 37.0849609375, 38.412109375, 39.7392578125, 41.06640625, 42.3935546875, 43.720703125, 45.0478515625, 46.375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 9.0, 29.0, 118.0, 271.0, 303.0, 181.0, 74.0, 18.0, 8.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.94976806640625, -106.17694091796875, -101.40411376953125, -96.63127899169922, -91.85845184326172, -87.08562469482422, -82.31278991699219, -77.53996276855469, -72.76713562011719, -67.99430847167969, -63.22147750854492, -58.448646545410156, -53.675819396972656, -48.902992248535156, -44.13016128540039, -39.357330322265625, -34.584503173828125, -29.811674118041992, -25.03884506225586, -20.266016006469727, -15.493186950683594, -10.720357894897461, -5.947528839111328, -1.1746978759765625, 3.5981292724609375, 8.37095832824707, 13.143787384033203, 17.916616439819336, 22.68944549560547, 27.4622745513916, 32.235103607177734, 37.0079345703125, 41.78077697753906, 46.55360412597656, 51.32643508911133, 56.099266052246094, 60.872093200683594, 65.6449203491211, 70.41775512695312, 75.19058227539062, 79.96340942382812, 84.73623657226562, 89.50906372070312, 94.28189849853516, 99.05472564697266, 103.82755279541016, 108.60038757324219, 113.37321472167969, 118.14604187011719, 122.91886901855469, 127.69169616699219, 132.4645233154297, 137.23736572265625, 142.01019287109375, 146.78302001953125, 151.55584716796875, 156.32867431640625, 161.10150146484375, 165.87432861328125, 170.64715576171875, 175.41998291015625, 180.1928253173828, 184.9656524658203, 189.7384796142578, 194.5113067626953]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 1.0, 5.0, 6.0, 4.0, 2.0, 3.0, 10.0, 2.0, 9.0, 21.0, 22.0, 17.0, 17.0, 19.0, 22.0, 33.0, 32.0, 30.0, 26.0, 36.0, 33.0, 32.0, 46.0, 42.0, 31.0, 42.0, 34.0, 42.0, 39.0, 40.0, 35.0, 25.0, 41.0, 31.0, 30.0, 14.0, 20.0, 15.0, 25.0, 15.0, 11.0, 5.0, 10.0, 5.0, 8.0, 2.0, 4.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-63.461021423339844, -61.39417266845703, -59.32732391357422, -57.260475158691406, -55.193626403808594, -53.12677764892578, -51.05992889404297, -48.993080139160156, -46.926231384277344, -44.85938262939453, -42.79253387451172, -40.725685119628906, -38.658836364746094, -36.59198760986328, -34.52513885498047, -32.458290100097656, -30.391441345214844, -28.32459259033203, -26.25774383544922, -24.190895080566406, -22.124046325683594, -20.05719757080078, -17.99034881591797, -15.923500061035156, -13.856651306152344, -11.789802551269531, -9.722953796386719, -7.656105041503906, -5.589256286621094, -3.5224075317382812, -1.4555587768554688, 0.6112899780273438, 2.678131103515625, 4.7449798583984375, 6.81182861328125, 8.878677368164062, 10.945526123046875, 13.012374877929688, 15.0792236328125, 17.146072387695312, 19.212921142578125, 21.279769897460938, 23.34661865234375, 25.413467407226562, 27.480316162109375, 29.547164916992188, 31.614013671875, 33.68086242675781, 35.747711181640625, 37.81455993652344, 39.88140869140625, 41.94825744628906, 44.015106201171875, 46.08195495605469, 48.1488037109375, 50.21565246582031, 52.282501220703125, 54.34934997558594, 56.41619873046875, 58.48304748535156, 60.549896240234375, 62.61674499511719, 64.68359375, 66.75044250488281, 68.81729125976562]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 5.0, 6.0, 5.0, 13.0, 8.0, 17.0, 19.0, 20.0, 16.0, 29.0, 24.0, 34.0, 38.0, 29.0, 46.0, 39.0, 39.0, 39.0, 44.0, 36.0, 54.0, 49.0, 48.0, 41.0, 43.0, 42.0, 33.0, 30.0, 26.0, 20.0, 14.0, 15.0, 14.0, 14.0, 8.0, 10.0, 7.0, 8.0, 5.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.390625, -10.9879150390625, -10.585205078125, -10.1824951171875, -9.77978515625, -9.3770751953125, -8.974365234375, -8.5716552734375, -8.1689453125, -7.7662353515625, -7.363525390625, -6.9608154296875, -6.55810546875, -6.1553955078125, -5.752685546875, -5.3499755859375, -4.947265625, -4.5445556640625, -4.141845703125, -3.7391357421875, -3.33642578125, -2.9337158203125, -2.531005859375, -2.1282958984375, -1.7255859375, -1.3228759765625, -0.920166015625, -0.5174560546875, -0.11474609375, 0.2879638671875, 0.690673828125, 1.0933837890625, 1.49609375, 1.8988037109375, 2.301513671875, 2.7042236328125, 3.10693359375, 3.5096435546875, 3.912353515625, 4.3150634765625, 4.7177734375, 5.1204833984375, 5.523193359375, 5.9259033203125, 6.32861328125, 6.7313232421875, 7.134033203125, 7.5367431640625, 7.939453125, 8.3421630859375, 8.744873046875, 9.1475830078125, 9.55029296875, 9.9530029296875, 10.355712890625, 10.7584228515625, 11.1611328125, 11.5638427734375, 11.966552734375, 12.3692626953125, 12.77197265625, 13.1746826171875, 13.577392578125, 13.9801025390625, 14.3828125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 8.0, 3.0, 7.0, 18.0, 15.0, 14.0, 30.0, 42.0, 60.0, 75.0, 144.0, 180.0, 255.0, 375.0, 553.0, 810.0, 1218.0, 1961.0, 3175.0, 5163.0, 8922.0, 15927.0, 32486.0, 84763.0, 354102.0, 1735327.0, 1511900.0, 295826.0, 74354.0, 29494.0, 14888.0, 8494.0, 4830.0, 3053.0, 1992.0, 1270.0, 789.0, 560.0, 371.0, 243.0, 164.0, 112.0, 101.0, 67.0, 38.0, 31.0, 17.0, 17.0, 10.0, 10.0, 5.0, 8.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.90625, -19.31982421875, -18.7333984375, -18.14697265625, -17.560546875, -16.97412109375, -16.3876953125, -15.80126953125, -15.21484375, -14.62841796875, -14.0419921875, -13.45556640625, -12.869140625, -12.28271484375, -11.6962890625, -11.10986328125, -10.5234375, -9.93701171875, -9.3505859375, -8.76416015625, -8.177734375, -7.59130859375, -7.0048828125, -6.41845703125, -5.83203125, -5.24560546875, -4.6591796875, -4.07275390625, -3.486328125, -2.89990234375, -2.3134765625, -1.72705078125, -1.140625, -0.55419921875, 0.0322265625, 0.61865234375, 1.205078125, 1.79150390625, 2.3779296875, 2.96435546875, 3.55078125, 4.13720703125, 4.7236328125, 5.31005859375, 5.896484375, 6.48291015625, 7.0693359375, 7.65576171875, 8.2421875, 8.82861328125, 9.4150390625, 10.00146484375, 10.587890625, 11.17431640625, 11.7607421875, 12.34716796875, 12.93359375, 13.52001953125, 14.1064453125, 14.69287109375, 15.279296875, 15.86572265625, 16.4521484375, 17.03857421875, 17.625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 4.0, 10.0, 5.0, 11.0, 14.0, 21.0, 19.0, 23.0, 32.0, 27.0, 68.0, 73.0, 100.0, 159.0, 218.0, 312.0, 510.0, 633.0, 561.0, 392.0, 259.0, 170.0, 120.0, 75.0, 62.0, 51.0, 23.0, 24.0, 23.0, 11.0, 11.0, 14.0, 7.0, 6.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-22.203125, -21.563232421875, -20.92333984375, -20.283447265625, -19.6435546875, -19.003662109375, -18.36376953125, -17.723876953125, -17.083984375, -16.444091796875, -15.80419921875, -15.164306640625, -14.5244140625, -13.884521484375, -13.24462890625, -12.604736328125, -11.96484375, -11.324951171875, -10.68505859375, -10.045166015625, -9.4052734375, -8.765380859375, -8.12548828125, -7.485595703125, -6.845703125, -6.205810546875, -5.56591796875, -4.926025390625, -4.2861328125, -3.646240234375, -3.00634765625, -2.366455078125, -1.7265625, -1.086669921875, -0.44677734375, 0.193115234375, 0.8330078125, 1.472900390625, 2.11279296875, 2.752685546875, 3.392578125, 4.032470703125, 4.67236328125, 5.312255859375, 5.9521484375, 6.592041015625, 7.23193359375, 7.871826171875, 8.51171875, 9.151611328125, 9.79150390625, 10.431396484375, 11.0712890625, 11.711181640625, 12.35107421875, 12.990966796875, 13.630859375, 14.270751953125, 14.91064453125, 15.550537109375, 16.1904296875, 16.830322265625, 17.47021484375, 18.110107421875, 18.75]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 5.0, 2.0, 6.0, 23.0, 10.0, 18.0, 34.0, 42.0, 55.0, 86.0, 117.0, 169.0, 282.0, 492.0, 846.0, 1672.0, 3237.0, 6668.0, 14396.0, 35064.0, 106600.0, 586565.0, 2803919.0, 480308.0, 95215.0, 32324.0, 13523.0, 5972.0, 2975.0, 1578.0, 793.0, 473.0, 270.0, 179.0, 87.0, 84.0, 49.0, 39.0, 37.0, 26.0, 10.0, 11.0, 5.0, 4.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.109375, -28.153564453125, -27.19775390625, -26.241943359375, -25.2861328125, -24.330322265625, -23.37451171875, -22.418701171875, -21.462890625, -20.507080078125, -19.55126953125, -18.595458984375, -17.6396484375, -16.683837890625, -15.72802734375, -14.772216796875, -13.81640625, -12.860595703125, -11.90478515625, -10.948974609375, -9.9931640625, -9.037353515625, -8.08154296875, -7.125732421875, -6.169921875, -5.214111328125, -4.25830078125, -3.302490234375, -2.3466796875, -1.390869140625, -0.43505859375, 0.520751953125, 1.4765625, 2.432373046875, 3.38818359375, 4.343994140625, 5.2998046875, 6.255615234375, 7.21142578125, 8.167236328125, 9.123046875, 10.078857421875, 11.03466796875, 11.990478515625, 12.9462890625, 13.902099609375, 14.85791015625, 15.813720703125, 16.76953125, 17.725341796875, 18.68115234375, 19.636962890625, 20.5927734375, 21.548583984375, 22.50439453125, 23.460205078125, 24.416015625, 25.371826171875, 26.32763671875, 27.283447265625, 28.2392578125, 29.195068359375, 30.15087890625, 31.106689453125, 32.0625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 11.0, 31.0, 47.0, 73.0, 110.0, 161.0, 179.0, 143.0, 110.0, 73.0, 29.0, 21.0, 9.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.40711212158203, -116.99440002441406, -112.58168029785156, -108.1689682006836, -103.75625610351562, -99.34353637695312, -94.93082427978516, -90.51811218261719, -86.10539245605469, -81.69268035888672, -77.27996063232422, -72.86724853515625, -68.45453643798828, -64.04182434082031, -59.62910461425781, -55.216392517089844, -50.803680419921875, -46.39096450805664, -41.97825241088867, -37.56553649902344, -33.15282440185547, -28.740108489990234, -24.327392578125, -19.9146785736084, -15.501964569091797, -11.089250564575195, -6.676535606384277, -2.2638206481933594, 2.148893356323242, 6.561607360839844, 10.974323272705078, 15.38703727722168, 19.799758911132812, 24.212472915649414, 28.625186920166016, 33.03790283203125, 37.45061492919922, 41.86333084106445, 46.27604675292969, 50.688758850097656, 55.10147476196289, 59.514190673828125, 63.926902770996094, 68.33961486816406, 72.75233459472656, 77.16504669189453, 81.5777587890625, 85.990478515625, 90.40319061279297, 94.81590270996094, 99.22862243652344, 103.6413345336914, 108.05404663085938, 112.46676635742188, 116.87947845458984, 121.29219055175781, 125.70491027832031, 130.1176300048828, 134.53033447265625, 138.94305419921875, 143.35577392578125, 147.7684783935547, 152.1811981201172, 156.5939178466797, 161.00662231445312]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 9.0, 5.0, 5.0, 12.0, 15.0, 13.0, 20.0, 12.0, 22.0, 18.0, 25.0, 33.0, 22.0, 33.0, 33.0, 36.0, 23.0, 42.0, 44.0, 41.0, 43.0, 38.0, 30.0, 35.0, 29.0, 35.0, 42.0, 25.0, 38.0, 32.0, 38.0, 25.0, 23.0, 18.0, 20.0, 11.0, 11.0, 10.0, 5.0, 8.0, 9.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-74.04548645019531, -71.90771484375, -69.76993560791016, -67.63216400146484, -65.49439239501953, -63.35661315917969, -61.218841552734375, -59.0810661315918, -56.94329071044922, -54.80551528930664, -52.66774368286133, -50.52996826171875, -48.39219284057617, -46.254417419433594, -44.11664581298828, -41.9788703918457, -39.84109878540039, -37.70332336425781, -35.5655517578125, -33.42777633666992, -31.290000915527344, -29.1522274017334, -27.014453887939453, -24.876678466796875, -22.73890495300293, -20.601131439208984, -18.463356018066406, -16.32558250427246, -14.1878080368042, -12.050033569335938, -9.912260055541992, -7.7744855880737305, -5.636711120605469, -3.498936891555786, -1.3611626625061035, 0.776611328125, 2.9143857955932617, 5.052160263061523, 7.189933776855469, 9.32770824432373, 11.465482711791992, 13.603257179260254, 15.741031646728516, 17.87880516052246, 20.016578674316406, 22.154354095458984, 24.29212760925293, 26.429901123046875, 28.567676544189453, 30.7054500579834, 32.843223571777344, 34.98099899291992, 37.1187744140625, 39.25654602050781, 41.39432144165039, 43.53209686279297, 45.66986846923828, 47.80764389038086, 49.94541549682617, 52.08319091796875, 54.22096633911133, 56.358741760253906, 58.49651336669922, 60.6342887878418, 62.772064208984375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 9.0, 6.0, 9.0, 10.0, 8.0, 17.0, 17.0, 23.0, 15.0, 36.0, 27.0, 24.0, 21.0, 40.0, 28.0, 39.0, 42.0, 36.0, 38.0, 35.0, 34.0, 36.0, 45.0, 39.0, 40.0, 29.0, 40.0, 34.0, 26.0, 28.0, 29.0, 20.0, 15.0, 20.0, 12.0, 8.0, 12.0, 13.0, 7.0, 2.0, 5.0, 5.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-12.4140625, -12.0390625, -11.6640625, -11.2890625, -10.9140625, -10.5390625, -10.1640625, -9.7890625, -9.4140625, -9.0390625, -8.6640625, -8.2890625, -7.9140625, -7.5390625, -7.1640625, -6.7890625, -6.4140625, -6.0390625, -5.6640625, -5.2890625, -4.9140625, -4.5390625, -4.1640625, -3.7890625, -3.4140625, -3.0390625, -2.6640625, -2.2890625, -1.9140625, -1.5390625, -1.1640625, -0.7890625, -0.4140625, -0.0390625, 0.3359375, 0.7109375, 1.0859375, 1.4609375, 1.8359375, 2.2109375, 2.5859375, 2.9609375, 3.3359375, 3.7109375, 4.0859375, 4.4609375, 4.8359375, 5.2109375, 5.5859375, 5.9609375, 6.3359375, 6.7109375, 7.0859375, 7.4609375, 7.8359375, 8.2109375, 8.5859375, 8.9609375, 9.3359375, 9.7109375, 10.0859375, 10.4609375, 10.8359375, 11.2109375, 11.5859375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 10.0, 7.0, 20.0, 13.0, 39.0, 49.0, 47.0, 61.0, 106.0, 155.0, 203.0, 319.0, 514.0, 764.0, 1080.0, 1856.0, 3009.0, 4930.0, 8207.0, 14012.0, 24670.0, 45167.0, 85517.0, 161265.0, 261549.0, 198696.0, 106909.0, 56227.0, 30482.0, 17305.0, 9863.0, 5849.0, 3471.0, 2215.0, 1362.0, 882.0, 579.0, 344.0, 228.0, 174.0, 149.0, 72.0, 60.0, 41.0, 27.0, 17.0, 11.0, 8.0, 8.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.861328125, -1.8025665283203125, -1.743804931640625, -1.6850433349609375, -1.62628173828125, -1.5675201416015625, -1.508758544921875, -1.4499969482421875, -1.3912353515625, -1.3324737548828125, -1.273712158203125, -1.2149505615234375, -1.15618896484375, -1.0974273681640625, -1.038665771484375, -0.9799041748046875, -0.921142578125, -0.8623809814453125, -0.803619384765625, -0.7448577880859375, -0.68609619140625, -0.6273345947265625, -0.568572998046875, -0.5098114013671875, -0.4510498046875, -0.3922882080078125, -0.333526611328125, -0.2747650146484375, -0.21600341796875, -0.1572418212890625, -0.098480224609375, -0.0397186279296875, 0.01904296875, 0.0778045654296875, 0.136566162109375, 0.1953277587890625, 0.25408935546875, 0.3128509521484375, 0.371612548828125, 0.4303741455078125, 0.4891357421875, 0.5478973388671875, 0.606658935546875, 0.6654205322265625, 0.72418212890625, 0.7829437255859375, 0.841705322265625, 0.9004669189453125, 0.959228515625, 1.0179901123046875, 1.076751708984375, 1.1355133056640625, 1.19427490234375, 1.2530364990234375, 1.311798095703125, 1.3705596923828125, 1.4293212890625, 1.4880828857421875, 1.546844482421875, 1.6056060791015625, 1.66436767578125, 1.7231292724609375, 1.781890869140625, 1.8406524658203125, 1.8994140625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 0.0, 3.0, 6.0, 3.0, 7.0, 8.0, 9.0, 10.0, 11.0, 14.0, 16.0, 17.0, 15.0, 22.0, 29.0, 15.0, 34.0, 32.0, 34.0, 29.0, 32.0, 38.0, 56.0, 27.0, 1054.0, 48.0, 34.0, 41.0, 36.0, 36.0, 27.0, 27.0, 25.0, 28.0, 25.0, 24.0, 18.0, 21.0, 21.0, 12.0, 21.0, 13.0, 10.0, 7.0, 15.0, 7.0, 8.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8046875, -6.5694580078125, -6.334228515625, -6.0989990234375, -5.86376953125, -5.6285400390625, -5.393310546875, -5.1580810546875, -4.9228515625, -4.6876220703125, -4.452392578125, -4.2171630859375, -3.98193359375, -3.7467041015625, -3.511474609375, -3.2762451171875, -3.041015625, -2.8057861328125, -2.570556640625, -2.3353271484375, -2.10009765625, -1.8648681640625, -1.629638671875, -1.3944091796875, -1.1591796875, -0.9239501953125, -0.688720703125, -0.4534912109375, -0.21826171875, 0.0169677734375, 0.252197265625, 0.4874267578125, 0.72265625, 0.9578857421875, 1.193115234375, 1.4283447265625, 1.66357421875, 1.8988037109375, 2.134033203125, 2.3692626953125, 2.6044921875, 2.8397216796875, 3.074951171875, 3.3101806640625, 3.54541015625, 3.7806396484375, 4.015869140625, 4.2510986328125, 4.486328125, 4.7215576171875, 4.956787109375, 5.1920166015625, 5.42724609375, 5.6624755859375, 5.897705078125, 6.1329345703125, 6.3681640625, 6.6033935546875, 6.838623046875, 7.0738525390625, 7.30908203125, 7.5443115234375, 7.779541015625, 8.0147705078125, 8.25]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 9.0, 4.0, 10.0, 11.0, 14.0, 25.0, 30.0, 56.0, 78.0, 128.0, 170.0, 285.0, 376.0, 647.0, 1166.0, 2036.0, 3794.0, 7241.0, 14558.0, 30572.0, 65779.0, 151593.0, 1218099.0, 369897.0, 124042.0, 54697.0, 25389.0, 12408.0, 6284.0, 3217.0, 1806.0, 1007.0, 581.0, 385.0, 240.0, 134.0, 116.0, 71.0, 55.0, 31.0, 22.0, 16.0, 11.0, 7.0, 7.0, 8.0, 4.0, 7.0, 2.0, 5.0, 1.0, 2.0], "bins": [-1.275390625, -1.23883056640625, -1.2022705078125, -1.16571044921875, -1.129150390625, -1.09259033203125, -1.0560302734375, -1.01947021484375, -0.98291015625, -0.94635009765625, -0.9097900390625, -0.87322998046875, -0.836669921875, -0.80010986328125, -0.7635498046875, -0.72698974609375, -0.6904296875, -0.65386962890625, -0.6173095703125, -0.58074951171875, -0.544189453125, -0.50762939453125, -0.4710693359375, -0.43450927734375, -0.39794921875, -0.36138916015625, -0.3248291015625, -0.28826904296875, -0.251708984375, -0.21514892578125, -0.1785888671875, -0.14202880859375, -0.10546875, -0.06890869140625, -0.0323486328125, 0.00421142578125, 0.040771484375, 0.07733154296875, 0.1138916015625, 0.15045166015625, 0.18701171875, 0.22357177734375, 0.2601318359375, 0.29669189453125, 0.333251953125, 0.36981201171875, 0.4063720703125, 0.44293212890625, 0.4794921875, 0.51605224609375, 0.5526123046875, 0.58917236328125, 0.625732421875, 0.66229248046875, 0.6988525390625, 0.73541259765625, 0.77197265625, 0.80853271484375, 0.8450927734375, 0.88165283203125, 0.918212890625, 0.95477294921875, 0.9913330078125, 1.02789306640625, 1.064453125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 3.0, 5.0, 5.0, 8.0, 9.0, 12.0, 19.0, 32.0, 44.0, 92.0, 462.0, 110.0, 54.0, 24.0, 18.0, 9.0, 6.0, 9.0, 6.0, 2.0, 6.0, 9.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.445556640625, -0.4322547912597656, -0.41895294189453125, -0.4056510925292969, -0.3923492431640625, -0.3790473937988281, -0.36574554443359375, -0.3524436950683594, -0.339141845703125, -0.3258399963378906, -0.31253814697265625, -0.2992362976074219, -0.2859344482421875, -0.2726325988769531, -0.25933074951171875, -0.24602890014648438, -0.23272705078125, -0.21942520141601562, -0.20612335205078125, -0.19282150268554688, -0.1795196533203125, -0.16621780395507812, -0.15291595458984375, -0.13961410522460938, -0.126312255859375, -0.11301040649414062, -0.09970855712890625, -0.08640670776367188, -0.0731048583984375, -0.059803009033203125, -0.04650115966796875, -0.033199310302734375, -0.0198974609375, -0.006595611572265625, 0.00670623779296875, 0.020008087158203125, 0.0333099365234375, 0.046611785888671875, 0.05991363525390625, 0.07321548461914062, 0.086517333984375, 0.09981918334960938, 0.11312103271484375, 0.12642288208007812, 0.1397247314453125, 0.15302658081054688, 0.16632843017578125, 0.17963027954101562, 0.19293212890625, 0.20623397827148438, 0.21953582763671875, 0.23283767700195312, 0.2461395263671875, 0.2594413757324219, 0.27274322509765625, 0.2860450744628906, 0.299346923828125, 0.3126487731933594, 0.32595062255859375, 0.3392524719238281, 0.3525543212890625, 0.3658561706542969, 0.37915802001953125, 0.3924598693847656, 0.40576171875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 3.0, 2.0, 5.0, 3.0, 2.0, 8.0, 6.0, 12.0, 10.0, 8.0, 10.0, 18.0, 25.0, 21.0, 48.0, 69.0, 161.0, 604.0, 8852.0, 1028661.0, 8999.0, 592.0, 163.0, 78.0, 50.0, 27.0, 20.0, 16.0, 12.0, 10.0, 8.0, 6.0, 8.0, 10.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.68359375, -7.43170166015625, -7.1798095703125, -6.92791748046875, -6.676025390625, -6.42413330078125, -6.1722412109375, -5.92034912109375, -5.66845703125, -5.41656494140625, -5.1646728515625, -4.91278076171875, -4.660888671875, -4.40899658203125, -4.1571044921875, -3.90521240234375, -3.6533203125, -3.40142822265625, -3.1495361328125, -2.89764404296875, -2.645751953125, -2.39385986328125, -2.1419677734375, -1.89007568359375, -1.63818359375, -1.38629150390625, -1.1343994140625, -0.88250732421875, -0.630615234375, -0.37872314453125, -0.1268310546875, 0.12506103515625, 0.376953125, 0.62884521484375, 0.8807373046875, 1.13262939453125, 1.384521484375, 1.63641357421875, 1.8883056640625, 2.14019775390625, 2.39208984375, 2.64398193359375, 2.8958740234375, 3.14776611328125, 3.399658203125, 3.65155029296875, 3.9034423828125, 4.15533447265625, 4.4072265625, 4.65911865234375, 4.9110107421875, 5.16290283203125, 5.414794921875, 5.66668701171875, 5.9185791015625, 6.17047119140625, 6.42236328125, 6.67425537109375, 6.9261474609375, 7.17803955078125, 7.429931640625, 7.68182373046875, 7.9337158203125, 8.18560791015625, 8.4375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 15.0, 22.0, 31.0, 90.0, 235.0, 408.0, 119.0, 53.0, 13.0, 13.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0584172010421753, -1.0036890506744385, -0.9489607810974121, -0.8942325711250305, -0.8395043611526489, -0.7847761511802673, -0.7300479412078857, -0.6753197312355042, -0.6205915212631226, -0.565863311290741, -0.5111351013183594, -0.4564068913459778, -0.4016786813735962, -0.3469504714012146, -0.292222261428833, -0.23749405145645142, -0.18276584148406982, -0.12803763151168823, -0.07330942153930664, -0.01858121156692505, 0.03614699840545654, 0.09087520837783813, 0.14560341835021973, 0.20033162832260132, 0.2550598382949829, 0.3097880482673645, 0.3645162582397461, 0.4192444682121277, 0.4739726781845093, 0.5287008881568909, 0.5834290981292725, 0.638157308101654, 0.6928856372833252, 0.7476138472557068, 0.8023420572280884, 0.85707026720047, 0.9117984771728516, 0.9665266871452332, 1.0212548971176147, 1.0759830474853516, 1.130711317062378, 1.1854395866394043, 1.2401677370071411, 1.294895887374878, 1.3496241569519043, 1.4043524265289307, 1.4590805768966675, 1.5138087272644043, 1.5685369968414307, 1.623265266418457, 1.6779934167861938, 1.7327215671539307, 1.787449836730957, 1.8421781063079834, 1.8969062566757202, 1.951634407043457, 2.0063626766204834, 2.0610909461975098, 2.115818977355957, 2.1705472469329834, 2.2252755165100098, 2.280003786087036, 2.3347320556640625, 2.3894600868225098, 2.444188356399536]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 7.0, 7.0, 4.0, 9.0, 8.0, 11.0, 16.0, 24.0, 14.0, 20.0, 20.0, 27.0, 13.0, 36.0, 25.0, 34.0, 34.0, 35.0, 36.0, 44.0, 39.0, 57.0, 33.0, 35.0, 33.0, 48.0, 36.0, 29.0, 22.0, 27.0, 22.0, 19.0, 25.0, 18.0, 20.0, 22.0, 15.0, 17.0, 7.0, 14.0, 10.0, 2.0, 7.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.5580988526344299, -0.5399051904678345, -0.521711528301239, -0.5035178661346436, -0.4853241741657257, -0.46713051199913025, -0.4489368200302124, -0.43074315786361694, -0.4125494956970215, -0.394355833530426, -0.37616217136383057, -0.3579684793949127, -0.33977481722831726, -0.3215811550617218, -0.30338746309280396, -0.2851938009262085, -0.26700013875961304, -0.24880647659301758, -0.23061279952526093, -0.21241912245750427, -0.1942254602909088, -0.17603179812431335, -0.1578381210565567, -0.13964444398880005, -0.12145078182220459, -0.10325711220502853, -0.08506344258785248, -0.06686977297067642, -0.048676103353500366, -0.03048243373632431, -0.012288764119148254, 0.0059049129486083984, 0.024098515510559082, 0.04229218512773514, 0.060485854744911194, 0.07867952436208725, 0.0968731939792633, 0.11506686359643936, 0.13326053321361542, 0.15145421028137207, 0.16964787244796753, 0.187841534614563, 0.20603521168231964, 0.2242288887500763, 0.24242255091667175, 0.2606162130832672, 0.27880990505218506, 0.2970035672187805, 0.315197229385376, 0.33339089155197144, 0.3515845537185669, 0.36977824568748474, 0.3879719078540802, 0.40616557002067566, 0.4243592619895935, 0.44255292415618896, 0.4607465863227844, 0.4789402484893799, 0.49713391065597534, 0.5153275728225708, 0.533521294593811, 0.5517149567604065, 0.569908618927002, 0.5881022810935974, 0.6062959432601929]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 5.0, 5.0, 3.0, 9.0, 6.0, 10.0, 10.0, 9.0, 14.0, 19.0, 22.0, 16.0, 35.0, 28.0, 24.0, 22.0, 39.0, 28.0, 39.0, 41.0, 35.0, 40.0, 33.0, 34.0, 39.0, 40.0, 41.0, 42.0, 31.0, 36.0, 36.0, 26.0, 27.0, 27.0, 24.0, 13.0, 19.0, 12.0, 9.0, 12.0, 13.0, 7.0, 2.0, 4.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-12.4140625, -12.0389404296875, -11.663818359375, -11.2886962890625, -10.91357421875, -10.5384521484375, -10.163330078125, -9.7882080078125, -9.4130859375, -9.0379638671875, -8.662841796875, -8.2877197265625, -7.91259765625, -7.5374755859375, -7.162353515625, -6.7872314453125, -6.412109375, -6.0369873046875, -5.661865234375, -5.2867431640625, -4.91162109375, -4.5364990234375, -4.161376953125, -3.7862548828125, -3.4111328125, -3.0360107421875, -2.660888671875, -2.2857666015625, -1.91064453125, -1.5355224609375, -1.160400390625, -0.7852783203125, -0.41015625, -0.0350341796875, 0.340087890625, 0.7152099609375, 1.09033203125, 1.4654541015625, 1.840576171875, 2.2156982421875, 2.5908203125, 2.9659423828125, 3.341064453125, 3.7161865234375, 4.09130859375, 4.4664306640625, 4.841552734375, 5.2166748046875, 5.591796875, 5.9669189453125, 6.342041015625, 6.7171630859375, 7.09228515625, 7.4674072265625, 7.842529296875, 8.2176513671875, 8.5927734375, 8.9678955078125, 9.343017578125, 9.7181396484375, 10.09326171875, 10.4683837890625, 10.843505859375, 11.2186279296875, 11.59375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 8.0, 15.0, 23.0, 28.0, 46.0, 46.0, 92.0, 122.0, 165.0, 251.0, 404.0, 611.0, 963.0, 1510.0, 2428.0, 4171.0, 7168.0, 13051.0, 25144.0, 50447.0, 114347.0, 324507.0, 296869.0, 105698.0, 47192.0, 23397.0, 12454.0, 6823.0, 4021.0, 2350.0, 1436.0, 938.0, 609.0, 394.0, 271.0, 170.0, 114.0, 86.0, 50.0, 33.0, 17.0, 29.0, 15.0, 14.0, 9.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-20.0625, -19.4716796875, -18.880859375, -18.2900390625, -17.69921875, -17.1083984375, -16.517578125, -15.9267578125, -15.3359375, -14.7451171875, -14.154296875, -13.5634765625, -12.97265625, -12.3818359375, -11.791015625, -11.2001953125, -10.609375, -10.0185546875, -9.427734375, -8.8369140625, -8.24609375, -7.6552734375, -7.064453125, -6.4736328125, -5.8828125, -5.2919921875, -4.701171875, -4.1103515625, -3.51953125, -2.9287109375, -2.337890625, -1.7470703125, -1.15625, -0.5654296875, 0.025390625, 0.6162109375, 1.20703125, 1.7978515625, 2.388671875, 2.9794921875, 3.5703125, 4.1611328125, 4.751953125, 5.3427734375, 5.93359375, 6.5244140625, 7.115234375, 7.7060546875, 8.296875, 8.8876953125, 9.478515625, 10.0693359375, 10.66015625, 11.2509765625, 11.841796875, 12.4326171875, 13.0234375, 13.6142578125, 14.205078125, 14.7958984375, 15.38671875, 15.9775390625, 16.568359375, 17.1591796875, 17.75]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 8.0, 9.0, 8.0, 10.0, 14.0, 24.0, 20.0, 30.0, 34.0, 36.0, 40.0, 47.0, 76.0, 76.0, 111.0, 192.0, 1424.0, 279.0, 148.0, 91.0, 73.0, 46.0, 35.0, 25.0, 39.0, 29.0, 25.0, 18.0, 13.0, 12.0, 16.0, 9.0, 7.0, 9.0, 5.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.09375, -29.0078125, -27.921875, -26.8359375, -25.75, -24.6640625, -23.578125, -22.4921875, -21.40625, -20.3203125, -19.234375, -18.1484375, -17.0625, -15.9765625, -14.890625, -13.8046875, -12.71875, -11.6328125, -10.546875, -9.4609375, -8.375, -7.2890625, -6.203125, -5.1171875, -4.03125, -2.9453125, -1.859375, -0.7734375, 0.3125, 1.3984375, 2.484375, 3.5703125, 4.65625, 5.7421875, 6.828125, 7.9140625, 9.0, 10.0859375, 11.171875, 12.2578125, 13.34375, 14.4296875, 15.515625, 16.6015625, 17.6875, 18.7734375, 19.859375, 20.9453125, 22.03125, 23.1171875, 24.203125, 25.2890625, 26.375, 27.4609375, 28.546875, 29.6328125, 30.71875, 31.8046875, 32.890625, 33.9765625, 35.0625, 36.1484375, 37.234375, 38.3203125, 39.40625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 11.0, 10.0, 11.0, 11.0, 16.0, 15.0, 41.0, 41.0, 60.0, 73.0, 80.0, 143.0, 203.0, 343.0, 656.0, 1441.0, 3850.0, 12756.0, 56524.0, 607476.0, 2299758.0, 128661.0, 22802.0, 6335.0, 2191.0, 886.0, 448.0, 245.0, 177.0, 105.0, 76.0, 54.0, 38.0, 39.0, 33.0, 18.0, 13.0, 8.0, 11.0, 9.0, 6.0, 7.0, 4.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0], "bins": [-43.84375, -42.5986328125, -41.353515625, -40.1083984375, -38.86328125, -37.6181640625, -36.373046875, -35.1279296875, -33.8828125, -32.6376953125, -31.392578125, -30.1474609375, -28.90234375, -27.6572265625, -26.412109375, -25.1669921875, -23.921875, -22.6767578125, -21.431640625, -20.1865234375, -18.94140625, -17.6962890625, -16.451171875, -15.2060546875, -13.9609375, -12.7158203125, -11.470703125, -10.2255859375, -8.98046875, -7.7353515625, -6.490234375, -5.2451171875, -4.0, -2.7548828125, -1.509765625, -0.2646484375, 0.98046875, 2.2255859375, 3.470703125, 4.7158203125, 5.9609375, 7.2060546875, 8.451171875, 9.6962890625, 10.94140625, 12.1865234375, 13.431640625, 14.6767578125, 15.921875, 17.1669921875, 18.412109375, 19.6572265625, 20.90234375, 22.1474609375, 23.392578125, 24.6376953125, 25.8828125, 27.1279296875, 28.373046875, 29.6181640625, 30.86328125, 32.1083984375, 33.353515625, 34.5986328125, 35.84375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 144.0, 611.0, 235.0, 19.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-188.13589477539062, -175.244140625, -162.35238647460938, -149.46063232421875, -136.56887817382812, -123.67711639404297, -110.78535461425781, -97.89360046386719, -85.00184631347656, -72.11009216308594, -59.21833419799805, -46.326576232910156, -33.43482208251953, -20.543067932128906, -7.65130615234375, 5.240447998046875, 18.1322021484375, 31.023958206176758, 43.915714263916016, 56.807472229003906, 69.69922637939453, 82.59098052978516, 95.48274230957031, 108.37449645996094, 121.26625061035156, 134.1580047607422, 147.0497589111328, 159.9415283203125, 172.83328247070312, 185.72503662109375, 198.61679077148438, 211.508544921875, 224.4002685546875, 237.29202270507812, 250.18377685546875, 263.0755310058594, 275.96728515625, 288.8590393066406, 301.75079345703125, 314.642578125, 327.5343017578125, 340.4260559082031, 353.31781005859375, 366.2095642089844, 379.101318359375, 391.9930725097656, 404.88482666015625, 417.776611328125, 430.6683654785156, 443.56011962890625, 456.4518737792969, 469.3436279296875, 482.2353820800781, 495.12713623046875, 508.0189208984375, 520.91064453125, 533.8024291992188, 546.6942138671875, 559.5859375, 572.4777221679688, 585.3694458007812, 598.26123046875, 611.1529541015625, 624.0447387695312, 636.9364624023438]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 4.0, 6.0, 10.0, 7.0, 7.0, 15.0, 10.0, 18.0, 17.0, 15.0, 27.0, 18.0, 30.0, 28.0, 38.0, 31.0, 37.0, 40.0, 32.0, 32.0, 33.0, 25.0, 42.0, 35.0, 47.0, 40.0, 37.0, 35.0, 26.0, 30.0, 29.0, 24.0, 26.0, 21.0, 16.0, 22.0, 7.0, 11.0, 14.0, 11.0, 9.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0], "bins": [-73.77397155761719, -71.63825988769531, -69.50255584716797, -67.3668441772461, -65.23114013671875, -63.095428466796875, -60.959720611572266, -58.824012756347656, -56.68830108642578, -54.55259323120117, -52.41688537597656, -50.28117370605469, -48.14546585083008, -46.00975799560547, -43.87405014038086, -41.73834228515625, -39.60263442993164, -37.46692657470703, -35.33121871948242, -33.19551086425781, -31.059799194335938, -28.924091339111328, -26.78838348388672, -24.65267562866211, -22.516965866088867, -20.381258010864258, -18.245548248291016, -16.109840393066406, -13.97413158416748, -11.838422775268555, -9.702714920043945, -7.5670061111450195, -5.431301116943359, -3.2955925464630127, -1.159883975982666, 0.9758243560791016, 3.1115331649780273, 5.247241973876953, 7.3829498291015625, 9.518658638000488, 11.654367446899414, 13.79007625579834, 15.925785064697266, 18.061492919921875, 20.197200775146484, 22.332910537719727, 24.468618392944336, 26.604328155517578, 28.740036010742188, 30.875743865966797, 33.011451721191406, 35.14716339111328, 37.28287124633789, 39.4185791015625, 41.55428695678711, 43.68999481201172, 45.825706481933594, 47.9614143371582, 50.09712219238281, 52.23283386230469, 54.3685417175293, 56.504249572753906, 58.639957427978516, 60.775665283203125, 62.911373138427734]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 2.0, 7.0, 5.0, 3.0, 12.0, 14.0, 16.0, 13.0, 19.0, 22.0, 32.0, 23.0, 33.0, 22.0, 34.0, 25.0, 37.0, 31.0, 41.0, 49.0, 39.0, 40.0, 51.0, 43.0, 35.0, 37.0, 33.0, 32.0, 32.0, 29.0, 29.0, 21.0, 14.0, 21.0, 20.0, 14.0, 14.0, 9.0, 9.0, 7.0, 3.0, 10.0, 1.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-12.921875, -12.533935546875, -12.14599609375, -11.758056640625, -11.3701171875, -10.982177734375, -10.59423828125, -10.206298828125, -9.818359375, -9.430419921875, -9.04248046875, -8.654541015625, -8.2666015625, -7.878662109375, -7.49072265625, -7.102783203125, -6.71484375, -6.326904296875, -5.93896484375, -5.551025390625, -5.1630859375, -4.775146484375, -4.38720703125, -3.999267578125, -3.611328125, -3.223388671875, -2.83544921875, -2.447509765625, -2.0595703125, -1.671630859375, -1.28369140625, -0.895751953125, -0.5078125, -0.119873046875, 0.26806640625, 0.656005859375, 1.0439453125, 1.431884765625, 1.81982421875, 2.207763671875, 2.595703125, 2.983642578125, 3.37158203125, 3.759521484375, 4.1474609375, 4.535400390625, 4.92333984375, 5.311279296875, 5.69921875, 6.087158203125, 6.47509765625, 6.863037109375, 7.2509765625, 7.638916015625, 8.02685546875, 8.414794921875, 8.802734375, 9.190673828125, 9.57861328125, 9.966552734375, 10.3544921875, 10.742431640625, 11.13037109375, 11.518310546875, 11.90625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 6.0, 10.0, 7.0, 9.0, 12.0, 20.0, 22.0, 35.0, 33.0, 42.0, 51.0, 90.0, 111.0, 184.0, 344.0, 778.0, 2566.0, 14877.0, 671443.0, 3468596.0, 29101.0, 3806.0, 1014.0, 415.0, 215.0, 120.0, 81.0, 55.0, 51.0, 38.0, 30.0, 25.0, 16.0, 15.0, 16.0, 12.0, 11.0, 3.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.8125, -91.6669921875, -88.521484375, -85.3759765625, -82.23046875, -79.0849609375, -75.939453125, -72.7939453125, -69.6484375, -66.5029296875, -63.357421875, -60.2119140625, -57.06640625, -53.9208984375, -50.775390625, -47.6298828125, -44.484375, -41.3388671875, -38.193359375, -35.0478515625, -31.90234375, -28.7568359375, -25.611328125, -22.4658203125, -19.3203125, -16.1748046875, -13.029296875, -9.8837890625, -6.73828125, -3.5927734375, -0.447265625, 2.6982421875, 5.84375, 8.9892578125, 12.134765625, 15.2802734375, 18.42578125, 21.5712890625, 24.716796875, 27.8623046875, 31.0078125, 34.1533203125, 37.298828125, 40.4443359375, 43.58984375, 46.7353515625, 49.880859375, 53.0263671875, 56.171875, 59.3173828125, 62.462890625, 65.6083984375, 68.75390625, 71.8994140625, 75.044921875, 78.1904296875, 81.3359375, 84.4814453125, 87.626953125, 90.7724609375, 93.91796875, 97.0634765625, 100.208984375, 103.3544921875, 106.5]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 5.0, 0.0, 9.0, 10.0, 8.0, 11.0, 25.0, 20.0, 30.0, 39.0, 65.0, 80.0, 105.0, 141.0, 231.0, 395.0, 692.0, 776.0, 505.0, 290.0, 167.0, 129.0, 87.0, 69.0, 47.0, 29.0, 31.0, 19.0, 18.0, 8.0, 5.0, 6.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.34375, -19.595458984375, -18.84716796875, -18.098876953125, -17.3505859375, -16.602294921875, -15.85400390625, -15.105712890625, -14.357421875, -13.609130859375, -12.86083984375, -12.112548828125, -11.3642578125, -10.615966796875, -9.86767578125, -9.119384765625, -8.37109375, -7.622802734375, -6.87451171875, -6.126220703125, -5.3779296875, -4.629638671875, -3.88134765625, -3.133056640625, -2.384765625, -1.636474609375, -0.88818359375, -0.139892578125, 0.6083984375, 1.356689453125, 2.10498046875, 2.853271484375, 3.6015625, 4.349853515625, 5.09814453125, 5.846435546875, 6.5947265625, 7.343017578125, 8.09130859375, 8.839599609375, 9.587890625, 10.336181640625, 11.08447265625, 11.832763671875, 12.5810546875, 13.329345703125, 14.07763671875, 14.825927734375, 15.57421875, 16.322509765625, 17.07080078125, 17.819091796875, 18.5673828125, 19.315673828125, 20.06396484375, 20.812255859375, 21.560546875, 22.308837890625, 23.05712890625, 23.805419921875, 24.5537109375, 25.302001953125, 26.05029296875, 26.798583984375, 27.546875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 3.0, 13.0, 15.0, 15.0, 29.0, 37.0, 59.0, 102.0, 180.0, 378.0, 899.0, 2317.0, 7714.0, 32981.0, 240137.0, 3472915.0, 378698.0, 43446.0, 9624.0, 2768.0, 985.0, 420.0, 225.0, 111.0, 64.0, 36.0, 40.0, 29.0, 20.0, 10.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.75, -61.03466796875, -59.3193359375, -57.60400390625, -55.888671875, -54.17333984375, -52.4580078125, -50.74267578125, -49.02734375, -47.31201171875, -45.5966796875, -43.88134765625, -42.166015625, -40.45068359375, -38.7353515625, -37.02001953125, -35.3046875, -33.58935546875, -31.8740234375, -30.15869140625, -28.443359375, -26.72802734375, -25.0126953125, -23.29736328125, -21.58203125, -19.86669921875, -18.1513671875, -16.43603515625, -14.720703125, -13.00537109375, -11.2900390625, -9.57470703125, -7.859375, -6.14404296875, -4.4287109375, -2.71337890625, -0.998046875, 0.71728515625, 2.4326171875, 4.14794921875, 5.86328125, 7.57861328125, 9.2939453125, 11.00927734375, 12.724609375, 14.43994140625, 16.1552734375, 17.87060546875, 19.5859375, 21.30126953125, 23.0166015625, 24.73193359375, 26.447265625, 28.16259765625, 29.8779296875, 31.59326171875, 33.30859375, 35.02392578125, 36.7392578125, 38.45458984375, 40.169921875, 41.88525390625, 43.6005859375, 45.31591796875, 47.03125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 10.0, 12.0, 11.0, 26.0, 36.0, 40.0, 60.0, 116.0, 103.0, 128.0, 117.0, 93.0, 70.0, 64.0, 36.0, 32.0, 25.0, 14.0, 9.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-95.65469360351562, -92.7312240600586, -89.80774688720703, -86.88427734375, -83.96080017089844, -81.0373306274414, -78.11386108398438, -75.19038391113281, -72.26691436767578, -69.34344482421875, -66.41996765136719, -63.496498107910156, -60.57302474975586, -57.64955139160156, -54.726078033447266, -51.80260467529297, -48.87913131713867, -45.955657958984375, -43.03218460083008, -40.10871124267578, -37.18524169921875, -34.26176834106445, -31.338294982910156, -28.414823532104492, -25.491350173950195, -22.5678768157959, -19.644405364990234, -16.720932006835938, -13.797459602355957, -10.873987197875977, -7.95051383972168, -5.027042388916016, -2.1035690307617188, 0.8199036121368408, 3.7433762550354004, 6.666849136352539, 9.59032154083252, 12.5137939453125, 15.437267303466797, 18.36073875427246, 21.284212112426758, 24.207685470581055, 27.13115692138672, 30.054630279541016, 32.97810363769531, 35.901573181152344, 38.825050354003906, 41.74851989746094, 44.671993255615234, 47.59546661376953, 50.51893997192383, 53.442413330078125, 56.365882873535156, 59.28935623168945, 62.21282958984375, 65.13629913330078, 68.05977630615234, 70.98324584960938, 73.90672302246094, 76.83019256591797, 79.75366973876953, 82.67713928222656, 85.60061645507812, 88.52408599853516, 91.44755554199219]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 10.0, 12.0, 5.0, 10.0, 8.0, 20.0, 11.0, 18.0, 28.0, 9.0, 31.0, 22.0, 34.0, 33.0, 30.0, 33.0, 41.0, 44.0, 38.0, 43.0, 49.0, 39.0, 41.0, 38.0, 33.0, 30.0, 36.0, 36.0, 24.0, 39.0, 28.0, 21.0, 14.0, 23.0, 10.0, 12.0, 11.0, 14.0, 14.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.27718353271484, -73.09468841552734, -70.91220092773438, -68.72970581054688, -66.5472183227539, -64.3647232055664, -62.18223571777344, -59.99974060058594, -57.81725311279297, -55.634761810302734, -53.4522705078125, -51.269779205322266, -49.08728790283203, -46.9047966003418, -44.72230529785156, -42.53981018066406, -40.35731887817383, -38.174827575683594, -35.99233627319336, -33.809844970703125, -31.62735366821289, -29.444862365722656, -27.26236915588379, -25.079877853393555, -22.89738655090332, -20.714895248413086, -18.53240394592285, -16.349910736083984, -14.167420387268066, -11.984929084777832, -9.802436828613281, -7.619945526123047, -5.4374542236328125, -3.254962682723999, -1.0724711418151855, 1.110020637512207, 3.2925119400024414, 5.475003242492676, 7.657495498657227, 9.839986801147461, 12.022478103637695, 14.20496940612793, 16.387460708618164, 18.56995391845703, 20.752445220947266, 22.9349365234375, 25.117427825927734, 27.29991912841797, 29.482410430908203, 31.664901733398438, 33.84739303588867, 36.029884338378906, 38.21237564086914, 40.394866943359375, 42.577362060546875, 44.759849548339844, 46.942344665527344, 49.12483596801758, 51.30732727050781, 53.48981857299805, 55.67230987548828, 57.854801177978516, 60.03729248046875, 62.21978759765625, 64.40227508544922]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 8.0, 8.0, 10.0, 10.0, 11.0, 9.0, 16.0, 21.0, 26.0, 15.0, 21.0, 24.0, 31.0, 32.0, 43.0, 39.0, 39.0, 46.0, 48.0, 50.0, 38.0, 57.0, 35.0, 43.0, 41.0, 33.0, 34.0, 20.0, 33.0, 32.0, 19.0, 15.0, 17.0, 9.0, 6.0, 12.0, 11.0, 5.0, 8.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0], "bins": [-14.7578125, -14.345458984375, -13.93310546875, -13.520751953125, -13.1083984375, -12.696044921875, -12.28369140625, -11.871337890625, -11.458984375, -11.046630859375, -10.63427734375, -10.221923828125, -9.8095703125, -9.397216796875, -8.98486328125, -8.572509765625, -8.16015625, -7.747802734375, -7.33544921875, -6.923095703125, -6.5107421875, -6.098388671875, -5.68603515625, -5.273681640625, -4.861328125, -4.448974609375, -4.03662109375, -3.624267578125, -3.2119140625, -2.799560546875, -2.38720703125, -1.974853515625, -1.5625, -1.150146484375, -0.73779296875, -0.325439453125, 0.0869140625, 0.499267578125, 0.91162109375, 1.323974609375, 1.736328125, 2.148681640625, 2.56103515625, 2.973388671875, 3.3857421875, 3.798095703125, 4.21044921875, 4.622802734375, 5.03515625, 5.447509765625, 5.85986328125, 6.272216796875, 6.6845703125, 7.096923828125, 7.50927734375, 7.921630859375, 8.333984375, 8.746337890625, 9.15869140625, 9.571044921875, 9.9833984375, 10.395751953125, 10.80810546875, 11.220458984375, 11.6328125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 18.0, 18.0, 29.0, 62.0, 72.0, 108.0, 177.0, 264.0, 374.0, 629.0, 1000.0, 1647.0, 2898.0, 4890.0, 8377.0, 15051.0, 27147.0, 50111.0, 93757.0, 171531.0, 250232.0, 188504.0, 105068.0, 56557.0, 30665.0, 16855.0, 9335.0, 5271.0, 3088.0, 1802.0, 1082.0, 649.0, 439.0, 248.0, 198.0, 128.0, 96.0, 49.0, 37.0, 24.0, 15.0, 18.0, 6.0, 10.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.7724609375, -1.719696044921875, -1.66693115234375, -1.614166259765625, -1.5614013671875, -1.508636474609375, -1.45587158203125, -1.403106689453125, -1.350341796875, -1.297576904296875, -1.24481201171875, -1.192047119140625, -1.1392822265625, -1.086517333984375, -1.03375244140625, -0.980987548828125, -0.92822265625, -0.875457763671875, -0.82269287109375, -0.769927978515625, -0.7171630859375, -0.664398193359375, -0.61163330078125, -0.558868408203125, -0.506103515625, -0.453338623046875, -0.40057373046875, -0.347808837890625, -0.2950439453125, -0.242279052734375, -0.18951416015625, -0.136749267578125, -0.083984375, -0.031219482421875, 0.02154541015625, 0.074310302734375, 0.1270751953125, 0.179840087890625, 0.23260498046875, 0.285369873046875, 0.338134765625, 0.390899658203125, 0.44366455078125, 0.496429443359375, 0.5491943359375, 0.601959228515625, 0.65472412109375, 0.707489013671875, 0.76025390625, 0.813018798828125, 0.86578369140625, 0.918548583984375, 0.9713134765625, 1.024078369140625, 1.07684326171875, 1.129608154296875, 1.182373046875, 1.235137939453125, 1.28790283203125, 1.340667724609375, 1.3934326171875, 1.446197509765625, 1.49896240234375, 1.551727294921875, 1.6044921875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 11.0, 7.0, 15.0, 11.0, 15.0, 18.0, 25.0, 21.0, 19.0, 25.0, 27.0, 24.0, 37.0, 32.0, 44.0, 41.0, 38.0, 38.0, 41.0, 1063.0, 36.0, 41.0, 50.0, 40.0, 23.0, 32.0, 28.0, 31.0, 22.0, 27.0, 22.0, 18.0, 31.0, 13.0, 13.0, 8.0, 6.0, 4.0, 8.0, 5.0, 3.0, 2.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.38671875, -7.12567138671875, -6.8646240234375, -6.60357666015625, -6.342529296875, -6.08148193359375, -5.8204345703125, -5.55938720703125, -5.29833984375, -5.03729248046875, -4.7762451171875, -4.51519775390625, -4.254150390625, -3.99310302734375, -3.7320556640625, -3.47100830078125, -3.2099609375, -2.94891357421875, -2.6878662109375, -2.42681884765625, -2.165771484375, -1.90472412109375, -1.6436767578125, -1.38262939453125, -1.12158203125, -0.86053466796875, -0.5994873046875, -0.33843994140625, -0.077392578125, 0.18365478515625, 0.4447021484375, 0.70574951171875, 0.966796875, 1.22784423828125, 1.4888916015625, 1.74993896484375, 2.010986328125, 2.27203369140625, 2.5330810546875, 2.79412841796875, 3.05517578125, 3.31622314453125, 3.5772705078125, 3.83831787109375, 4.099365234375, 4.36041259765625, 4.6214599609375, 4.88250732421875, 5.1435546875, 5.40460205078125, 5.6656494140625, 5.92669677734375, 6.187744140625, 6.44879150390625, 6.7098388671875, 6.97088623046875, 7.23193359375, 7.49298095703125, 7.7540283203125, 8.01507568359375, 8.276123046875, 8.53717041015625, 8.7982177734375, 9.05926513671875, 9.3203125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 4.0, 1.0, 4.0, 4.0, 8.0, 8.0, 9.0, 24.0, 35.0, 65.0, 81.0, 110.0, 163.0, 268.0, 380.0, 573.0, 998.0, 1601.0, 2486.0, 3954.0, 6271.0, 10118.0, 16517.0, 26974.0, 45124.0, 77681.0, 134987.0, 660228.0, 777741.0, 136294.0, 78034.0, 45680.0, 27123.0, 16380.0, 10215.0, 6247.0, 3947.0, 2496.0, 1488.0, 982.0, 624.0, 433.0, 254.0, 198.0, 107.0, 82.0, 48.0, 31.0, 26.0, 11.0, 12.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.73193359375, -0.7083282470703125, -0.684722900390625, -0.6611175537109375, -0.63751220703125, -0.6139068603515625, -0.590301513671875, -0.5666961669921875, -0.5430908203125, -0.5194854736328125, -0.495880126953125, -0.4722747802734375, -0.44866943359375, -0.4250640869140625, -0.401458740234375, -0.3778533935546875, -0.354248046875, -0.3306427001953125, -0.307037353515625, -0.2834320068359375, -0.25982666015625, -0.2362213134765625, -0.212615966796875, -0.1890106201171875, -0.1654052734375, -0.1417999267578125, -0.118194580078125, -0.0945892333984375, -0.07098388671875, -0.0473785400390625, -0.023773193359375, -0.0001678466796875, 0.0234375, 0.0470428466796875, 0.070648193359375, 0.0942535400390625, 0.11785888671875, 0.1414642333984375, 0.165069580078125, 0.1886749267578125, 0.2122802734375, 0.2358856201171875, 0.259490966796875, 0.2830963134765625, 0.30670166015625, 0.3303070068359375, 0.353912353515625, 0.3775177001953125, 0.401123046875, 0.4247283935546875, 0.448333740234375, 0.4719390869140625, 0.49554443359375, 0.5191497802734375, 0.542755126953125, 0.5663604736328125, 0.5899658203125, 0.6135711669921875, 0.637176513671875, 0.6607818603515625, 0.68438720703125, 0.7079925537109375, 0.731597900390625, 0.7552032470703125, 0.77880859375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 5.0, 8.0, 15.0, 23.0, 49.0, 102.0, 197.0, 368.0, 104.0, 49.0, 32.0, 12.0, 8.0, 8.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2442626953125, -0.2341442108154297, -0.22402572631835938, -0.21390724182128906, -0.20378875732421875, -0.19367027282714844, -0.18355178833007812, -0.1734333038330078, -0.1633148193359375, -0.1531963348388672, -0.14307785034179688, -0.13295936584472656, -0.12284088134765625, -0.11272239685058594, -0.10260391235351562, -0.09248542785644531, -0.082366943359375, -0.07224845886230469, -0.062129974365234375, -0.05201148986816406, -0.04189300537109375, -0.03177452087402344, -0.021656036376953125, -0.011537551879882812, -0.0014190673828125, 0.008699417114257812, 0.018817901611328125, 0.028936386108398438, 0.03905487060546875, 0.04917335510253906, 0.059291839599609375, 0.06941032409667969, 0.07952880859375, 0.08964729309082031, 0.09976577758789062, 0.10988426208496094, 0.12000274658203125, 0.13012123107910156, 0.14023971557617188, 0.1503582000732422, 0.1604766845703125, 0.1705951690673828, 0.18071365356445312, 0.19083213806152344, 0.20095062255859375, 0.21106910705566406, 0.22118759155273438, 0.2313060760498047, 0.241424560546875, 0.2515430450439453, 0.2616615295410156, 0.27178001403808594, 0.28189849853515625, 0.29201698303222656, 0.3021354675292969, 0.3122539520263672, 0.3223724365234375, 0.3324909210205078, 0.3426094055175781, 0.35272789001464844, 0.36284637451171875, 0.37296485900878906, 0.3830833435058594, 0.3932018280029297, 0.4033203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 7.0, 14.0, 16.0, 40.0, 74.0, 280.0, 1993.0, 983556.0, 61070.0, 1098.0, 222.0, 74.0, 29.0, 21.0, 9.0, 7.0, 8.0, 2.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.5625, -7.372802734375, -7.18310546875, -6.993408203125, -6.8037109375, -6.614013671875, -6.42431640625, -6.234619140625, -6.044921875, -5.855224609375, -5.66552734375, -5.475830078125, -5.2861328125, -5.096435546875, -4.90673828125, -4.717041015625, -4.52734375, -4.337646484375, -4.14794921875, -3.958251953125, -3.7685546875, -3.578857421875, -3.38916015625, -3.199462890625, -3.009765625, -2.820068359375, -2.63037109375, -2.440673828125, -2.2509765625, -2.061279296875, -1.87158203125, -1.681884765625, -1.4921875, -1.302490234375, -1.11279296875, -0.923095703125, -0.7333984375, -0.543701171875, -0.35400390625, -0.164306640625, 0.025390625, 0.215087890625, 0.40478515625, 0.594482421875, 0.7841796875, 0.973876953125, 1.16357421875, 1.353271484375, 1.54296875, 1.732666015625, 1.92236328125, 2.112060546875, 2.3017578125, 2.491455078125, 2.68115234375, 2.870849609375, 3.060546875, 3.250244140625, 3.43994140625, 3.629638671875, 3.8193359375, 4.009033203125, 4.19873046875, 4.388427734375, 4.578125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 14.0, 29.0, 61.0, 203.0, 483.0, 144.0, 44.0, 23.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3135902881622314, -1.2673454284667969, -1.2211005687713623, -1.1748557090759277, -1.1286108493804932, -1.0823659896850586, -1.036121129989624, -0.9898763298988342, -0.9436314702033997, -0.8973866105079651, -0.8511417508125305, -0.8048969507217407, -0.7586520910263062, -0.7124072313308716, -0.666162371635437, -0.6199175119400024, -0.5736726522445679, -0.5274277925491333, -0.48118293285369873, -0.43493810296058655, -0.388693243265152, -0.3424483835697174, -0.2962035536766052, -0.24995869398117065, -0.20371383428573608, -0.1574689745903015, -0.11122412979602814, -0.06497928500175476, -0.01873442530632019, 0.02751043438911438, 0.07375526428222656, 0.12000012397766113, 0.1662449836730957, 0.21248984336853027, 0.25873470306396484, 0.304979532957077, 0.3512243926525116, 0.39746925234794617, 0.44371408224105835, 0.4899589419364929, 0.5362038016319275, 0.5824486613273621, 0.6286935210227966, 0.6749383211135864, 0.721183180809021, 0.7674280405044556, 0.8136729001998901, 0.8599177598953247, 0.9061626195907593, 0.9524074792861938, 0.9986523389816284, 1.044897198677063, 1.0911420583724976, 1.1373869180679321, 1.1836316585540771, 1.2298765182495117, 1.2761213779449463, 1.3223662376403809, 1.3686110973358154, 1.41485595703125, 1.4611008167266846, 1.5073456764221191, 1.5535905361175537, 1.5998353958129883, 1.6460802555084229]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 6.0, 0.0, 3.0, 3.0, 6.0, 8.0, 6.0, 6.0, 5.0, 10.0, 15.0, 19.0, 15.0, 14.0, 31.0, 29.0, 27.0, 23.0, 33.0, 25.0, 21.0, 32.0, 49.0, 37.0, 39.0, 42.0, 39.0, 36.0, 29.0, 35.0, 34.0, 18.0, 33.0, 39.0, 36.0, 21.0, 22.0, 21.0, 15.0, 15.0, 25.0, 15.0, 10.0, 10.0, 9.0, 10.0, 5.0, 8.0, 7.0, 3.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.2591186761856079, -0.2505349814891815, -0.24195128679275513, -0.23336759209632874, -0.22478389739990234, -0.21620020270347595, -0.20761650800704956, -0.19903281331062317, -0.19044911861419678, -0.18186542391777039, -0.173281729221344, -0.1646980345249176, -0.1561143398284912, -0.14753064513206482, -0.13894695043563843, -0.13036325573921204, -0.12177957594394684, -0.11319588124752045, -0.10461218655109406, -0.09602849185466766, -0.08744479715824127, -0.07886110246181488, -0.07027741521596909, -0.061693720519542694, -0.0531100258231163, -0.04452633112668991, -0.03594263643026352, -0.027358945459127426, -0.018775250762701035, -0.010191556066274643, -0.0016078650951385498, 0.006975829601287842, 0.015559524297714233, 0.024143218994140625, 0.03272691369056702, 0.04131060466170311, 0.0498942993581295, 0.05847799405455589, 0.06706168502569199, 0.07564537972211838, 0.08422907441854477, 0.09281276911497116, 0.10139646381139755, 0.10998015105724335, 0.11856384575366974, 0.12714754045009613, 0.13573123514652252, 0.1443149298429489, 0.1528986245393753, 0.1614823192358017, 0.1700660139322281, 0.17864970862865448, 0.18723340332508087, 0.19581709802150726, 0.20440077781677246, 0.21298447251319885, 0.22156816720962524, 0.23015186190605164, 0.23873555660247803, 0.24731925129890442, 0.2559029459953308, 0.2644866406917572, 0.2730703353881836, 0.28165403008461, 0.2902377247810364]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 8.0, 8.0, 11.0, 10.0, 10.0, 10.0, 15.0, 21.0, 26.0, 15.0, 20.0, 25.0, 34.0, 33.0, 41.0, 37.0, 40.0, 48.0, 46.0, 49.0, 40.0, 55.0, 36.0, 42.0, 42.0, 32.0, 34.0, 20.0, 32.0, 35.0, 17.0, 14.0, 18.0, 9.0, 6.0, 13.0, 10.0, 5.0, 8.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0], "bins": [-14.7421875, -14.330078125, -13.91796875, -13.505859375, -13.09375, -12.681640625, -12.26953125, -11.857421875, -11.4453125, -11.033203125, -10.62109375, -10.208984375, -9.796875, -9.384765625, -8.97265625, -8.560546875, -8.1484375, -7.736328125, -7.32421875, -6.912109375, -6.5, -6.087890625, -5.67578125, -5.263671875, -4.8515625, -4.439453125, -4.02734375, -3.615234375, -3.203125, -2.791015625, -2.37890625, -1.966796875, -1.5546875, -1.142578125, -0.73046875, -0.318359375, 0.09375, 0.505859375, 0.91796875, 1.330078125, 1.7421875, 2.154296875, 2.56640625, 2.978515625, 3.390625, 3.802734375, 4.21484375, 4.626953125, 5.0390625, 5.451171875, 5.86328125, 6.275390625, 6.6875, 7.099609375, 7.51171875, 7.923828125, 8.3359375, 8.748046875, 9.16015625, 9.572265625, 9.984375, 10.396484375, 10.80859375, 11.220703125, 11.6328125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 9.0, 7.0, 15.0, 29.0, 41.0, 35.0, 53.0, 71.0, 105.0, 152.0, 199.0, 271.0, 390.0, 548.0, 779.0, 1238.0, 1770.0, 2956.0, 4960.0, 9263.0, 18445.0, 39176.0, 86474.0, 222359.0, 368469.0, 160423.0, 65899.0, 30623.0, 14424.0, 7611.0, 4115.0, 2545.0, 1588.0, 1056.0, 693.0, 522.0, 347.0, 255.0, 164.0, 146.0, 85.0, 72.0, 51.0, 37.0, 22.0, 13.0, 9.0, 16.0, 16.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-20.703125, -20.04248046875, -19.3818359375, -18.72119140625, -18.060546875, -17.39990234375, -16.7392578125, -16.07861328125, -15.41796875, -14.75732421875, -14.0966796875, -13.43603515625, -12.775390625, -12.11474609375, -11.4541015625, -10.79345703125, -10.1328125, -9.47216796875, -8.8115234375, -8.15087890625, -7.490234375, -6.82958984375, -6.1689453125, -5.50830078125, -4.84765625, -4.18701171875, -3.5263671875, -2.86572265625, -2.205078125, -1.54443359375, -0.8837890625, -0.22314453125, 0.4375, 1.09814453125, 1.7587890625, 2.41943359375, 3.080078125, 3.74072265625, 4.4013671875, 5.06201171875, 5.72265625, 6.38330078125, 7.0439453125, 7.70458984375, 8.365234375, 9.02587890625, 9.6865234375, 10.34716796875, 11.0078125, 11.66845703125, 12.3291015625, 12.98974609375, 13.650390625, 14.31103515625, 14.9716796875, 15.63232421875, 16.29296875, 16.95361328125, 17.6142578125, 18.27490234375, 18.935546875, 19.59619140625, 20.2568359375, 20.91748046875, 21.578125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 2.0, 2.0, 6.0, 10.0, 13.0, 9.0, 16.0, 18.0, 30.0, 34.0, 21.0, 42.0, 38.0, 48.0, 39.0, 66.0, 118.0, 215.0, 1358.0, 321.0, 175.0, 95.0, 57.0, 43.0, 34.0, 43.0, 33.0, 28.0, 26.0, 19.0, 16.0, 15.0, 9.0, 10.0, 8.0, 4.0, 9.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-34.71875, -33.6904296875, -32.662109375, -31.6337890625, -30.60546875, -29.5771484375, -28.548828125, -27.5205078125, -26.4921875, -25.4638671875, -24.435546875, -23.4072265625, -22.37890625, -21.3505859375, -20.322265625, -19.2939453125, -18.265625, -17.2373046875, -16.208984375, -15.1806640625, -14.15234375, -13.1240234375, -12.095703125, -11.0673828125, -10.0390625, -9.0107421875, -7.982421875, -6.9541015625, -5.92578125, -4.8974609375, -3.869140625, -2.8408203125, -1.8125, -0.7841796875, 0.244140625, 1.2724609375, 2.30078125, 3.3291015625, 4.357421875, 5.3857421875, 6.4140625, 7.4423828125, 8.470703125, 9.4990234375, 10.52734375, 11.5556640625, 12.583984375, 13.6123046875, 14.640625, 15.6689453125, 16.697265625, 17.7255859375, 18.75390625, 19.7822265625, 20.810546875, 21.8388671875, 22.8671875, 23.8955078125, 24.923828125, 25.9521484375, 26.98046875, 28.0087890625, 29.037109375, 30.0654296875, 31.09375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 9.0, 4.0, 10.0, 13.0, 29.0, 25.0, 56.0, 62.0, 95.0, 123.0, 191.0, 288.0, 469.0, 927.0, 4099.0, 193104.0, 2929448.0, 13701.0, 1390.0, 585.0, 348.0, 221.0, 150.0, 101.0, 58.0, 54.0, 25.0, 32.0, 26.0, 13.0, 11.0, 7.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.6875, -84.0654296875, -80.443359375, -76.8212890625, -73.19921875, -69.5771484375, -65.955078125, -62.3330078125, -58.7109375, -55.0888671875, -51.466796875, -47.8447265625, -44.22265625, -40.6005859375, -36.978515625, -33.3564453125, -29.734375, -26.1123046875, -22.490234375, -18.8681640625, -15.24609375, -11.6240234375, -8.001953125, -4.3798828125, -0.7578125, 2.8642578125, 6.486328125, 10.1083984375, 13.73046875, 17.3525390625, 20.974609375, 24.5966796875, 28.21875, 31.8408203125, 35.462890625, 39.0849609375, 42.70703125, 46.3291015625, 49.951171875, 53.5732421875, 57.1953125, 60.8173828125, 64.439453125, 68.0615234375, 71.68359375, 75.3056640625, 78.927734375, 82.5498046875, 86.171875, 89.7939453125, 93.416015625, 97.0380859375, 100.66015625, 104.2822265625, 107.904296875, 111.5263671875, 115.1484375, 118.7705078125, 122.392578125, 126.0146484375, 129.63671875, 133.2587890625, 136.880859375, 140.5029296875, 144.125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 13.0, 37.0, 107.0, 209.0, 296.0, 208.0, 88.0, 36.0, 11.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-242.4510498046875, -235.21420288085938, -227.9773712158203, -220.7405242919922, -213.50367736816406, -206.266845703125, -199.02999877929688, -191.79315185546875, -184.55630493164062, -177.3194580078125, -170.08262634277344, -162.8457794189453, -155.6089324951172, -148.37210083007812, -141.13525390625, -133.89840698242188, -126.66156768798828, -119.42472839355469, -112.18788146972656, -104.95104217529297, -97.71419525146484, -90.47735595703125, -83.24050903320312, -76.00366973876953, -68.76683044433594, -61.52998733520508, -54.29314422607422, -47.056304931640625, -39.8194580078125, -32.582618713378906, -25.345775604248047, -18.108932495117188, -10.872085571289062, -3.6352429389953613, 3.60159969329834, 10.838441848754883, 18.075284957885742, 25.31212615966797, 32.54896926879883, 39.78581237792969, 47.02265548706055, 54.259498596191406, 61.496341705322266, 68.73318481445312, 75.97002410888672, 83.20686340332031, 90.44371032714844, 97.68055725097656, 104.91739654541016, 112.15423583984375, 119.39108276367188, 126.62792205810547, 133.86476135253906, 141.1016082763672, 148.3384552001953, 155.57528686523438, 162.8121337890625, 170.04898071289062, 177.2858123779297, 184.5226593017578, 191.75950622558594, 198.996337890625, 206.23318481445312, 213.47003173828125, 220.70687866210938]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 3.0, 6.0, 4.0, 7.0, 11.0, 14.0, 14.0, 13.0, 16.0, 23.0, 25.0, 24.0, 33.0, 30.0, 34.0, 37.0, 45.0, 38.0, 37.0, 29.0, 41.0, 42.0, 40.0, 38.0, 35.0, 41.0, 39.0, 29.0, 36.0, 33.0, 17.0, 20.0, 18.0, 23.0, 23.0, 17.0, 16.0, 12.0, 9.0, 5.0, 6.0, 2.0, 5.0, 4.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-85.57408142089844, -82.92086791992188, -80.26764678955078, -77.61443328857422, -74.96121215820312, -72.30799865722656, -69.65477752685547, -67.0015640258789, -64.34834289550781, -61.695125579833984, -59.041908264160156, -56.38869094848633, -53.7354736328125, -51.08226013183594, -48.42904281616211, -45.77582550048828, -43.12261199951172, -40.46939468383789, -37.81617736816406, -35.162960052490234, -32.509742736816406, -29.85652732849121, -27.203311920166016, -24.550094604492188, -21.89687728881836, -19.24365997314453, -16.590442657470703, -13.937227249145508, -11.28400993347168, -8.630792617797852, -5.97757625579834, -3.324359893798828, -0.671142578125, 1.98207426071167, 4.63529109954834, 7.28850793838501, 9.94172477722168, 12.594942092895508, 15.24815845489502, 17.90137481689453, 20.55459213256836, 23.207809448242188, 25.861026763916016, 28.51424217224121, 31.16745948791504, 33.8206787109375, 36.47389221191406, 39.12710952758789, 41.78032684326172, 44.43354415893555, 47.086761474609375, 49.7399787902832, 52.39319610595703, 55.046409606933594, 57.69962692260742, 60.35284423828125, 63.00606155395508, 65.6592788696289, 68.31249237060547, 70.96571350097656, 73.61892700195312, 76.27214813232422, 78.92536163330078, 81.57858276367188, 84.23179626464844]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 5.0, 7.0, 1.0, 8.0, 12.0, 10.0, 17.0, 10.0, 13.0, 17.0, 17.0, 28.0, 24.0, 34.0, 38.0, 40.0, 44.0, 46.0, 44.0, 38.0, 51.0, 52.0, 37.0, 40.0, 37.0, 31.0, 49.0, 41.0, 29.0, 22.0, 34.0, 16.0, 12.0, 13.0, 18.0, 10.0, 16.0, 8.0, 7.0, 9.0, 11.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-14.9296875, -14.5035400390625, -14.077392578125, -13.6512451171875, -13.22509765625, -12.7989501953125, -12.372802734375, -11.9466552734375, -11.5205078125, -11.0943603515625, -10.668212890625, -10.2420654296875, -9.81591796875, -9.3897705078125, -8.963623046875, -8.5374755859375, -8.111328125, -7.6851806640625, -7.259033203125, -6.8328857421875, -6.40673828125, -5.9805908203125, -5.554443359375, -5.1282958984375, -4.7021484375, -4.2760009765625, -3.849853515625, -3.4237060546875, -2.99755859375, -2.5714111328125, -2.145263671875, -1.7191162109375, -1.29296875, -0.8668212890625, -0.440673828125, -0.0145263671875, 0.41162109375, 0.8377685546875, 1.263916015625, 1.6900634765625, 2.1162109375, 2.5423583984375, 2.968505859375, 3.3946533203125, 3.82080078125, 4.2469482421875, 4.673095703125, 5.0992431640625, 5.525390625, 5.9515380859375, 6.377685546875, 6.8038330078125, 7.22998046875, 7.6561279296875, 8.082275390625, 8.5084228515625, 8.9345703125, 9.3607177734375, 9.786865234375, 10.2130126953125, 10.63916015625, 11.0653076171875, 11.491455078125, 11.9176025390625, 12.34375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 6.0, 11.0, 10.0, 11.0, 23.0, 25.0, 35.0, 43.0, 68.0, 94.0, 126.0, 206.0, 274.0, 416.0, 657.0, 1188.0, 2258.0, 4591.0, 11600.0, 39929.0, 254809.0, 1912177.0, 1686555.0, 221339.0, 37438.0, 10778.0, 4426.0, 2084.0, 1149.0, 670.0, 405.0, 251.0, 169.0, 134.0, 86.0, 69.0, 46.0, 39.0, 24.0, 20.0, 16.0, 12.0, 4.0, 8.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-29.25, -28.3349609375, -27.419921875, -26.5048828125, -25.58984375, -24.6748046875, -23.759765625, -22.8447265625, -21.9296875, -21.0146484375, -20.099609375, -19.1845703125, -18.26953125, -17.3544921875, -16.439453125, -15.5244140625, -14.609375, -13.6943359375, -12.779296875, -11.8642578125, -10.94921875, -10.0341796875, -9.119140625, -8.2041015625, -7.2890625, -6.3740234375, -5.458984375, -4.5439453125, -3.62890625, -2.7138671875, -1.798828125, -0.8837890625, 0.03125, 0.9462890625, 1.861328125, 2.7763671875, 3.69140625, 4.6064453125, 5.521484375, 6.4365234375, 7.3515625, 8.2666015625, 9.181640625, 10.0966796875, 11.01171875, 11.9267578125, 12.841796875, 13.7568359375, 14.671875, 15.5869140625, 16.501953125, 17.4169921875, 18.33203125, 19.2470703125, 20.162109375, 21.0771484375, 21.9921875, 22.9072265625, 23.822265625, 24.7373046875, 25.65234375, 26.5673828125, 27.482421875, 28.3974609375, 29.3125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 9.0, 16.0, 19.0, 11.0, 23.0, 33.0, 56.0, 58.0, 74.0, 96.0, 146.0, 198.0, 306.0, 357.0, 510.0, 540.0, 416.0, 301.0, 217.0, 188.0, 98.0, 105.0, 64.0, 52.0, 39.0, 39.0, 24.0, 25.0, 14.0, 9.0, 6.0, 4.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.984375, -17.3212890625, -16.658203125, -15.9951171875, -15.33203125, -14.6689453125, -14.005859375, -13.3427734375, -12.6796875, -12.0166015625, -11.353515625, -10.6904296875, -10.02734375, -9.3642578125, -8.701171875, -8.0380859375, -7.375, -6.7119140625, -6.048828125, -5.3857421875, -4.72265625, -4.0595703125, -3.396484375, -2.7333984375, -2.0703125, -1.4072265625, -0.744140625, -0.0810546875, 0.58203125, 1.2451171875, 1.908203125, 2.5712890625, 3.234375, 3.8974609375, 4.560546875, 5.2236328125, 5.88671875, 6.5498046875, 7.212890625, 7.8759765625, 8.5390625, 9.2021484375, 9.865234375, 10.5283203125, 11.19140625, 11.8544921875, 12.517578125, 13.1806640625, 13.84375, 14.5068359375, 15.169921875, 15.8330078125, 16.49609375, 17.1591796875, 17.822265625, 18.4853515625, 19.1484375, 19.8115234375, 20.474609375, 21.1376953125, 21.80078125, 22.4638671875, 23.126953125, 23.7900390625, 24.453125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 1.0, 9.0, 10.0, 13.0, 20.0, 36.0, 31.0, 52.0, 81.0, 162.0, 175.0, 350.0, 571.0, 1058.0, 2198.0, 5119.0, 14840.0, 52404.0, 252844.0, 2135960.0, 1475340.0, 190293.0, 41773.0, 12232.0, 4528.0, 1870.0, 942.0, 464.0, 328.0, 184.0, 126.0, 78.0, 60.0, 38.0, 20.0, 22.0, 13.0, 14.0, 6.0, 3.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.15625, -32.1787109375, -31.201171875, -30.2236328125, -29.24609375, -28.2685546875, -27.291015625, -26.3134765625, -25.3359375, -24.3583984375, -23.380859375, -22.4033203125, -21.42578125, -20.4482421875, -19.470703125, -18.4931640625, -17.515625, -16.5380859375, -15.560546875, -14.5830078125, -13.60546875, -12.6279296875, -11.650390625, -10.6728515625, -9.6953125, -8.7177734375, -7.740234375, -6.7626953125, -5.78515625, -4.8076171875, -3.830078125, -2.8525390625, -1.875, -0.8974609375, 0.080078125, 1.0576171875, 2.03515625, 3.0126953125, 3.990234375, 4.9677734375, 5.9453125, 6.9228515625, 7.900390625, 8.8779296875, 9.85546875, 10.8330078125, 11.810546875, 12.7880859375, 13.765625, 14.7431640625, 15.720703125, 16.6982421875, 17.67578125, 18.6533203125, 19.630859375, 20.6083984375, 21.5859375, 22.5634765625, 23.541015625, 24.5185546875, 25.49609375, 26.4736328125, 27.451171875, 28.4287109375, 29.40625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 31.0, 187.0, 531.0, 234.0, 24.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-264.2575988769531, -248.2565155029297, -232.2554473876953, -216.25436401367188, -200.2532958984375, -184.25221252441406, -168.25112915039062, -152.25006103515625, -136.2489776611328, -120.2479019165039, -104.246826171875, -88.24574279785156, -72.24466705322266, -56.24359130859375, -40.24250793457031, -24.241432189941406, -8.2403564453125, 7.760721206665039, 23.761798858642578, 39.76287841796875, 55.763954162597656, 71.76502990722656, 87.76611328125, 103.7671890258789, 119.76826477050781, 135.76934814453125, 151.77041625976562, 167.77149963378906, 183.7725830078125, 199.77365112304688, 215.7747344970703, 231.77581787109375, 247.77691650390625, 263.7779846191406, 279.7790832519531, 295.7801513671875, 311.7812194824219, 327.78228759765625, 343.78338623046875, 359.7844543457031, 375.7855224609375, 391.7865905761719, 407.7876892089844, 423.78875732421875, 439.7898254394531, 455.7908935546875, 471.7919921875, 487.7930603027344, 503.7941589355469, 519.7952270507812, 535.7963256835938, 551.79736328125, 567.7984619140625, 583.799560546875, 599.8006591796875, 615.8016967773438, 631.8027954101562, 647.8038940429688, 663.804931640625, 679.8060302734375, 695.80712890625, 711.8081665039062, 727.8092651367188, 743.8103637695312, 759.8114013671875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 9.0, 4.0, 7.0, 6.0, 5.0, 5.0, 7.0, 9.0, 11.0, 9.0, 12.0, 16.0, 22.0, 28.0, 25.0, 32.0, 22.0, 33.0, 33.0, 30.0, 29.0, 37.0, 36.0, 36.0, 36.0, 38.0, 38.0, 42.0, 30.0, 39.0, 28.0, 27.0, 29.0, 30.0, 17.0, 20.0, 22.0, 18.0, 23.0, 12.0, 12.0, 14.0, 11.0, 10.0, 8.0, 10.0, 2.0, 7.0, 7.0, 1.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-62.77647399902344, -60.68628692626953, -58.596099853515625, -56.50591278076172, -54.41572189331055, -52.32553482055664, -50.235347747802734, -48.14516067504883, -46.054969787597656, -43.96478271484375, -41.874595642089844, -39.78440856933594, -37.694217681884766, -35.60403060913086, -33.51384353637695, -31.423656463623047, -29.33346939086914, -27.243282318115234, -25.153093338012695, -23.06290626525879, -20.97271728515625, -18.882530212402344, -16.792343139648438, -14.702155113220215, -12.611967086791992, -10.52177906036377, -8.431591033935547, -6.341403961181641, -4.251215934753418, -2.1610279083251953, -0.07084083557128906, 2.0193471908569336, 4.109535217285156, 6.199723243713379, 8.289911270141602, 10.380098342895508, 12.47028636932373, 14.560474395751953, 16.65066146850586, 18.740848541259766, 20.831037521362305, 22.92122459411621, 25.01141357421875, 27.101600646972656, 29.191787719726562, 31.2819766998291, 33.372161865234375, 35.46235275268555, 37.55253982543945, 39.64272689819336, 41.732913970947266, 43.82310485839844, 45.913291931152344, 48.00347900390625, 50.093666076660156, 52.18385314941406, 54.27404022216797, 56.364227294921875, 58.45441436767578, 60.54460144042969, 62.63479232788086, 64.7249755859375, 66.81517028808594, 68.90535736083984, 70.99554443359375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 6.0, 8.0, 9.0, 9.0, 9.0, 12.0, 14.0, 22.0, 15.0, 26.0, 38.0, 32.0, 41.0, 31.0, 33.0, 50.0, 36.0, 40.0, 48.0, 40.0, 40.0, 41.0, 32.0, 43.0, 33.0, 38.0, 22.0, 32.0, 31.0, 32.0, 27.0, 15.0, 18.0, 15.0, 14.0, 11.0, 9.0, 7.0, 5.0, 5.0, 5.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9765625, -11.58544921875, -11.1943359375, -10.80322265625, -10.412109375, -10.02099609375, -9.6298828125, -9.23876953125, -8.84765625, -8.45654296875, -8.0654296875, -7.67431640625, -7.283203125, -6.89208984375, -6.5009765625, -6.10986328125, -5.71875, -5.32763671875, -4.9365234375, -4.54541015625, -4.154296875, -3.76318359375, -3.3720703125, -2.98095703125, -2.58984375, -2.19873046875, -1.8076171875, -1.41650390625, -1.025390625, -0.63427734375, -0.2431640625, 0.14794921875, 0.5390625, 0.93017578125, 1.3212890625, 1.71240234375, 2.103515625, 2.49462890625, 2.8857421875, 3.27685546875, 3.66796875, 4.05908203125, 4.4501953125, 4.84130859375, 5.232421875, 5.62353515625, 6.0146484375, 6.40576171875, 6.796875, 7.18798828125, 7.5791015625, 7.97021484375, 8.361328125, 8.75244140625, 9.1435546875, 9.53466796875, 9.92578125, 10.31689453125, 10.7080078125, 11.09912109375, 11.490234375, 11.88134765625, 12.2724609375, 12.66357421875, 13.0546875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 5.0, 3.0, 11.0, 14.0, 21.0, 30.0, 33.0, 60.0, 82.0, 99.0, 183.0, 234.0, 397.0, 545.0, 885.0, 1410.0, 2253.0, 3573.0, 6066.0, 10013.0, 17485.0, 30418.0, 54965.0, 99215.0, 176363.0, 239062.0, 176027.0, 100136.0, 55128.0, 30617.0, 17365.0, 9996.0, 6090.0, 3554.0, 2230.0, 1393.0, 881.0, 580.0, 363.0, 250.0, 149.0, 115.0, 85.0, 57.0, 36.0, 20.0, 23.0, 14.0, 14.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2333984375, -1.19158935546875, -1.1497802734375, -1.10797119140625, -1.066162109375, -1.02435302734375, -0.9825439453125, -0.94073486328125, -0.89892578125, -0.85711669921875, -0.8153076171875, -0.77349853515625, -0.731689453125, -0.68988037109375, -0.6480712890625, -0.60626220703125, -0.564453125, -0.52264404296875, -0.4808349609375, -0.43902587890625, -0.397216796875, -0.35540771484375, -0.3135986328125, -0.27178955078125, -0.22998046875, -0.18817138671875, -0.1463623046875, -0.10455322265625, -0.062744140625, -0.02093505859375, 0.0208740234375, 0.06268310546875, 0.1044921875, 0.14630126953125, 0.1881103515625, 0.22991943359375, 0.271728515625, 0.31353759765625, 0.3553466796875, 0.39715576171875, 0.43896484375, 0.48077392578125, 0.5225830078125, 0.56439208984375, 0.606201171875, 0.64801025390625, 0.6898193359375, 0.73162841796875, 0.7734375, 0.81524658203125, 0.8570556640625, 0.89886474609375, 0.940673828125, 0.98248291015625, 1.0242919921875, 1.06610107421875, 1.10791015625, 1.14971923828125, 1.1915283203125, 1.23333740234375, 1.275146484375, 1.31695556640625, 1.3587646484375, 1.40057373046875, 1.4423828125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [5.0, 2.0, 0.0, 3.0, 7.0, 4.0, 10.0, 10.0, 10.0, 16.0, 9.0, 17.0, 20.0, 19.0, 21.0, 21.0, 29.0, 36.0, 44.0, 27.0, 35.0, 46.0, 48.0, 26.0, 1066.0, 39.0, 48.0, 42.0, 51.0, 49.0, 39.0, 31.0, 24.0, 28.0, 27.0, 15.0, 23.0, 17.0, 21.0, 10.0, 6.0, 10.0, 12.0, 3.0, 9.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.66015625, -6.39324951171875, -6.1263427734375, -5.85943603515625, -5.592529296875, -5.32562255859375, -5.0587158203125, -4.79180908203125, -4.52490234375, -4.25799560546875, -3.9910888671875, -3.72418212890625, -3.457275390625, -3.19036865234375, -2.9234619140625, -2.65655517578125, -2.3896484375, -2.12274169921875, -1.8558349609375, -1.58892822265625, -1.322021484375, -1.05511474609375, -0.7882080078125, -0.52130126953125, -0.25439453125, 0.01251220703125, 0.2794189453125, 0.54632568359375, 0.813232421875, 1.08013916015625, 1.3470458984375, 1.61395263671875, 1.880859375, 2.14776611328125, 2.4146728515625, 2.68157958984375, 2.948486328125, 3.21539306640625, 3.4822998046875, 3.74920654296875, 4.01611328125, 4.28302001953125, 4.5499267578125, 4.81683349609375, 5.083740234375, 5.35064697265625, 5.6175537109375, 5.88446044921875, 6.1513671875, 6.41827392578125, 6.6851806640625, 6.95208740234375, 7.218994140625, 7.48590087890625, 7.7528076171875, 8.01971435546875, 8.28662109375, 8.55352783203125, 8.8204345703125, 9.08734130859375, 9.354248046875, 9.62115478515625, 9.8880615234375, 10.15496826171875, 10.421875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 11.0, 17.0, 11.0, 28.0, 29.0, 59.0, 60.0, 95.0, 177.0, 244.0, 360.0, 538.0, 796.0, 1195.0, 1909.0, 2888.0, 4402.0, 6902.0, 10528.0, 16433.0, 26225.0, 43269.0, 71527.0, 123039.0, 294848.0, 1143718.0, 138739.0, 80740.0, 47715.0, 29115.0, 18343.0, 11645.0, 7387.0, 4685.0, 3249.0, 2073.0, 1353.0, 923.0, 610.0, 379.0, 291.0, 197.0, 112.0, 83.0, 53.0, 38.0, 34.0, 17.0, 18.0, 13.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.64306640625, -0.6230392456054688, -0.6030120849609375, -0.5829849243164062, -0.562957763671875, -0.5429306030273438, -0.5229034423828125, -0.5028762817382812, -0.48284912109375, -0.46282196044921875, -0.4427947998046875, -0.42276763916015625, -0.402740478515625, -0.38271331787109375, -0.3626861572265625, -0.34265899658203125, -0.3226318359375, -0.30260467529296875, -0.2825775146484375, -0.26255035400390625, -0.242523193359375, -0.22249603271484375, -0.2024688720703125, -0.18244171142578125, -0.16241455078125, -0.14238739013671875, -0.1223602294921875, -0.10233306884765625, -0.082305908203125, -0.06227874755859375, -0.0422515869140625, -0.02222442626953125, -0.002197265625, 0.01782989501953125, 0.0378570556640625, 0.05788421630859375, 0.077911376953125, 0.09793853759765625, 0.1179656982421875, 0.13799285888671875, 0.15802001953125, 0.17804718017578125, 0.1980743408203125, 0.21810150146484375, 0.238128662109375, 0.25815582275390625, 0.2781829833984375, 0.29821014404296875, 0.3182373046875, 0.33826446533203125, 0.3582916259765625, 0.37831878662109375, 0.398345947265625, 0.41837310791015625, 0.4384002685546875, 0.45842742919921875, 0.47845458984375, 0.49848175048828125, 0.5185089111328125, 0.5385360717773438, 0.558563232421875, 0.5785903930664062, 0.5986175537109375, 0.6186447143554688, 0.638671875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 2.0, 6.0, 5.0, 9.0, 9.0, 8.0, 19.0, 31.0, 39.0, 40.0, 100.0, 142.0, 187.0, 128.0, 74.0, 38.0, 36.0, 18.0, 12.0, 17.0, 9.0, 10.0, 12.0, 6.0, 4.0, 6.0, 7.0, 2.0, 0.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07232666015625, -0.07021903991699219, -0.06811141967773438, -0.06600379943847656, -0.06389617919921875, -0.06178855895996094, -0.059680938720703125, -0.05757331848144531, -0.0554656982421875, -0.05335807800292969, -0.051250457763671875, -0.04914283752441406, -0.04703521728515625, -0.04492759704589844, -0.042819976806640625, -0.04071235656738281, -0.038604736328125, -0.03649711608886719, -0.034389495849609375, -0.03228187561035156, -0.03017425537109375, -0.028066635131835938, -0.025959014892578125, -0.023851394653320312, -0.0217437744140625, -0.019636154174804688, -0.017528533935546875, -0.015420913696289062, -0.01331329345703125, -0.011205673217773438, -0.009098052978515625, -0.0069904327392578125, -0.0048828125, -0.0027751922607421875, -0.000667572021484375, 0.0014400482177734375, 0.00354766845703125, 0.0056552886962890625, 0.007762908935546875, 0.009870529174804688, 0.0119781494140625, 0.014085769653320312, 0.016193389892578125, 0.018301010131835938, 0.02040863037109375, 0.022516250610351562, 0.024623870849609375, 0.026731491088867188, 0.028839111328125, 0.030946731567382812, 0.033054351806640625, 0.03516197204589844, 0.03726959228515625, 0.03937721252441406, 0.041484832763671875, 0.04359245300292969, 0.0457000732421875, 0.04780769348144531, 0.049915313720703125, 0.05202293395996094, 0.05413055419921875, 0.05623817443847656, 0.058345794677734375, 0.06045341491699219, 0.06256103515625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 10.0, 3.0, 7.0, 1.0, 9.0, 8.0, 6.0, 10.0, 8.0, 15.0, 19.0, 24.0, 25.0, 57.0, 48.0, 95.0, 139.0, 306.0, 839.0, 2932.0, 19867.0, 966673.0, 50682.0, 4648.0, 1210.0, 415.0, 161.0, 98.0, 63.0, 34.0, 35.0, 25.0, 20.0, 8.0, 12.0, 7.0, 8.0, 6.0, 7.0, 4.0, 4.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.05859375, -1.02288818359375, -0.9871826171875, -0.95147705078125, -0.915771484375, -0.88006591796875, -0.8443603515625, -0.80865478515625, -0.77294921875, -0.73724365234375, -0.7015380859375, -0.66583251953125, -0.630126953125, -0.59442138671875, -0.5587158203125, -0.52301025390625, -0.4873046875, -0.45159912109375, -0.4158935546875, -0.38018798828125, -0.344482421875, -0.30877685546875, -0.2730712890625, -0.23736572265625, -0.20166015625, -0.16595458984375, -0.1302490234375, -0.09454345703125, -0.058837890625, -0.02313232421875, 0.0125732421875, 0.04827880859375, 0.083984375, 0.11968994140625, 0.1553955078125, 0.19110107421875, 0.226806640625, 0.26251220703125, 0.2982177734375, 0.33392333984375, 0.36962890625, 0.40533447265625, 0.4410400390625, 0.47674560546875, 0.512451171875, 0.54815673828125, 0.5838623046875, 0.61956787109375, 0.6552734375, 0.69097900390625, 0.7266845703125, 0.76239013671875, 0.798095703125, 0.83380126953125, 0.8695068359375, 0.90521240234375, 0.94091796875, 0.97662353515625, 1.0123291015625, 1.04803466796875, 1.083740234375, 1.11944580078125, 1.1551513671875, 1.19085693359375, 1.2265625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 10.0, 20.0, 48.0, 149.0, 433.0, 226.0, 77.0, 32.0, 9.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9330242872238159, -0.9146406650543213, -0.8962571024894714, -0.8778734803199768, -0.859489917755127, -0.8411062955856323, -0.8227227330207825, -0.8043391108512878, -0.785955548286438, -0.7675719261169434, -0.7491883635520935, -0.7308047413825989, -0.712421178817749, -0.6940375566482544, -0.6756539940834045, -0.6572703719139099, -0.6388868093490601, -0.6205031871795654, -0.6021196246147156, -0.583736002445221, -0.5653524398803711, -0.5469688177108765, -0.5285852551460266, -0.510201632976532, -0.49181801080703735, -0.4734344184398651, -0.45505082607269287, -0.43666723370552063, -0.4182836413383484, -0.39990004897117615, -0.3815164566040039, -0.3631328344345093, -0.3447492718696594, -0.3263656795024872, -0.30798208713531494, -0.2895984947681427, -0.27121490240097046, -0.2528313100337982, -0.23444770276546478, -0.21606411039829254, -0.1976805329322815, -0.17929694056510925, -0.160913348197937, -0.14252975583076477, -0.12414615601301193, -0.10576256364583969, -0.08737896382808685, -0.06899537146091461, -0.05061177909374237, -0.03222818672657013, -0.01384459063410759, 0.00453900545835495, 0.02292259782552719, 0.04130619019269943, 0.05968979001045227, 0.07807338237762451, 0.09645697474479675, 0.114840567111969, 0.13322415947914124, 0.15160775184631348, 0.16999134421348572, 0.18837493658065796, 0.2067585438489914, 0.22514213621616364, 0.24352572858333588]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 7.0, 2.0, 9.0, 10.0, 11.0, 13.0, 21.0, 26.0, 19.0, 25.0, 27.0, 16.0, 40.0, 35.0, 43.0, 30.0, 29.0, 40.0, 26.0, 51.0, 45.0, 42.0, 48.0, 46.0, 33.0, 43.0, 25.0, 31.0, 38.0, 29.0, 26.0, 15.0, 24.0, 23.0, 13.0, 13.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05482608079910278, -0.05288701131939888, -0.05094794183969498, -0.049008868634700775, -0.04706979915499687, -0.04513072967529297, -0.04319165647029877, -0.041252586990594864, -0.03931351751089096, -0.03737444803118706, -0.035435378551483154, -0.03349630534648895, -0.03155723586678505, -0.029618166387081146, -0.027679095044732094, -0.02574002370238304, -0.023800954222679138, -0.021861884742975235, -0.019922813400626183, -0.01798374205827713, -0.016044672578573227, -0.014105602167546749, -0.012166531756520271, -0.010227461345493793, -0.008288390934467316, -0.006349320523440838, -0.00441025011241436, -0.0024711797013878822, -0.0005321092903614044, 0.0014069611206650734, 0.003346031531691551, 0.005285101942718029, 0.007224172353744507, 0.009163242764770985, 0.011102313175797462, 0.01304138358682394, 0.014980453997850418, 0.01691952347755432, 0.018858594819903374, 0.020797666162252426, 0.02273673564195633, 0.024675805121660233, 0.026614876464009285, 0.028553947806358337, 0.03049301728606224, 0.032432086765766144, 0.034371159970760345, 0.03631022945046425, 0.03824929893016815, 0.040188368409872055, 0.04212743788957596, 0.04406651109457016, 0.04600558057427406, 0.047944650053977966, 0.04988372325897217, 0.05182279273867607, 0.053761862218379974, 0.05570093169808388, 0.05764000117778778, 0.05957907438278198, 0.061518143862485886, 0.06345721334218979, 0.06539628654718399, 0.0673353523015976, 0.0692744255065918]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 6.0, 8.0, 9.0, 9.0, 9.0, 12.0, 14.0, 22.0, 18.0, 23.0, 38.0, 32.0, 41.0, 31.0, 33.0, 51.0, 36.0, 41.0, 47.0, 39.0, 40.0, 42.0, 31.0, 43.0, 33.0, 38.0, 23.0, 31.0, 31.0, 32.0, 28.0, 14.0, 18.0, 15.0, 14.0, 11.0, 9.0, 7.0, 5.0, 5.0, 5.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9765625, -11.5853271484375, -11.194091796875, -10.8028564453125, -10.41162109375, -10.0203857421875, -9.629150390625, -9.2379150390625, -8.8466796875, -8.4554443359375, -8.064208984375, -7.6729736328125, -7.28173828125, -6.8905029296875, -6.499267578125, -6.1080322265625, -5.716796875, -5.3255615234375, -4.934326171875, -4.5430908203125, -4.15185546875, -3.7606201171875, -3.369384765625, -2.9781494140625, -2.5869140625, -2.1956787109375, -1.804443359375, -1.4132080078125, -1.02197265625, -0.6307373046875, -0.239501953125, 0.1517333984375, 0.54296875, 0.9342041015625, 1.325439453125, 1.7166748046875, 2.10791015625, 2.4991455078125, 2.890380859375, 3.2816162109375, 3.6728515625, 4.0640869140625, 4.455322265625, 4.8465576171875, 5.23779296875, 5.6290283203125, 6.020263671875, 6.4114990234375, 6.802734375, 7.1939697265625, 7.585205078125, 7.9764404296875, 8.36767578125, 8.7589111328125, 9.150146484375, 9.5413818359375, 9.9326171875, 10.3238525390625, 10.715087890625, 11.1063232421875, 11.49755859375, 11.8887939453125, 12.280029296875, 12.6712646484375, 13.0625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 10.0, 4.0, 17.0, 22.0, 23.0, 33.0, 44.0, 68.0, 89.0, 119.0, 151.0, 240.0, 331.0, 474.0, 680.0, 1044.0, 1727.0, 2910.0, 5432.0, 11494.0, 27993.0, 85445.0, 327636.0, 413140.0, 107337.0, 33857.0, 13288.0, 6123.0, 3224.0, 1817.0, 1233.0, 799.0, 507.0, 396.0, 246.0, 151.0, 121.0, 100.0, 56.0, 47.0, 35.0, 26.0, 19.0, 12.0, 12.0, 7.0, 3.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-24.625, -23.880859375, -23.13671875, -22.392578125, -21.6484375, -20.904296875, -20.16015625, -19.416015625, -18.671875, -17.927734375, -17.18359375, -16.439453125, -15.6953125, -14.951171875, -14.20703125, -13.462890625, -12.71875, -11.974609375, -11.23046875, -10.486328125, -9.7421875, -8.998046875, -8.25390625, -7.509765625, -6.765625, -6.021484375, -5.27734375, -4.533203125, -3.7890625, -3.044921875, -2.30078125, -1.556640625, -0.8125, -0.068359375, 0.67578125, 1.419921875, 2.1640625, 2.908203125, 3.65234375, 4.396484375, 5.140625, 5.884765625, 6.62890625, 7.373046875, 8.1171875, 8.861328125, 9.60546875, 10.349609375, 11.09375, 11.837890625, 12.58203125, 13.326171875, 14.0703125, 14.814453125, 15.55859375, 16.302734375, 17.046875, 17.791015625, 18.53515625, 19.279296875, 20.0234375, 20.767578125, 21.51171875, 22.255859375, 23.0]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 6.0, 4.0, 5.0, 11.0, 7.0, 14.0, 15.0, 14.0, 19.0, 21.0, 30.0, 32.0, 42.0, 38.0, 36.0, 62.0, 95.0, 127.0, 204.0, 1422.0, 269.0, 122.0, 82.0, 68.0, 58.0, 37.0, 44.0, 27.0, 26.0, 25.0, 15.0, 17.0, 16.0, 12.0, 5.0, 8.0, 5.0, 4.0, 8.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.3125, -28.35205078125, -27.3916015625, -26.43115234375, -25.470703125, -24.51025390625, -23.5498046875, -22.58935546875, -21.62890625, -20.66845703125, -19.7080078125, -18.74755859375, -17.787109375, -16.82666015625, -15.8662109375, -14.90576171875, -13.9453125, -12.98486328125, -12.0244140625, -11.06396484375, -10.103515625, -9.14306640625, -8.1826171875, -7.22216796875, -6.26171875, -5.30126953125, -4.3408203125, -3.38037109375, -2.419921875, -1.45947265625, -0.4990234375, 0.46142578125, 1.421875, 2.38232421875, 3.3427734375, 4.30322265625, 5.263671875, 6.22412109375, 7.1845703125, 8.14501953125, 9.10546875, 10.06591796875, 11.0263671875, 11.98681640625, 12.947265625, 13.90771484375, 14.8681640625, 15.82861328125, 16.7890625, 17.74951171875, 18.7099609375, 19.67041015625, 20.630859375, 21.59130859375, 22.5517578125, 23.51220703125, 24.47265625, 25.43310546875, 26.3935546875, 27.35400390625, 28.314453125, 29.27490234375, 30.2353515625, 31.19580078125, 32.15625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 10.0, 11.0, 13.0, 14.0, 19.0, 33.0, 70.0, 120.0, 207.0, 393.0, 694.0, 1805.0, 28312.0, 3098305.0, 12875.0, 1422.0, 615.0, 324.0, 170.0, 105.0, 74.0, 41.0, 19.0, 14.0, 11.0, 9.0, 7.0, 6.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-142.875, -138.72265625, -134.5703125, -130.41796875, -126.265625, -122.11328125, -117.9609375, -113.80859375, -109.65625, -105.50390625, -101.3515625, -97.19921875, -93.046875, -88.89453125, -84.7421875, -80.58984375, -76.4375, -72.28515625, -68.1328125, -63.98046875, -59.828125, -55.67578125, -51.5234375, -47.37109375, -43.21875, -39.06640625, -34.9140625, -30.76171875, -26.609375, -22.45703125, -18.3046875, -14.15234375, -10.0, -5.84765625, -1.6953125, 2.45703125, 6.609375, 10.76171875, 14.9140625, 19.06640625, 23.21875, 27.37109375, 31.5234375, 35.67578125, 39.828125, 43.98046875, 48.1328125, 52.28515625, 56.4375, 60.58984375, 64.7421875, 68.89453125, 73.046875, 77.19921875, 81.3515625, 85.50390625, 89.65625, 93.80859375, 97.9609375, 102.11328125, 106.265625, 110.41796875, 114.5703125, 118.72265625, 122.875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 135.0, 559.0, 288.0, 26.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-315.3527526855469, -298.56707763671875, -281.78143310546875, -264.9957580566406, -248.21009826660156, -231.4244384765625, -214.63876342773438, -197.8531036376953, -181.06744384765625, -164.2817840576172, -147.49612426757812, -130.71044921875, -113.92478942871094, -97.13912963867188, -80.35346221923828, -63.56779479980469, -46.782135009765625, -29.996471405029297, -13.210807800292969, 3.5748558044433594, 20.360519409179688, 37.14617919921875, 53.931846618652344, 70.71751403808594, 87.503173828125, 104.28883361816406, 121.07450103759766, 137.86016845703125, 154.6458282470703, 171.43148803710938, 188.2171630859375, 205.00282287597656, 221.78851318359375, 238.5741729736328, 255.35983276367188, 272.1455078125, 288.93115234375, 305.7168273925781, 322.50250244140625, 339.28814697265625, 356.0738220214844, 372.8594970703125, 389.6451416015625, 406.4308166503906, 423.21649169921875, 440.00213623046875, 456.7878112792969, 473.573486328125, 490.359130859375, 507.1448059082031, 523.9304809570312, 540.7161254882812, 557.5017700195312, 574.2874755859375, 591.0731201171875, 607.8587646484375, 624.6444091796875, 641.4300537109375, 658.2157592773438, 675.0014038085938, 691.7870483398438, 708.57275390625, 725.3583984375, 742.14404296875, 758.9297485351562]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 6.0, 8.0, 6.0, 11.0, 7.0, 14.0, 8.0, 19.0, 24.0, 27.0, 23.0, 28.0, 35.0, 37.0, 38.0, 36.0, 40.0, 53.0, 57.0, 47.0, 44.0, 37.0, 40.0, 48.0, 42.0, 40.0, 43.0, 27.0, 28.0, 27.0, 17.0, 17.0, 19.0, 14.0, 14.0, 13.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-96.4081802368164, -93.58419799804688, -90.76020812988281, -87.93622589111328, -85.11224365234375, -82.28825378417969, -79.46427154541016, -76.64028930664062, -73.81629943847656, -70.99231719970703, -68.16832733154297, -65.34434509277344, -62.520362854003906, -59.69637680053711, -56.87239074707031, -54.04840850830078, -51.22442626953125, -48.40044021606445, -45.57645797729492, -42.752471923828125, -39.928489685058594, -37.1045036315918, -34.280517578125, -31.456533432006836, -28.632549285888672, -25.808565139770508, -22.984580993652344, -20.160594940185547, -17.336610794067383, -14.512626647949219, -11.688640594482422, -8.864656448364258, -6.040679931640625, -3.2166953086853027, -0.39271068572998047, 2.4312744140625, 5.255258560180664, 8.079242706298828, 10.903228759765625, 13.727212905883789, 16.551197052001953, 19.375181198120117, 22.19916534423828, 25.023151397705078, 27.847135543823242, 30.671119689941406, 33.4951057434082, 36.319091796875, 39.14307403564453, 41.96706008911133, 44.79104232788086, 47.615028381347656, 50.43901062011719, 53.262996673583984, 56.08698272705078, 58.91096496582031, 61.73495101928711, 64.5589370727539, 67.38291931152344, 70.2069091796875, 73.03089141845703, 75.85487365722656, 78.67886352539062, 81.50284576416016, 84.32682800292969]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 7.0, 8.0, 10.0, 10.0, 13.0, 19.0, 15.0, 15.0, 26.0, 17.0, 21.0, 25.0, 31.0, 27.0, 17.0, 34.0, 42.0, 46.0, 47.0, 29.0, 45.0, 31.0, 39.0, 32.0, 22.0, 40.0, 32.0, 29.0, 23.0, 26.0, 31.0, 20.0, 20.0, 17.0, 28.0, 11.0, 20.0, 11.0, 7.0, 9.0, 10.0, 7.0, 9.0, 4.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-11.4296875, -11.063232421875, -10.69677734375, -10.330322265625, -9.9638671875, -9.597412109375, -9.23095703125, -8.864501953125, -8.498046875, -8.131591796875, -7.76513671875, -7.398681640625, -7.0322265625, -6.665771484375, -6.29931640625, -5.932861328125, -5.56640625, -5.199951171875, -4.83349609375, -4.467041015625, -4.1005859375, -3.734130859375, -3.36767578125, -3.001220703125, -2.634765625, -2.268310546875, -1.90185546875, -1.535400390625, -1.1689453125, -0.802490234375, -0.43603515625, -0.069580078125, 0.296875, 0.663330078125, 1.02978515625, 1.396240234375, 1.7626953125, 2.129150390625, 2.49560546875, 2.862060546875, 3.228515625, 3.594970703125, 3.96142578125, 4.327880859375, 4.6943359375, 5.060791015625, 5.42724609375, 5.793701171875, 6.16015625, 6.526611328125, 6.89306640625, 7.259521484375, 7.6259765625, 7.992431640625, 8.35888671875, 8.725341796875, 9.091796875, 9.458251953125, 9.82470703125, 10.191162109375, 10.5576171875, 10.924072265625, 11.29052734375, 11.656982421875, 12.0234375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 7.0, 2.0, 3.0, 9.0, 9.0, 10.0, 23.0, 27.0, 43.0, 52.0, 80.0, 105.0, 126.0, 212.0, 252.0, 392.0, 552.0, 859.0, 1344.0, 2325.0, 4645.0, 11164.0, 37799.0, 234563.0, 1713534.0, 1869484.0, 253496.0, 40475.0, 11468.0, 4675.0, 2340.0, 1363.0, 890.0, 541.0, 391.0, 279.0, 225.0, 152.0, 96.0, 82.0, 53.0, 55.0, 25.0, 22.0, 17.0, 12.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.40625, -25.4638671875, -24.521484375, -23.5791015625, -22.63671875, -21.6943359375, -20.751953125, -19.8095703125, -18.8671875, -17.9248046875, -16.982421875, -16.0400390625, -15.09765625, -14.1552734375, -13.212890625, -12.2705078125, -11.328125, -10.3857421875, -9.443359375, -8.5009765625, -7.55859375, -6.6162109375, -5.673828125, -4.7314453125, -3.7890625, -2.8466796875, -1.904296875, -0.9619140625, -0.01953125, 0.9228515625, 1.865234375, 2.8076171875, 3.75, 4.6923828125, 5.634765625, 6.5771484375, 7.51953125, 8.4619140625, 9.404296875, 10.3466796875, 11.2890625, 12.2314453125, 13.173828125, 14.1162109375, 15.05859375, 16.0009765625, 16.943359375, 17.8857421875, 18.828125, 19.7705078125, 20.712890625, 21.6552734375, 22.59765625, 23.5400390625, 24.482421875, 25.4248046875, 26.3671875, 27.3095703125, 28.251953125, 29.1943359375, 30.13671875, 31.0791015625, 32.021484375, 32.9638671875, 33.90625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 7.0, 5.0, 5.0, 5.0, 12.0, 9.0, 34.0, 48.0, 76.0, 86.0, 140.0, 193.0, 287.0, 397.0, 526.0, 635.0, 526.0, 321.0, 246.0, 185.0, 98.0, 74.0, 41.0, 43.0, 26.0, 15.0, 15.0, 8.0, 5.0, 4.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.40625, -23.576171875, -22.74609375, -21.916015625, -21.0859375, -20.255859375, -19.42578125, -18.595703125, -17.765625, -16.935546875, -16.10546875, -15.275390625, -14.4453125, -13.615234375, -12.78515625, -11.955078125, -11.125, -10.294921875, -9.46484375, -8.634765625, -7.8046875, -6.974609375, -6.14453125, -5.314453125, -4.484375, -3.654296875, -2.82421875, -1.994140625, -1.1640625, -0.333984375, 0.49609375, 1.326171875, 2.15625, 2.986328125, 3.81640625, 4.646484375, 5.4765625, 6.306640625, 7.13671875, 7.966796875, 8.796875, 9.626953125, 10.45703125, 11.287109375, 12.1171875, 12.947265625, 13.77734375, 14.607421875, 15.4375, 16.267578125, 17.09765625, 17.927734375, 18.7578125, 19.587890625, 20.41796875, 21.248046875, 22.078125, 22.908203125, 23.73828125, 24.568359375, 25.3984375, 26.228515625, 27.05859375, 27.888671875, 28.71875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 5.0, 2.0, 6.0, 12.0, 15.0, 24.0, 39.0, 67.0, 90.0, 168.0, 277.0, 586.0, 1398.0, 4496.0, 23831.0, 344274.0, 3500460.0, 290177.0, 21427.0, 4167.0, 1509.0, 556.0, 275.0, 172.0, 95.0, 52.0, 32.0, 21.0, 17.0, 9.0, 5.0, 4.0, 3.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-54.4375, -52.8583984375, -51.279296875, -49.7001953125, -48.12109375, -46.5419921875, -44.962890625, -43.3837890625, -41.8046875, -40.2255859375, -38.646484375, -37.0673828125, -35.48828125, -33.9091796875, -32.330078125, -30.7509765625, -29.171875, -27.5927734375, -26.013671875, -24.4345703125, -22.85546875, -21.2763671875, -19.697265625, -18.1181640625, -16.5390625, -14.9599609375, -13.380859375, -11.8017578125, -10.22265625, -8.6435546875, -7.064453125, -5.4853515625, -3.90625, -2.3271484375, -0.748046875, 0.8310546875, 2.41015625, 3.9892578125, 5.568359375, 7.1474609375, 8.7265625, 10.3056640625, 11.884765625, 13.4638671875, 15.04296875, 16.6220703125, 18.201171875, 19.7802734375, 21.359375, 22.9384765625, 24.517578125, 26.0966796875, 27.67578125, 29.2548828125, 30.833984375, 32.4130859375, 33.9921875, 35.5712890625, 37.150390625, 38.7294921875, 40.30859375, 41.8876953125, 43.466796875, 45.0458984375, 46.625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 21.0, 103.0, 343.0, 351.0, 156.0, 30.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-475.1687316894531, -462.69586181640625, -450.2230224609375, -437.7501525878906, -425.27728271484375, -412.804443359375, -400.3315734863281, -387.85870361328125, -375.3858642578125, -362.9129943847656, -350.4401550292969, -337.96728515625, -325.49444580078125, -313.0215759277344, -300.5487060546875, -288.07586669921875, -275.6029968261719, -263.130126953125, -250.65728759765625, -238.18441772460938, -225.71156311035156, -213.23870849609375, -200.76583862304688, -188.29298400878906, -175.82012939453125, -163.34727478027344, -150.87442016601562, -138.40155029296875, -125.92869567871094, -113.45584106445312, -100.98297882080078, -88.51011657714844, -76.0372314453125, -63.56437301635742, -51.091514587402344, -38.618656158447266, -26.145797729492188, -13.67293930053711, -1.2000808715820312, 11.272781372070312, 23.745635986328125, 36.2184944152832, 48.69135284423828, 61.16421127319336, 73.63706970214844, 86.10992431640625, 98.5827865600586, 111.05564880371094, 123.52850341796875, 136.00135803222656, 148.47421264648438, 160.94708251953125, 173.41993713378906, 185.89279174804688, 198.36566162109375, 210.83851623535156, 223.31137084960938, 235.7842254638672, 248.257080078125, 260.7299499511719, 273.20281982421875, 285.6756591796875, 298.1485290527344, 310.62139892578125, 323.09423828125]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 4.0, 6.0, 7.0, 6.0, 9.0, 15.0, 12.0, 17.0, 24.0, 20.0, 34.0, 27.0, 36.0, 40.0, 47.0, 56.0, 53.0, 38.0, 57.0, 57.0, 42.0, 42.0, 49.0, 48.0, 30.0, 36.0, 26.0, 27.0, 36.0, 19.0, 22.0, 11.0, 10.0, 14.0, 8.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-95.26493835449219, -92.54150390625, -89.81807708740234, -87.09464263916016, -84.37120819091797, -81.64778137207031, -78.92434692382812, -76.20091247558594, -73.47747802734375, -70.75404357910156, -68.0306167602539, -65.30718231201172, -62.58374786376953, -59.86031723022461, -57.13688659667969, -54.4134521484375, -51.690025329589844, -48.96659469604492, -46.243160247802734, -43.51972961425781, -40.796295166015625, -38.0728645324707, -35.34943389892578, -32.625999450683594, -29.902568817138672, -27.179136276245117, -24.455703735351562, -21.73227310180664, -19.008840560913086, -16.28540802001953, -13.56197738647461, -10.838544845581055, -8.115119934082031, -5.391687870025635, -2.6682558059692383, 0.05517578125, 2.7786083221435547, 5.502040863037109, 8.225471496582031, 10.948904037475586, 13.67233657836914, 16.395769119262695, 19.11920166015625, 21.842632293701172, 24.566064834594727, 27.28949737548828, 30.012928009033203, 32.736358642578125, 35.45979309082031, 38.183223724365234, 40.90665817260742, 43.630088806152344, 46.35352325439453, 49.07695388793945, 51.800384521484375, 54.52381896972656, 57.247249603271484, 59.970680236816406, 62.694114685058594, 65.41754150390625, 68.14097595214844, 70.86441040039062, 73.58784484863281, 76.31127166748047, 79.03470611572266]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 6.0, 4.0, 4.0, 14.0, 6.0, 7.0, 6.0, 17.0, 9.0, 14.0, 19.0, 16.0, 21.0, 25.0, 24.0, 31.0, 32.0, 36.0, 37.0, 31.0, 33.0, 42.0, 44.0, 42.0, 37.0, 31.0, 31.0, 32.0, 31.0, 30.0, 40.0, 27.0, 28.0, 16.0, 15.0, 24.0, 22.0, 19.0, 14.0, 13.0, 14.0, 7.0, 8.0, 11.0, 7.0, 4.0, 9.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.125, -9.7969970703125, -9.468994140625, -9.1409912109375, -8.81298828125, -8.4849853515625, -8.156982421875, -7.8289794921875, -7.5009765625, -7.1729736328125, -6.844970703125, -6.5169677734375, -6.18896484375, -5.8609619140625, -5.532958984375, -5.2049560546875, -4.876953125, -4.5489501953125, -4.220947265625, -3.8929443359375, -3.56494140625, -3.2369384765625, -2.908935546875, -2.5809326171875, -2.2529296875, -1.9249267578125, -1.596923828125, -1.2689208984375, -0.94091796875, -0.6129150390625, -0.284912109375, 0.0430908203125, 0.37109375, 0.6990966796875, 1.027099609375, 1.3551025390625, 1.68310546875, 2.0111083984375, 2.339111328125, 2.6671142578125, 2.9951171875, 3.3231201171875, 3.651123046875, 3.9791259765625, 4.30712890625, 4.6351318359375, 4.963134765625, 5.2911376953125, 5.619140625, 5.9471435546875, 6.275146484375, 6.6031494140625, 6.93115234375, 7.2591552734375, 7.587158203125, 7.9151611328125, 8.2431640625, 8.5711669921875, 8.899169921875, 9.2271728515625, 9.55517578125, 9.8831787109375, 10.211181640625, 10.5391845703125, 10.8671875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 9.0, 11.0, 14.0, 24.0, 32.0, 39.0, 49.0, 88.0, 122.0, 211.0, 280.0, 438.0, 719.0, 1179.0, 1823.0, 3113.0, 5480.0, 9730.0, 17814.0, 34040.0, 66705.0, 137368.0, 255473.0, 247001.0, 131038.0, 63567.0, 32512.0, 17084.0, 9478.0, 5210.0, 3003.0, 1691.0, 1227.0, 682.0, 424.0, 286.0, 194.0, 141.0, 74.0, 62.0, 50.0, 23.0, 17.0, 14.0, 7.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4775390625, -1.4298248291015625, -1.382110595703125, -1.3343963623046875, -1.28668212890625, -1.2389678955078125, -1.191253662109375, -1.1435394287109375, -1.0958251953125, -1.0481109619140625, -1.000396728515625, -0.9526824951171875, -0.90496826171875, -0.8572540283203125, -0.809539794921875, -0.7618255615234375, -0.714111328125, -0.6663970947265625, -0.618682861328125, -0.5709686279296875, -0.52325439453125, -0.4755401611328125, -0.427825927734375, -0.3801116943359375, -0.3323974609375, -0.2846832275390625, -0.236968994140625, -0.1892547607421875, -0.14154052734375, -0.0938262939453125, -0.046112060546875, 0.0016021728515625, 0.04931640625, 0.0970306396484375, 0.144744873046875, 0.1924591064453125, 0.24017333984375, 0.2878875732421875, 0.335601806640625, 0.3833160400390625, 0.4310302734375, 0.4787445068359375, 0.526458740234375, 0.5741729736328125, 0.62188720703125, 0.6696014404296875, 0.717315673828125, 0.7650299072265625, 0.812744140625, 0.8604583740234375, 0.908172607421875, 0.9558868408203125, 1.00360107421875, 1.0513153076171875, 1.099029541015625, 1.1467437744140625, 1.1944580078125, 1.2421722412109375, 1.289886474609375, 1.3376007080078125, 1.38531494140625, 1.4330291748046875, 1.480743408203125, 1.5284576416015625, 1.576171875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 8.0, 5.0, 18.0, 19.0, 26.0, 30.0, 35.0, 24.0, 37.0, 29.0, 51.0, 51.0, 40.0, 51.0, 43.0, 1067.0, 47.0, 45.0, 53.0, 38.0, 50.0, 28.0, 36.0, 38.0, 24.0, 23.0, 24.0, 12.0, 17.0, 10.0, 11.0, 8.0, 6.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4609375, -10.1593017578125, -9.857666015625, -9.5560302734375, -9.25439453125, -8.9527587890625, -8.651123046875, -8.3494873046875, -8.0478515625, -7.7462158203125, -7.444580078125, -7.1429443359375, -6.84130859375, -6.5396728515625, -6.238037109375, -5.9364013671875, -5.634765625, -5.3331298828125, -5.031494140625, -4.7298583984375, -4.42822265625, -4.1265869140625, -3.824951171875, -3.5233154296875, -3.2216796875, -2.9200439453125, -2.618408203125, -2.3167724609375, -2.01513671875, -1.7135009765625, -1.411865234375, -1.1102294921875, -0.80859375, -0.5069580078125, -0.205322265625, 0.0963134765625, 0.39794921875, 0.6995849609375, 1.001220703125, 1.3028564453125, 1.6044921875, 1.9061279296875, 2.207763671875, 2.5093994140625, 2.81103515625, 3.1126708984375, 3.414306640625, 3.7159423828125, 4.017578125, 4.3192138671875, 4.620849609375, 4.9224853515625, 5.22412109375, 5.5257568359375, 5.827392578125, 6.1290283203125, 6.4306640625, 6.7322998046875, 7.033935546875, 7.3355712890625, 7.63720703125, 7.9388427734375, 8.240478515625, 8.5421142578125, 8.84375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 6.0, 7.0, 3.0, 17.0, 17.0, 27.0, 42.0, 77.0, 113.0, 138.0, 206.0, 303.0, 448.0, 752.0, 1047.0, 1562.0, 2496.0, 3943.0, 6366.0, 10113.0, 16593.0, 27673.0, 46345.0, 81239.0, 142735.0, 1113394.0, 331973.0, 128759.0, 72851.0, 42393.0, 25007.0, 15179.0, 9166.0, 5790.0, 3640.0, 2288.0, 1568.0, 937.0, 629.0, 434.0, 256.0, 200.0, 153.0, 80.0, 59.0, 36.0, 24.0, 17.0, 23.0, 10.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.64111328125, -0.6189346313476562, -0.5967559814453125, -0.5745773315429688, -0.552398681640625, -0.5302200317382812, -0.5080413818359375, -0.48586273193359375, -0.46368408203125, -0.44150543212890625, -0.4193267822265625, -0.39714813232421875, -0.374969482421875, -0.35279083251953125, -0.3306121826171875, -0.30843353271484375, -0.2862548828125, -0.26407623291015625, -0.2418975830078125, -0.21971893310546875, -0.197540283203125, -0.17536163330078125, -0.1531829833984375, -0.13100433349609375, -0.10882568359375, -0.08664703369140625, -0.0644683837890625, -0.04228973388671875, -0.020111083984375, 0.00206756591796875, 0.0242462158203125, 0.04642486572265625, 0.068603515625, 0.09078216552734375, 0.1129608154296875, 0.13513946533203125, 0.157318115234375, 0.17949676513671875, 0.2016754150390625, 0.22385406494140625, 0.24603271484375, 0.26821136474609375, 0.2903900146484375, 0.31256866455078125, 0.334747314453125, 0.35692596435546875, 0.3791046142578125, 0.40128326416015625, 0.4234619140625, 0.44564056396484375, 0.4678192138671875, 0.48999786376953125, 0.512176513671875, 0.5343551635742188, 0.5565338134765625, 0.5787124633789062, 0.60089111328125, 0.6230697631835938, 0.6452484130859375, 0.6674270629882812, 0.689605712890625, 0.7117843627929688, 0.7339630126953125, 0.7561416625976562, 0.7783203125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 6.0, 9.0, 5.0, 11.0, 22.0, 22.0, 35.0, 43.0, 52.0, 72.0, 173.0, 189.0, 93.0, 50.0, 44.0, 39.0, 30.0, 13.0, 17.0, 12.0, 14.0, 8.0, 6.0, 5.0, 4.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09820556640625, -0.09540462493896484, -0.09260368347167969, -0.08980274200439453, -0.08700180053710938, -0.08420085906982422, -0.08139991760253906, -0.0785989761352539, -0.07579803466796875, -0.0729970932006836, -0.07019615173339844, -0.06739521026611328, -0.06459426879882812, -0.06179332733154297, -0.05899238586425781, -0.056191444396972656, -0.0533905029296875, -0.050589561462402344, -0.04778861999511719, -0.04498767852783203, -0.042186737060546875, -0.03938579559326172, -0.03658485412597656, -0.033783912658691406, -0.03098297119140625, -0.028182029724121094, -0.025381088256835938, -0.02258014678955078, -0.019779205322265625, -0.01697826385498047, -0.014177322387695312, -0.011376380920410156, -0.008575439453125, -0.005774497985839844, -0.0029735565185546875, -0.00017261505126953125, 0.002628326416015625, 0.005429267883300781, 0.008230209350585938, 0.011031150817871094, 0.01383209228515625, 0.016633033752441406, 0.019433975219726562, 0.02223491668701172, 0.025035858154296875, 0.02783679962158203, 0.030637741088867188, 0.033438682556152344, 0.0362396240234375, 0.039040565490722656, 0.04184150695800781, 0.04464244842529297, 0.047443389892578125, 0.05024433135986328, 0.05304527282714844, 0.055846214294433594, 0.05864715576171875, 0.061448097229003906, 0.06424903869628906, 0.06704998016357422, 0.06985092163085938, 0.07265186309814453, 0.07545280456542969, 0.07825374603271484, 0.0810546875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 10.0, 13.0, 12.0, 21.0, 34.0, 26.0, 45.0, 59.0, 68.0, 116.0, 184.0, 340.0, 1528.0, 27429.0, 1004232.0, 12554.0, 1059.0, 296.0, 153.0, 109.0, 61.0, 64.0, 27.0, 26.0, 25.0, 14.0, 12.0, 11.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.30078125, -1.25653076171875, -1.2122802734375, -1.16802978515625, -1.123779296875, -1.07952880859375, -1.0352783203125, -0.99102783203125, -0.94677734375, -0.90252685546875, -0.8582763671875, -0.81402587890625, -0.769775390625, -0.72552490234375, -0.6812744140625, -0.63702392578125, -0.5927734375, -0.54852294921875, -0.5042724609375, -0.46002197265625, -0.415771484375, -0.37152099609375, -0.3272705078125, -0.28302001953125, -0.23876953125, -0.19451904296875, -0.1502685546875, -0.10601806640625, -0.061767578125, -0.01751708984375, 0.0267333984375, 0.07098388671875, 0.115234375, 0.15948486328125, 0.2037353515625, 0.24798583984375, 0.292236328125, 0.33648681640625, 0.3807373046875, 0.42498779296875, 0.46923828125, 0.51348876953125, 0.5577392578125, 0.60198974609375, 0.646240234375, 0.69049072265625, 0.7347412109375, 0.77899169921875, 0.8232421875, 0.86749267578125, 0.9117431640625, 0.95599365234375, 1.000244140625, 1.04449462890625, 1.0887451171875, 1.13299560546875, 1.17724609375, 1.22149658203125, 1.2657470703125, 1.30999755859375, 1.354248046875, 1.39849853515625, 1.4427490234375, 1.48699951171875, 1.53125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 22.0, 153.0, 786.0, 47.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1769012212753296, -1.1405539512634277, -1.1042068004608154, -1.0678595304489136, -1.0315123796463013, -0.9951651096343994, -0.9588178992271423, -0.9224706888198853, -0.8861234784126282, -0.8497762680053711, -0.813429057598114, -0.7770818471908569, -0.7407345771789551, -0.7043874263763428, -0.6680401563644409, -0.6316929459571838, -0.5953457355499268, -0.5589985251426697, -0.5226513147354126, -0.48630407452583313, -0.44995686411857605, -0.41360965371131897, -0.3772624135017395, -0.3409152030944824, -0.30456799268722534, -0.26822078227996826, -0.23187355697155, -0.1955263316631317, -0.15917912125587463, -0.12283191084861755, -0.08648468554019928, -0.050137460231781006, -0.013790130615234375, 0.022557087242603302, 0.05890430510044098, 0.09525152295827866, 0.13159874081611633, 0.1679459512233734, 0.2042931765317917, 0.24064040184020996, 0.27698761224746704, 0.3133348226547241, 0.3496820330619812, 0.38602927327156067, 0.42237648367881775, 0.45872369408607483, 0.4950709342956543, 0.5314181447029114, 0.5677653551101685, 0.6041125655174255, 0.6404597759246826, 0.6768069863319397, 0.7131541967391968, 0.7495014667510986, 0.7858486771583557, 0.8221958875656128, 0.8585430979728699, 0.894890308380127, 0.931237518787384, 0.9675847291946411, 1.003931999206543, 1.0402791500091553, 1.0766264200210571, 1.112973690032959, 1.1493208408355713]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 8.0, 4.0, 5.0, 9.0, 11.0, 17.0, 13.0, 10.0, 29.0, 19.0, 19.0, 38.0, 23.0, 33.0, 38.0, 53.0, 52.0, 27.0, 38.0, 46.0, 43.0, 28.0, 49.0, 30.0, 41.0, 33.0, 34.0, 32.0, 37.0, 29.0, 22.0, 16.0, 22.0, 14.0, 13.0, 11.0, 12.0, 12.0, 11.0, 7.0, 3.0, 1.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.13943535089492798, -0.13538265228271484, -0.13132993876934052, -0.1272772252559662, -0.12322452664375305, -0.11917182058095932, -0.11511911451816559, -0.11106640845537186, -0.10701370239257812, -0.1029609963297844, -0.09890829026699066, -0.09485558420419693, -0.0908028781414032, -0.08675017207860947, -0.08269746601581573, -0.078644759953022, -0.07459205389022827, -0.07053934782743454, -0.06648664176464081, -0.062433935701847076, -0.058381229639053345, -0.05432852357625961, -0.05027581751346588, -0.04622311145067215, -0.04217040538787842, -0.038117699325084686, -0.034064993262290955, -0.030012287199497223, -0.02595958113670349, -0.02190687507390976, -0.017854169011116028, -0.013801462948322296, -0.009748756885528564, -0.005696050822734833, -0.001643344759941101, 0.0024093613028526306, 0.006462067365646362, 0.010514773428440094, 0.014567479491233826, 0.018620185554027557, 0.02267289161682129, 0.02672559767961502, 0.030778303742408752, 0.034831009805202484, 0.038883715867996216, 0.04293642193078995, 0.04698912799358368, 0.05104183405637741, 0.05509454011917114, 0.059147246181964874, 0.0631999522447586, 0.06725265830755234, 0.07130536437034607, 0.0753580704331398, 0.07941077649593353, 0.08346348255872726, 0.087516188621521, 0.09156889468431473, 0.09562160074710846, 0.09967430680990219, 0.10372701287269592, 0.10777971893548965, 0.11183242499828339, 0.11588513106107712, 0.11993783712387085]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 4.0, 14.0, 6.0, 7.0, 6.0, 17.0, 9.0, 16.0, 17.0, 17.0, 21.0, 24.0, 24.0, 33.0, 30.0, 36.0, 36.0, 32.0, 34.0, 42.0, 41.0, 44.0, 37.0, 30.0, 32.0, 32.0, 30.0, 30.0, 40.0, 28.0, 26.0, 17.0, 16.0, 23.0, 21.0, 20.0, 15.0, 12.0, 15.0, 7.0, 7.0, 12.0, 7.0, 4.0, 9.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-10.1171875, -9.78955078125, -9.4619140625, -9.13427734375, -8.806640625, -8.47900390625, -8.1513671875, -7.82373046875, -7.49609375, -7.16845703125, -6.8408203125, -6.51318359375, -6.185546875, -5.85791015625, -5.5302734375, -5.20263671875, -4.875, -4.54736328125, -4.2197265625, -3.89208984375, -3.564453125, -3.23681640625, -2.9091796875, -2.58154296875, -2.25390625, -1.92626953125, -1.5986328125, -1.27099609375, -0.943359375, -0.61572265625, -0.2880859375, 0.03955078125, 0.3671875, 0.69482421875, 1.0224609375, 1.35009765625, 1.677734375, 2.00537109375, 2.3330078125, 2.66064453125, 2.98828125, 3.31591796875, 3.6435546875, 3.97119140625, 4.298828125, 4.62646484375, 4.9541015625, 5.28173828125, 5.609375, 5.93701171875, 6.2646484375, 6.59228515625, 6.919921875, 7.24755859375, 7.5751953125, 7.90283203125, 8.23046875, 8.55810546875, 8.8857421875, 9.21337890625, 9.541015625, 9.86865234375, 10.1962890625, 10.52392578125, 10.8515625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 9.0, 6.0, 16.0, 19.0, 16.0, 18.0, 42.0, 31.0, 51.0, 54.0, 78.0, 92.0, 122.0, 156.0, 197.0, 261.0, 334.0, 501.0, 631.0, 1064.0, 1780.0, 3064.0, 5737.0, 12099.0, 28024.0, 74291.0, 218728.0, 384708.0, 198432.0, 67692.0, 25554.0, 11223.0, 5393.0, 2881.0, 1610.0, 1049.0, 655.0, 474.0, 327.0, 260.0, 214.0, 142.0, 130.0, 75.0, 71.0, 48.0, 50.0, 38.0, 38.0, 19.0, 22.0, 13.0, 7.0, 10.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-13.1484375, -12.7166748046875, -12.284912109375, -11.8531494140625, -11.42138671875, -10.9896240234375, -10.557861328125, -10.1260986328125, -9.6943359375, -9.2625732421875, -8.830810546875, -8.3990478515625, -7.96728515625, -7.5355224609375, -7.103759765625, -6.6719970703125, -6.240234375, -5.8084716796875, -5.376708984375, -4.9449462890625, -4.51318359375, -4.0814208984375, -3.649658203125, -3.2178955078125, -2.7861328125, -2.3543701171875, -1.922607421875, -1.4908447265625, -1.05908203125, -0.6273193359375, -0.195556640625, 0.2362060546875, 0.66796875, 1.0997314453125, 1.531494140625, 1.9632568359375, 2.39501953125, 2.8267822265625, 3.258544921875, 3.6903076171875, 4.1220703125, 4.5538330078125, 4.985595703125, 5.4173583984375, 5.84912109375, 6.2808837890625, 6.712646484375, 7.1444091796875, 7.576171875, 8.0079345703125, 8.439697265625, 8.8714599609375, 9.30322265625, 9.7349853515625, 10.166748046875, 10.5985107421875, 11.0302734375, 11.4620361328125, 11.893798828125, 12.3255615234375, 12.75732421875, 13.1890869140625, 13.620849609375, 14.0526123046875, 14.484375]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 3.0, 9.0, 5.0, 11.0, 12.0, 16.0, 17.0, 15.0, 25.0, 29.0, 31.0, 44.0, 40.0, 51.0, 74.0, 118.0, 178.0, 1436.0, 339.0, 164.0, 92.0, 57.0, 49.0, 33.0, 34.0, 27.0, 26.0, 16.0, 19.0, 10.0, 14.0, 5.0, 9.0, 10.0, 4.0, 3.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-37.75, -36.568359375, -35.38671875, -34.205078125, -33.0234375, -31.841796875, -30.66015625, -29.478515625, -28.296875, -27.115234375, -25.93359375, -24.751953125, -23.5703125, -22.388671875, -21.20703125, -20.025390625, -18.84375, -17.662109375, -16.48046875, -15.298828125, -14.1171875, -12.935546875, -11.75390625, -10.572265625, -9.390625, -8.208984375, -7.02734375, -5.845703125, -4.6640625, -3.482421875, -2.30078125, -1.119140625, 0.0625, 1.244140625, 2.42578125, 3.607421875, 4.7890625, 5.970703125, 7.15234375, 8.333984375, 9.515625, 10.697265625, 11.87890625, 13.060546875, 14.2421875, 15.423828125, 16.60546875, 17.787109375, 18.96875, 20.150390625, 21.33203125, 22.513671875, 23.6953125, 24.876953125, 26.05859375, 27.240234375, 28.421875, 29.603515625, 30.78515625, 31.966796875, 33.1484375, 34.330078125, 35.51171875, 36.693359375, 37.875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 7.0, 5.0, 6.0, 9.0, 9.0, 15.0, 22.0, 30.0, 41.0, 48.0, 70.0, 102.0, 137.0, 250.0, 537.0, 1411.0, 10688.0, 2814923.0, 310744.0, 4426.0, 1018.0, 421.0, 247.0, 155.0, 111.0, 53.0, 51.0, 43.0, 26.0, 22.0, 16.0, 15.0, 9.0, 5.0, 5.0, 5.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.8125, -69.4052734375, -66.998046875, -64.5908203125, -62.18359375, -59.7763671875, -57.369140625, -54.9619140625, -52.5546875, -50.1474609375, -47.740234375, -45.3330078125, -42.92578125, -40.5185546875, -38.111328125, -35.7041015625, -33.296875, -30.8896484375, -28.482421875, -26.0751953125, -23.66796875, -21.2607421875, -18.853515625, -16.4462890625, -14.0390625, -11.6318359375, -9.224609375, -6.8173828125, -4.41015625, -2.0029296875, 0.404296875, 2.8115234375, 5.21875, 7.6259765625, 10.033203125, 12.4404296875, 14.84765625, 17.2548828125, 19.662109375, 22.0693359375, 24.4765625, 26.8837890625, 29.291015625, 31.6982421875, 34.10546875, 36.5126953125, 38.919921875, 41.3271484375, 43.734375, 46.1416015625, 48.548828125, 50.9560546875, 53.36328125, 55.7705078125, 58.177734375, 60.5849609375, 62.9921875, 65.3994140625, 67.806640625, 70.2138671875, 72.62109375, 75.0283203125, 77.435546875, 79.8427734375, 82.25]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 11.0, 149.0, 591.0, 240.0, 19.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-664.5567626953125, -649.9706420898438, -635.384521484375, -620.7984008789062, -606.2122802734375, -591.626220703125, -577.0400390625, -562.4539794921875, -547.8678588867188, -533.28173828125, -518.6956176757812, -504.1094970703125, -489.5234069824219, -474.9372863769531, -460.3511657714844, -445.7650451660156, -431.1789245605469, -416.5928039550781, -402.0066833496094, -387.42059326171875, -372.83447265625, -358.24835205078125, -343.6622314453125, -329.07611083984375, -314.489990234375, -299.90386962890625, -285.3177490234375, -270.73162841796875, -256.1455383300781, -241.55941772460938, -226.97329711914062, -212.38717651367188, -197.80108642578125, -183.2149658203125, -168.6288604736328, -154.04273986816406, -139.45663452148438, -124.87051391601562, -110.28439331054688, -95.69828033447266, -81.11216735839844, -66.52605438232422, -51.939937591552734, -37.35382080078125, -22.76770782470703, -8.181594848632812, 6.4045257568359375, 20.990638732910156, 35.576751708984375, 50.162864685058594, 64.74897766113281, 79.33509826660156, 93.92121124267578, 108.50732421875, 123.09344482421875, 137.6795654296875, 152.2656707763672, 166.85179138183594, 181.43789672851562, 196.02401733398438, 210.61013793945312, 225.1962432861328, 239.78236389160156, 254.36846923828125, 268.95458984375]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 8.0, 19.0, 23.0, 21.0, 56.0, 49.0, 54.0, 70.0, 78.0, 81.0, 72.0, 93.0, 64.0, 59.0, 65.0, 59.0, 35.0, 32.0, 27.0, 15.0, 8.0, 2.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.67172241210938, -166.9735870361328, -162.2754669189453, -157.57733154296875, -152.87921142578125, -148.1810760498047, -143.48294067382812, -138.78482055664062, -134.08668518066406, -129.3885498046875, -124.6904296875, -119.99229431152344, -115.2941665649414, -110.59603881835938, -105.89790344238281, -101.19977569580078, -96.50164794921875, -91.80352020263672, -87.10539245605469, -82.40725708007812, -77.7091293334961, -73.01100158691406, -68.3128662109375, -63.61473846435547, -58.91661071777344, -54.218482971191406, -49.52035140991211, -44.82221984863281, -40.12409210205078, -35.42596435546875, -30.727832794189453, -26.029701232910156, -21.331573486328125, -16.63344383239746, -11.935314178466797, -7.237184524536133, -2.5390548706054688, 2.1590747833251953, 6.857204437255859, 11.555335998535156, 16.253463745117188, 20.95159339904785, 25.649723052978516, 30.34785270690918, 35.045982360839844, 39.744110107421875, 44.44224166870117, 49.14037322998047, 53.8385009765625, 58.53662872314453, 63.23476028442383, 67.93289184570312, 72.63101959228516, 77.32914733886719, 82.02728271484375, 86.72541046142578, 91.42353820800781, 96.12166595458984, 100.81979370117188, 105.51792907714844, 110.21605682373047, 114.9141845703125, 119.61231994628906, 124.3104476928711, 129.00857543945312]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 0.0, 4.0, 4.0, 6.0, 8.0, 3.0, 5.0, 5.0, 6.0, 10.0, 15.0, 10.0, 16.0, 12.0, 18.0, 21.0, 22.0, 14.0, 30.0, 23.0, 34.0, 45.0, 26.0, 35.0, 34.0, 39.0, 40.0, 38.0, 41.0, 33.0, 25.0, 37.0, 41.0, 31.0, 32.0, 35.0, 20.0, 26.0, 21.0, 21.0, 16.0, 17.0, 15.0, 11.0, 14.0, 6.0, 13.0, 4.0, 6.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 5.0], "bins": [-12.0078125, -11.62744140625, -11.2470703125, -10.86669921875, -10.486328125, -10.10595703125, -9.7255859375, -9.34521484375, -8.96484375, -8.58447265625, -8.2041015625, -7.82373046875, -7.443359375, -7.06298828125, -6.6826171875, -6.30224609375, -5.921875, -5.54150390625, -5.1611328125, -4.78076171875, -4.400390625, -4.02001953125, -3.6396484375, -3.25927734375, -2.87890625, -2.49853515625, -2.1181640625, -1.73779296875, -1.357421875, -0.97705078125, -0.5966796875, -0.21630859375, 0.1640625, 0.54443359375, 0.9248046875, 1.30517578125, 1.685546875, 2.06591796875, 2.4462890625, 2.82666015625, 3.20703125, 3.58740234375, 3.9677734375, 4.34814453125, 4.728515625, 5.10888671875, 5.4892578125, 5.86962890625, 6.25, 6.63037109375, 7.0107421875, 7.39111328125, 7.771484375, 8.15185546875, 8.5322265625, 8.91259765625, 9.29296875, 9.67333984375, 10.0537109375, 10.43408203125, 10.814453125, 11.19482421875, 11.5751953125, 11.95556640625, 12.3359375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 7.0, 14.0, 9.0, 8.0, 24.0, 24.0, 35.0, 48.0, 56.0, 96.0, 133.0, 186.0, 274.0, 455.0, 796.0, 1664.0, 5070.0, 24122.0, 244108.0, 3251272.0, 610847.0, 42574.0, 7584.0, 2260.0, 981.0, 539.0, 357.0, 219.0, 154.0, 119.0, 62.0, 53.0, 35.0, 28.0, 18.0, 14.0, 8.0, 9.0, 4.0, 7.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.0625, -70.890625, -68.71875, -66.546875, -64.375, -62.203125, -60.03125, -57.859375, -55.6875, -53.515625, -51.34375, -49.171875, -47.0, -44.828125, -42.65625, -40.484375, -38.3125, -36.140625, -33.96875, -31.796875, -29.625, -27.453125, -25.28125, -23.109375, -20.9375, -18.765625, -16.59375, -14.421875, -12.25, -10.078125, -7.90625, -5.734375, -3.5625, -1.390625, 0.78125, 2.953125, 5.125, 7.296875, 9.46875, 11.640625, 13.8125, 15.984375, 18.15625, 20.328125, 22.5, 24.671875, 26.84375, 29.015625, 31.1875, 33.359375, 35.53125, 37.703125, 39.875, 42.046875, 44.21875, 46.390625, 48.5625, 50.734375, 52.90625, 55.078125, 57.25, 59.421875, 61.59375, 63.765625, 65.9375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 7.0, 11.0, 18.0, 27.0, 51.0, 51.0, 82.0, 94.0, 134.0, 197.0, 310.0, 410.0, 498.0, 519.0, 429.0, 327.0, 246.0, 179.0, 130.0, 102.0, 72.0, 58.0, 38.0, 24.0, 15.0, 11.0, 10.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-36.90625, -35.91455078125, -34.9228515625, -33.93115234375, -32.939453125, -31.94775390625, -30.9560546875, -29.96435546875, -28.97265625, -27.98095703125, -26.9892578125, -25.99755859375, -25.005859375, -24.01416015625, -23.0224609375, -22.03076171875, -21.0390625, -20.04736328125, -19.0556640625, -18.06396484375, -17.072265625, -16.08056640625, -15.0888671875, -14.09716796875, -13.10546875, -12.11376953125, -11.1220703125, -10.13037109375, -9.138671875, -8.14697265625, -7.1552734375, -6.16357421875, -5.171875, -4.18017578125, -3.1884765625, -2.19677734375, -1.205078125, -0.21337890625, 0.7783203125, 1.77001953125, 2.76171875, 3.75341796875, 4.7451171875, 5.73681640625, 6.728515625, 7.72021484375, 8.7119140625, 9.70361328125, 10.6953125, 11.68701171875, 12.6787109375, 13.67041015625, 14.662109375, 15.65380859375, 16.6455078125, 17.63720703125, 18.62890625, 19.62060546875, 20.6123046875, 21.60400390625, 22.595703125, 23.58740234375, 24.5791015625, 25.57080078125, 26.5625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 6.0, 8.0, 4.0, 4.0, 7.0, 11.0, 17.0, 12.0, 22.0, 50.0, 81.0, 162.0, 446.0, 1307.0, 4690.0, 28094.0, 262241.0, 2967154.0, 847359.0, 69353.0, 9826.0, 2148.0, 687.0, 303.0, 124.0, 55.0, 34.0, 24.0, 19.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-62.15625, -60.55078125, -58.9453125, -57.33984375, -55.734375, -54.12890625, -52.5234375, -50.91796875, -49.3125, -47.70703125, -46.1015625, -44.49609375, -42.890625, -41.28515625, -39.6796875, -38.07421875, -36.46875, -34.86328125, -33.2578125, -31.65234375, -30.046875, -28.44140625, -26.8359375, -25.23046875, -23.625, -22.01953125, -20.4140625, -18.80859375, -17.203125, -15.59765625, -13.9921875, -12.38671875, -10.78125, -9.17578125, -7.5703125, -5.96484375, -4.359375, -2.75390625, -1.1484375, 0.45703125, 2.0625, 3.66796875, 5.2734375, 6.87890625, 8.484375, 10.08984375, 11.6953125, 13.30078125, 14.90625, 16.51171875, 18.1171875, 19.72265625, 21.328125, 22.93359375, 24.5390625, 26.14453125, 27.75, 29.35546875, 30.9609375, 32.56640625, 34.171875, 35.77734375, 37.3828125, 38.98828125, 40.59375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 10.0, 9.0, 3.0, 13.0, 17.0, 23.0, 17.0, 30.0, 31.0, 46.0, 38.0, 55.0, 64.0, 60.0, 72.0, 55.0, 66.0, 62.0, 66.0, 54.0, 40.0, 33.0, 22.0, 27.0, 24.0, 18.0, 12.0, 6.0, 12.0, 9.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-194.50086975097656, -189.0660858154297, -183.63128662109375, -178.19650268554688, -172.76171875, -167.32693481445312, -161.8921356201172, -156.4573516845703, -151.02255249023438, -145.5877685546875, -140.15296936035156, -134.7181854248047, -129.2834014892578, -123.8486099243164, -118.413818359375, -112.97903442382812, -107.54425048828125, -102.10945892333984, -96.67467498779297, -91.23988342285156, -85.80509948730469, -80.37030792236328, -74.93551635742188, -69.500732421875, -64.0659408569336, -58.63115310668945, -53.19636535644531, -47.761573791503906, -42.326786041259766, -36.891998291015625, -31.45720672607422, -26.022418975830078, -20.587646484375, -15.152857780456543, -9.718069076538086, -4.2832794189453125, 1.1515083312988281, 6.586296081542969, 12.021087646484375, 17.455875396728516, 22.890663146972656, 28.325450897216797, 33.76023864746094, 39.195030212402344, 44.629817962646484, 50.064605712890625, 55.49939727783203, 60.93418502807617, 66.36897277832031, 71.80376434326172, 77.2385482788086, 82.67333984375, 88.10812377929688, 93.54291534423828, 98.97770690917969, 104.41249084472656, 109.84728240966797, 115.28207397460938, 120.71685791015625, 126.15164947509766, 131.58644104003906, 137.02122497558594, 142.45602416992188, 147.89080810546875, 153.32559204101562]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 7.0, 7.0, 6.0, 12.0, 7.0, 8.0, 11.0, 20.0, 21.0, 21.0, 28.0, 25.0, 29.0, 35.0, 46.0, 34.0, 33.0, 49.0, 39.0, 39.0, 49.0, 49.0, 46.0, 39.0, 32.0, 35.0, 37.0, 30.0, 32.0, 23.0, 21.0, 15.0, 22.0, 15.0, 7.0, 13.0, 10.0, 10.0, 8.0, 13.0, 4.0, 4.0, 5.0, 6.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.61731719970703, -123.5925064086914, -119.56768798828125, -115.54287719726562, -111.51805877685547, -107.49324798583984, -103.46842956542969, -99.44361877441406, -95.41880798339844, -91.39399719238281, -87.36917877197266, -83.34436798095703, -79.31954956054688, -75.29473876953125, -71.26992797851562, -67.24510955810547, -63.22029113769531, -59.19547653198242, -55.17066192626953, -51.145851135253906, -47.12103271484375, -43.096221923828125, -39.071407318115234, -35.046592712402344, -31.021778106689453, -26.996963500976562, -22.972148895263672, -18.947336196899414, -14.922521591186523, -10.897706985473633, -6.872894287109375, -2.8480796813964844, 1.176727294921875, 5.201541423797607, 9.22635555267334, 13.251169204711914, 17.275983810424805, 21.300798416137695, 25.325611114501953, 29.350425720214844, 33.375240325927734, 37.400054931640625, 41.424869537353516, 45.449684143066406, 49.47449493408203, 53.49931335449219, 57.52412414550781, 61.5489387512207, 65.5737533569336, 69.59856414794922, 73.62338256835938, 77.648193359375, 81.67301177978516, 85.69782257080078, 89.72264099121094, 93.74745178222656, 97.77226257324219, 101.79707336425781, 105.82189178466797, 109.8467025756836, 113.87152099609375, 117.89633178710938, 121.921142578125, 125.94596099853516, 129.9707794189453]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 5.0, 5.0, 14.0, 13.0, 18.0, 25.0, 7.0, 27.0, 26.0, 28.0, 27.0, 26.0, 42.0, 27.0, 47.0, 44.0, 52.0, 40.0, 35.0, 40.0, 47.0, 41.0, 49.0, 37.0, 36.0, 35.0, 26.0, 23.0, 21.0, 18.0, 13.0, 15.0, 16.0, 8.0, 10.0, 8.0, 14.0, 6.0, 7.0, 3.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-202.125, -195.068359375, -188.01171875, -180.955078125, -173.8984375, -166.841796875, -159.78515625, -152.728515625, -145.671875, -138.615234375, -131.55859375, -124.501953125, -117.4453125, -110.388671875, -103.33203125, -96.275390625, -89.21875, -82.162109375, -75.10546875, -68.048828125, -60.9921875, -53.935546875, -46.87890625, -39.822265625, -32.765625, -25.708984375, -18.65234375, -11.595703125, -4.5390625, 2.517578125, 9.57421875, 16.630859375, 23.6875, 30.744140625, 37.80078125, 44.857421875, 51.9140625, 58.970703125, 66.02734375, 73.083984375, 80.140625, 87.197265625, 94.25390625, 101.310546875, 108.3671875, 115.423828125, 122.48046875, 129.537109375, 136.59375, 143.650390625, 150.70703125, 157.763671875, 164.8203125, 171.876953125, 178.93359375, 185.990234375, 193.046875, 200.103515625, 207.16015625, 214.216796875, 221.2734375, 228.330078125, 235.38671875, 242.443359375, 249.5]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 13.0, 12.0, 30.0, 44.0, 60.0, 84.0, 139.0, 227.0, 349.0, 515.0, 829.0, 1346.0, 1945.0, 3136.0, 4732.0, 7234.0, 10783.0, 16071.0, 25148.0, 38240.0, 58354.0, 87557.0, 129884.0, 169065.0, 157689.0, 113964.0, 76129.0, 49929.0, 32625.0, 21411.0, 14012.0, 9158.0, 6083.0, 4029.0, 2691.0, 1808.0, 1137.0, 769.0, 513.0, 287.0, 177.0, 137.0, 81.0, 51.0, 32.0, 19.0, 10.0, 7.0, 7.0, 5.0, 3.0, 0.0, 0.0, 2.0], "bins": [-10.5234375, -10.2122802734375, -9.901123046875, -9.5899658203125, -9.27880859375, -8.9676513671875, -8.656494140625, -8.3453369140625, -8.0341796875, -7.7230224609375, -7.411865234375, -7.1007080078125, -6.78955078125, -6.4783935546875, -6.167236328125, -5.8560791015625, -5.544921875, -5.2337646484375, -4.922607421875, -4.6114501953125, -4.30029296875, -3.9891357421875, -3.677978515625, -3.3668212890625, -3.0556640625, -2.7445068359375, -2.433349609375, -2.1221923828125, -1.81103515625, -1.4998779296875, -1.188720703125, -0.8775634765625, -0.56640625, -0.2552490234375, 0.055908203125, 0.3670654296875, 0.67822265625, 0.9893798828125, 1.300537109375, 1.6116943359375, 1.9228515625, 2.2340087890625, 2.545166015625, 2.8563232421875, 3.16748046875, 3.4786376953125, 3.789794921875, 4.1009521484375, 4.412109375, 4.7232666015625, 5.034423828125, 5.3455810546875, 5.65673828125, 5.9678955078125, 6.279052734375, 6.5902099609375, 6.9013671875, 7.2125244140625, 7.523681640625, 7.8348388671875, 8.14599609375, 8.4571533203125, 8.768310546875, 9.0794677734375, 9.390625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 8.0, 8.0, 4.0, 5.0, 11.0, 20.0, 13.0, 9.0, 25.0, 23.0, 20.0, 23.0, 25.0, 18.0, 21.0, 36.0, 30.0, 37.0, 27.0, 33.0, 35.0, 37.0, 1061.0, 33.0, 40.0, 34.0, 30.0, 37.0, 31.0, 39.0, 29.0, 19.0, 28.0, 22.0, 17.0, 19.0, 28.0, 16.0, 18.0, 12.0, 6.0, 9.0, 3.0, 10.0, 2.0, 3.0, 6.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-122.1875, -118.1787109375, -114.169921875, -110.1611328125, -106.15234375, -102.1435546875, -98.134765625, -94.1259765625, -90.1171875, -86.1083984375, -82.099609375, -78.0908203125, -74.08203125, -70.0732421875, -66.064453125, -62.0556640625, -58.046875, -54.0380859375, -50.029296875, -46.0205078125, -42.01171875, -38.0029296875, -33.994140625, -29.9853515625, -25.9765625, -21.9677734375, -17.958984375, -13.9501953125, -9.94140625, -5.9326171875, -1.923828125, 2.0849609375, 6.09375, 10.1025390625, 14.111328125, 18.1201171875, 22.12890625, 26.1376953125, 30.146484375, 34.1552734375, 38.1640625, 42.1728515625, 46.181640625, 50.1904296875, 54.19921875, 58.2080078125, 62.216796875, 66.2255859375, 70.234375, 74.2431640625, 78.251953125, 82.2607421875, 86.26953125, 90.2783203125, 94.287109375, 98.2958984375, 102.3046875, 106.3134765625, 110.322265625, 114.3310546875, 118.33984375, 122.3486328125, 126.357421875, 130.3662109375, 134.375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 9.0, 8.0, 8.0, 16.0, 25.0, 49.0, 73.0, 111.0, 163.0, 229.0, 332.0, 532.0, 841.0, 1219.0, 1817.0, 2857.0, 4403.0, 6877.0, 10676.0, 17414.0, 28020.0, 46223.0, 75079.0, 117245.0, 167190.0, 1229433.0, 140743.0, 92970.0, 57786.0, 35689.0, 21793.0, 13430.0, 8399.0, 5364.0, 3471.0, 2252.0, 1511.0, 997.0, 645.0, 451.0, 259.0, 179.0, 134.0, 86.0, 47.0, 33.0, 18.0, 15.0, 7.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1328125, -7.8724365234375, -7.612060546875, -7.3516845703125, -7.09130859375, -6.8309326171875, -6.570556640625, -6.3101806640625, -6.0498046875, -5.7894287109375, -5.529052734375, -5.2686767578125, -5.00830078125, -4.7479248046875, -4.487548828125, -4.2271728515625, -3.966796875, -3.7064208984375, -3.446044921875, -3.1856689453125, -2.92529296875, -2.6649169921875, -2.404541015625, -2.1441650390625, -1.8837890625, -1.6234130859375, -1.363037109375, -1.1026611328125, -0.84228515625, -0.5819091796875, -0.321533203125, -0.0611572265625, 0.19921875, 0.4595947265625, 0.719970703125, 0.9803466796875, 1.24072265625, 1.5010986328125, 1.761474609375, 2.0218505859375, 2.2822265625, 2.5426025390625, 2.802978515625, 3.0633544921875, 3.32373046875, 3.5841064453125, 3.844482421875, 4.1048583984375, 4.365234375, 4.6256103515625, 4.885986328125, 5.1463623046875, 5.40673828125, 5.6671142578125, 5.927490234375, 6.1878662109375, 6.4482421875, 6.7086181640625, 6.968994140625, 7.2293701171875, 7.48974609375, 7.7501220703125, 8.010498046875, 8.2708740234375, 8.53125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 5.0, 5.0, 2.0, 10.0, 8.0, 9.0, 8.0, 11.0, 14.0, 25.0, 16.0, 31.0, 47.0, 40.0, 35.0, 41.0, 54.0, 46.0, 43.0, 49.0, 39.0, 43.0, 37.0, 32.0, 36.0, 40.0, 44.0, 31.0, 44.0, 29.0, 23.0, 13.0, 17.0, 16.0, 6.0, 12.0, 7.0, 8.0, 13.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.080322265625, -0.07778644561767578, -0.07525062561035156, -0.07271480560302734, -0.07017898559570312, -0.0676431655883789, -0.06510734558105469, -0.06257152557373047, -0.06003570556640625, -0.05749988555908203, -0.05496406555175781, -0.052428245544433594, -0.049892425537109375, -0.047356605529785156, -0.04482078552246094, -0.04228496551513672, -0.0397491455078125, -0.03721332550048828, -0.03467750549316406, -0.032141685485839844, -0.029605865478515625, -0.027070045471191406, -0.024534225463867188, -0.02199840545654297, -0.01946258544921875, -0.01692676544189453, -0.014390945434570312, -0.011855125427246094, -0.009319305419921875, -0.006783485412597656, -0.0042476654052734375, -0.0017118453979492188, 0.000823974609375, 0.0033597946166992188, 0.0058956146240234375, 0.008431434631347656, 0.010967254638671875, 0.013503074645996094, 0.016038894653320312, 0.01857471466064453, 0.02111053466796875, 0.02364635467529297, 0.026182174682617188, 0.028717994689941406, 0.031253814697265625, 0.033789634704589844, 0.03632545471191406, 0.03886127471923828, 0.0413970947265625, 0.04393291473388672, 0.04646873474121094, 0.049004554748535156, 0.051540374755859375, 0.054076194763183594, 0.05661201477050781, 0.05914783477783203, 0.06168365478515625, 0.06421947479248047, 0.06675529479980469, 0.0692911148071289, 0.07182693481445312, 0.07436275482177734, 0.07689857482910156, 0.07943439483642578, 0.08197021484375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 8.0, 8.0, 5.0, 17.0, 31.0, 39.0, 43.0, 80.0, 108.0, 184.0, 270.0, 448.0, 828.0, 1381.0, 2764.0, 5610.0, 12385.0, 28610.0, 68096.0, 167438.0, 359454.0, 234856.0, 94404.0, 39158.0, 17017.0, 7488.0, 3513.0, 1813.0, 968.0, 560.0, 357.0, 193.0, 139.0, 93.0, 55.0, 36.0, 37.0, 30.0, 10.0, 4.0, 6.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.442626953125, -0.42865753173828125, -0.4146881103515625, -0.40071868896484375, -0.386749267578125, -0.37277984619140625, -0.3588104248046875, -0.34484100341796875, -0.33087158203125, -0.31690216064453125, -0.3029327392578125, -0.28896331787109375, -0.274993896484375, -0.26102447509765625, -0.2470550537109375, -0.23308563232421875, -0.2191162109375, -0.20514678955078125, -0.1911773681640625, -0.17720794677734375, -0.163238525390625, -0.14926910400390625, -0.1352996826171875, -0.12133026123046875, -0.10736083984375, -0.09339141845703125, -0.0794219970703125, -0.06545257568359375, -0.051483154296875, -0.03751373291015625, -0.0235443115234375, -0.00957489013671875, 0.00439453125, 0.01836395263671875, 0.0323333740234375, 0.04630279541015625, 0.060272216796875, 0.07424163818359375, 0.0882110595703125, 0.10218048095703125, 0.11614990234375, 0.13011932373046875, 0.1440887451171875, 0.15805816650390625, 0.172027587890625, 0.18599700927734375, 0.1999664306640625, 0.21393585205078125, 0.2279052734375, 0.24187469482421875, 0.2558441162109375, 0.26981353759765625, 0.283782958984375, 0.29775238037109375, 0.3117218017578125, 0.32569122314453125, 0.33966064453125, 0.35363006591796875, 0.3675994873046875, 0.38156890869140625, 0.395538330078125, 0.40950775146484375, 0.4234771728515625, 0.43744659423828125, 0.451416015625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 9.0, 6.0, 12.0, 4.0, 12.0, 10.0, 16.0, 9.0, 18.0, 20.0, 47.0, 82.0, 78.0, 122.0, 118.0, 127.0, 90.0, 72.0, 42.0, 32.0, 20.0, 14.0, 17.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.536999523639679, -0.5258423686027527, -0.5146851539611816, -0.5035279989242554, -0.4923708438873291, -0.48121365904808044, -0.4700564742088318, -0.4588993191719055, -0.44774213433265686, -0.4365849494934082, -0.42542779445648193, -0.4142706096172333, -0.4031134247779846, -0.39195626974105835, -0.3807990849018097, -0.36964190006256104, -0.35848474502563477, -0.3473275601863861, -0.33617040514945984, -0.3250132203102112, -0.3138560652732849, -0.30269888043403625, -0.2915416955947876, -0.28038454055786133, -0.26922735571861267, -0.258070170879364, -0.24691301584243774, -0.2357558310031891, -0.22459866106510162, -0.21344149112701416, -0.2022843062877655, -0.19112713634967804, -0.1799699366092682, -0.16881276667118073, -0.15765559673309326, -0.1464984118938446, -0.13534124195575714, -0.12418407201766968, -0.11302689462900162, -0.10186971724033356, -0.0907125473022461, -0.07955537736415863, -0.06839819997549057, -0.05724102631211281, -0.046083852648735046, -0.034926678985357285, -0.023769505321979523, -0.012612327933311462, -0.001455157995223999, 0.009702015668153763, 0.020859189331531525, 0.032016362994909286, 0.04317353665828705, 0.05433071032166481, 0.06548788398504257, 0.07664506137371063, 0.0878022313117981, 0.09895940124988556, 0.11011657863855362, 0.12127375602722168, 0.13243092596530914, 0.1435880959033966, 0.15474528074264526, 0.16590245068073273, 0.1770596206188202]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 8.0, 1.0, 8.0, 7.0, 11.0, 13.0, 12.0, 10.0, 16.0, 14.0, 14.0, 20.0, 24.0, 27.0, 23.0, 36.0, 26.0, 30.0, 27.0, 37.0, 39.0, 30.0, 28.0, 23.0, 43.0, 31.0, 29.0, 27.0, 34.0, 28.0, 40.0, 24.0, 33.0, 16.0, 26.0, 21.0, 28.0, 28.0, 18.0, 17.0, 12.0, 15.0, 11.0, 13.0, 13.0, 6.0, 4.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.21002990007400513, -0.20393536984920502, -0.1978408396244049, -0.1917463093996048, -0.1856517791748047, -0.17955724895000458, -0.17346271872520447, -0.16736818850040436, -0.16127365827560425, -0.15517912805080414, -0.14908459782600403, -0.14299006760120392, -0.1368955373764038, -0.1308010071516037, -0.12470647692680359, -0.11861194670200348, -0.11251741647720337, -0.10642288625240326, -0.10032835602760315, -0.09423382580280304, -0.08813929557800293, -0.08204476535320282, -0.07595023512840271, -0.0698557049036026, -0.06376117467880249, -0.05766664445400238, -0.05157211422920227, -0.04547758400440216, -0.03938305377960205, -0.03328852355480194, -0.02719399333000183, -0.02109946310520172, -0.015004932880401611, -0.008910402655601501, -0.0028158724308013916, 0.0032786577939987183, 0.009373188018798828, 0.015467718243598938, 0.021562248468399048, 0.027656778693199158, 0.03375130891799927, 0.03984583914279938, 0.04594036936759949, 0.0520348995923996, 0.05812942981719971, 0.06422396004199982, 0.07031849026679993, 0.07641302049160004, 0.08250755071640015, 0.08860208094120026, 0.09469661116600037, 0.10079114139080048, 0.10688567161560059, 0.1129802018404007, 0.1190747320652008, 0.12516926229000092, 0.13126379251480103, 0.13735832273960114, 0.14345285296440125, 0.14954738318920135, 0.15564191341400146, 0.16173644363880157, 0.16783097386360168, 0.1739255040884018, 0.1800200343132019]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 6.0, 10.0, 10.0, 13.0, 20.0, 22.0, 11.0, 30.0, 20.0, 30.0, 29.0, 22.0, 46.0, 25.0, 47.0, 50.0, 47.0, 40.0, 32.0, 41.0, 49.0, 38.0, 50.0, 38.0, 36.0, 31.0, 27.0, 27.0, 18.0, 16.0, 13.0, 15.0, 16.0, 10.0, 9.0, 8.0, 13.0, 6.0, 7.0, 3.0, 1.0, 5.0, 2.0, 0.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-200.375, -193.35546875, -186.3359375, -179.31640625, -172.296875, -165.27734375, -158.2578125, -151.23828125, -144.21875, -137.19921875, -130.1796875, -123.16015625, -116.140625, -109.12109375, -102.1015625, -95.08203125, -88.0625, -81.04296875, -74.0234375, -67.00390625, -59.984375, -52.96484375, -45.9453125, -38.92578125, -31.90625, -24.88671875, -17.8671875, -10.84765625, -3.828125, 3.19140625, 10.2109375, 17.23046875, 24.25, 31.26953125, 38.2890625, 45.30859375, 52.328125, 59.34765625, 66.3671875, 73.38671875, 80.40625, 87.42578125, 94.4453125, 101.46484375, 108.484375, 115.50390625, 122.5234375, 129.54296875, 136.5625, 143.58203125, 150.6015625, 157.62109375, 164.640625, 171.66015625, 178.6796875, 185.69921875, 192.71875, 199.73828125, 206.7578125, 213.77734375, 220.796875, 227.81640625, 234.8359375, 241.85546875, 248.875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 3.0, 7.0, 6.0, 12.0, 15.0, 17.0, 29.0, 36.0, 38.0, 57.0, 78.0, 80.0, 129.0, 178.0, 301.0, 571.0, 1321.0, 4206.0, 19155.0, 132343.0, 592062.0, 252899.0, 35036.0, 6377.0, 1758.0, 706.0, 361.0, 235.0, 142.0, 89.0, 67.0, 40.0, 47.0, 29.0, 32.0, 15.0, 15.0, 9.0, 14.0, 12.0, 7.0, 3.0, 2.0, 2.0, 8.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.3125, -37.94091796875, -36.5693359375, -35.19775390625, -33.826171875, -32.45458984375, -31.0830078125, -29.71142578125, -28.33984375, -26.96826171875, -25.5966796875, -24.22509765625, -22.853515625, -21.48193359375, -20.1103515625, -18.73876953125, -17.3671875, -15.99560546875, -14.6240234375, -13.25244140625, -11.880859375, -10.50927734375, -9.1376953125, -7.76611328125, -6.39453125, -5.02294921875, -3.6513671875, -2.27978515625, -0.908203125, 0.46337890625, 1.8349609375, 3.20654296875, 4.578125, 5.94970703125, 7.3212890625, 8.69287109375, 10.064453125, 11.43603515625, 12.8076171875, 14.17919921875, 15.55078125, 16.92236328125, 18.2939453125, 19.66552734375, 21.037109375, 22.40869140625, 23.7802734375, 25.15185546875, 26.5234375, 27.89501953125, 29.2666015625, 30.63818359375, 32.009765625, 33.38134765625, 34.7529296875, 36.12451171875, 37.49609375, 38.86767578125, 40.2392578125, 41.61083984375, 42.982421875, 44.35400390625, 45.7255859375, 47.09716796875, 48.46875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 6.0, 16.0, 10.0, 15.0, 13.0, 20.0, 23.0, 44.0, 45.0, 51.0, 69.0, 68.0, 72.0, 2109.0, 77.0, 80.0, 49.0, 57.0, 45.0, 42.0, 44.0, 29.0, 18.0, 17.0, 7.0, 8.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-581.5, -566.46484375, -551.4296875, -536.39453125, -521.359375, -506.32421875, -491.2890625, -476.25390625, -461.21875, -446.18359375, -431.1484375, -416.11328125, -401.078125, -386.04296875, -371.0078125, -355.97265625, -340.9375, -325.90234375, -310.8671875, -295.83203125, -280.796875, -265.76171875, -250.7265625, -235.69140625, -220.65625, -205.62109375, -190.5859375, -175.55078125, -160.515625, -145.48046875, -130.4453125, -115.41015625, -100.375, -85.33984375, -70.3046875, -55.26953125, -40.234375, -25.19921875, -10.1640625, 4.87109375, 19.90625, 34.94140625, 49.9765625, 65.01171875, 80.046875, 95.08203125, 110.1171875, 125.15234375, 140.1875, 155.22265625, 170.2578125, 185.29296875, 200.328125, 215.36328125, 230.3984375, 245.43359375, 260.46875, 275.50390625, 290.5390625, 305.57421875, 320.609375, 335.64453125, 350.6796875, 365.71484375, 380.75]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 4.0, 4.0, 8.0, 11.0, 13.0, 15.0, 27.0, 43.0, 57.0, 117.0, 172.0, 340.0, 706.0, 1646.0, 6081.0, 57493.0, 2732776.0, 319892.0, 20664.0, 3363.0, 1145.0, 464.0, 255.0, 152.0, 96.0, 54.0, 34.0, 23.0, 17.0, 15.0, 8.0, 5.0, 2.0, 1.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.34375, -44.83935546875, -43.3349609375, -41.83056640625, -40.326171875, -38.82177734375, -37.3173828125, -35.81298828125, -34.30859375, -32.80419921875, -31.2998046875, -29.79541015625, -28.291015625, -26.78662109375, -25.2822265625, -23.77783203125, -22.2734375, -20.76904296875, -19.2646484375, -17.76025390625, -16.255859375, -14.75146484375, -13.2470703125, -11.74267578125, -10.23828125, -8.73388671875, -7.2294921875, -5.72509765625, -4.220703125, -2.71630859375, -1.2119140625, 0.29248046875, 1.796875, 3.30126953125, 4.8056640625, 6.31005859375, 7.814453125, 9.31884765625, 10.8232421875, 12.32763671875, 13.83203125, 15.33642578125, 16.8408203125, 18.34521484375, 19.849609375, 21.35400390625, 22.8583984375, 24.36279296875, 25.8671875, 27.37158203125, 28.8759765625, 30.38037109375, 31.884765625, 33.38916015625, 34.8935546875, 36.39794921875, 37.90234375, 39.40673828125, 40.9111328125, 42.41552734375, 43.919921875, 45.42431640625, 46.9287109375, 48.43310546875, 49.9375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 8.0, 13.0, 24.0, 34.0, 62.0, 162.0, 215.0, 210.0, 123.0, 58.0, 25.0, 19.0, 17.0, 9.0, 6.0, 9.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-657.27001953125, -634.3551635742188, -611.4402465820312, -588.525390625, -565.6104736328125, -542.6956176757812, -519.78076171875, -496.8658752441406, -473.95098876953125, -451.0361022949219, -428.1212158203125, -405.20635986328125, -382.2914733886719, -359.3765869140625, -336.46173095703125, -313.5468444824219, -290.6319580078125, -267.7170715332031, -244.8022003173828, -221.8873291015625, -198.97244262695312, -176.05755615234375, -153.14268493652344, -130.22781372070312, -107.31292724609375, -84.3980484008789, -61.48316955566406, -38.56829071044922, -15.653411865234375, 7.261466979980469, 30.176345825195312, 53.091217041015625, 76.00604248046875, 98.9209213256836, 121.83580017089844, 144.75067138671875, 167.66555786132812, 190.5804443359375, 213.4953155517578, 236.41018676757812, 259.3250732421875, 282.2399597167969, 305.15484619140625, 328.0697021484375, 350.9845886230469, 373.89947509765625, 396.8143310546875, 419.7292175292969, 442.64410400390625, 465.5589904785156, 488.473876953125, 511.38873291015625, 534.3035888671875, 557.218505859375, 580.1333618164062, 603.0482177734375, 625.963134765625, 648.8779907226562, 671.7929077148438, 694.707763671875, 717.6226806640625, 740.5375366210938, 763.452392578125, 786.3673095703125, 809.2821655273438]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 3.0, 3.0, 5.0, 4.0, 8.0, 5.0, 13.0, 12.0, 15.0, 18.0, 18.0, 17.0, 25.0, 30.0, 25.0, 40.0, 45.0, 33.0, 32.0, 30.0, 35.0, 47.0, 45.0, 30.0, 42.0, 37.0, 34.0, 31.0, 35.0, 33.0, 30.0, 30.0, 31.0, 16.0, 12.0, 11.0, 15.0, 20.0, 14.0, 9.0, 13.0, 10.0, 8.0, 7.0, 12.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0], "bins": [-464.2268371582031, -450.50079345703125, -436.7747497558594, -423.0487060546875, -409.3226623535156, -395.59661865234375, -381.87060546875, -368.14453125, -354.41851806640625, -340.6924743652344, -326.9664306640625, -313.2403869628906, -299.51434326171875, -285.7882995605469, -272.062255859375, -258.33624267578125, -244.61016845703125, -230.88412475585938, -217.1580810546875, -203.43203735351562, -189.70599365234375, -175.97994995117188, -162.25392150878906, -148.5278778076172, -134.8018341064453, -121.07579040527344, -107.34974670410156, -93.62371063232422, -79.89766693115234, -66.17162322998047, -52.445587158203125, -38.71954345703125, -24.9935302734375, -11.267488479614258, 2.4585533142089844, 16.184593200683594, 29.91063690185547, 43.636680603027344, 57.36271667480469, 71.08876037597656, 84.81480407714844, 98.54084777832031, 112.26689147949219, 125.99292755126953, 139.71896362304688, 153.44500732421875, 167.17105102539062, 180.8970947265625, 194.62313842773438, 208.34918212890625, 222.07522583007812, 235.80126953125, 249.52731323242188, 263.25335693359375, 276.9793701171875, 290.7054443359375, 304.43145751953125, 318.1575012207031, 331.883544921875, 345.6095886230469, 359.33563232421875, 373.0616760253906, 386.7877197265625, 400.51373291015625, 414.23980712890625]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 9.0, 17.0, 19.0, 16.0, 20.0, 34.0, 44.0, 62.0, 73.0, 87.0, 114.0, 132.0, 164.0, 187.0, 234.0, 295.0, 392.0, 572.0, 878.0, 1570.0, 3181.0, 6687.0, 1019128.0, 6599.0, 3154.0, 1617.0, 860.0, 539.0, 383.0, 293.0, 229.0, 166.0, 170.0, 145.0, 103.0, 80.0, 60.0, 57.0, 39.0, 33.0, 23.0, 9.0, 18.0, 13.0, 16.0, 9.0, 1.0, 9.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-95.81563568115234, -92.77223205566406, -89.72882843017578, -86.6854248046875, -83.64202117919922, -80.59861755371094, -77.55521392822266, -74.51181030273438, -71.4684066772461, -68.42500305175781, -65.38159942626953, -62.33819580078125, -59.29479217529297, -56.25138854980469, -53.207984924316406, -50.164581298828125, -47.12118148803711, -44.07777786254883, -41.03437423706055, -37.990970611572266, -34.947566986083984, -31.904163360595703, -28.860761642456055, -25.817358016967773, -22.773954391479492, -19.73055076599121, -16.68714714050293, -13.643744468688965, -10.600340843200684, -7.556937217712402, -4.5135345458984375, -1.4701309204101562, 1.573272705078125, 4.616676330566406, 7.660079479217529, 10.703482627868652, 13.746886253356934, 16.79029083251953, 19.83369255065918, 22.87709617614746, 25.920499801635742, 28.963903427124023, 32.00730514526367, 35.05070877075195, 38.094112396240234, 41.137516021728516, 44.1809196472168, 47.22432327270508, 50.26772689819336, 53.31113052368164, 56.35453414916992, 59.3979377746582, 62.441341400146484, 65.4847412109375, 68.52814483642578, 71.57154846191406, 74.61495208740234, 77.65835571289062, 80.7017593383789, 83.74516296386719, 86.78856658935547, 89.83197021484375, 92.87537384033203, 95.91877746582031, 98.9621810913086]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 13.0, 18.0, 38.0, 81.0, 204.0, 23650.0, 51438904.0, 151.0, 43.0, 24.0, 22.0, 11.0, 7.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1442.74267578125, -1352.977294921875, -1263.2119140625, -1173.446533203125, -1083.6812744140625, -993.9158935546875, -904.1505126953125, -814.3851928710938, -724.6198120117188, -634.8544311523438, -545.089111328125, -455.32373046875, -365.5583801269531, -275.79302978515625, -186.02764892578125, -96.2623291015625, -6.4969482421875, 83.2684097290039, 173.0337677001953, 262.79913330078125, 352.5644836425781, 442.329833984375, 532.09521484375, 621.8605346679688, 711.6259155273438, 801.3912963867188, 891.1566162109375, 980.9219970703125, 1070.6873779296875, 1160.45263671875, 1250.218017578125, 1339.9833984375, 1429.748779296875, 1519.51416015625, 1609.279541015625, 1699.044921875, 1788.8101806640625, 1878.5755615234375, 1968.3409423828125, 2058.106201171875, 2147.87158203125, 2237.636962890625, 2327.40234375, 2417.167724609375, 2506.93310546875, 2596.6982421875, 2686.4638671875, 2776.22900390625, 2865.99462890625, 2955.760009765625, 3045.525390625, 3135.290771484375, 3225.05615234375, 3314.8212890625, 3404.5869140625, 3494.35205078125, 3584.117431640625, 3673.8828125, 3763.648193359375, 3853.41357421875, 3943.178955078125, 4032.9443359375, 4122.70947265625, 4212.47509765625, 4302.240234375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 10.0, 6.0, 8.0, 7.0, 14.0, 24.0, 38.0, 61.0, 96.0, 123.0, 180.0, 288.0, 510.0, 825.0, 1243.0, 1867.0, 2953.0, 4557.0, 7005.0, 11123.0, 17339.0, 27194.0, 44026.0, 70579.0, 113621.0, 180721.0, 280320.0, 411455.0, 3328278.0, 767803.0, 362849.0, 243711.0, 153860.0, 96928.0, 59570.0, 37102.0, 23400.0, 14909.0, 9447.0, 6230.0, 3964.0, 2530.0, 1568.0, 1042.0, 701.0, 459.0, 315.0, 216.0, 143.0, 84.0, 53.0, 36.0, 28.0, 12.0, 10.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.125, -2.05377197265625, -1.9825439453125, -1.91131591796875, -1.840087890625, -1.76885986328125, -1.6976318359375, -1.62640380859375, -1.55517578125, -1.48394775390625, -1.4127197265625, -1.34149169921875, -1.270263671875, -1.19903564453125, -1.1278076171875, -1.05657958984375, -0.9853515625, -0.91412353515625, -0.8428955078125, -0.77166748046875, -0.700439453125, -0.62921142578125, -0.5579833984375, -0.48675537109375, -0.41552734375, -0.34429931640625, -0.2730712890625, -0.20184326171875, -0.130615234375, -0.05938720703125, 0.0118408203125, 0.08306884765625, 0.154296875, 0.22552490234375, 0.2967529296875, 0.36798095703125, 0.439208984375, 0.51043701171875, 0.5816650390625, 0.65289306640625, 0.72412109375, 0.79534912109375, 0.8665771484375, 0.93780517578125, 1.009033203125, 1.08026123046875, 1.1514892578125, 1.22271728515625, 1.2939453125, 1.36517333984375, 1.4364013671875, 1.50762939453125, 1.578857421875, 1.65008544921875, 1.7213134765625, 1.79254150390625, 1.86376953125, 1.93499755859375, 2.0062255859375, 2.07745361328125, 2.148681640625, 2.21990966796875, 2.2911376953125, 2.36236572265625, 2.43359375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 9.0, 4.0, 3.0, 6.0, 11.0, 9.0, 11.0, 17.0, 26.0, 23.0, 28.0, 23.0, 31.0, 28.0, 40.0, 41.0, 48.0, 54.0, 48.0, 73.0, 1031.0, 54.0, 41.0, 49.0, 31.0, 39.0, 37.0, 34.0, 26.0, 23.0, 21.0, 14.0, 21.0, 12.0, 13.0, 9.0, 9.0, 7.0, 6.0, 8.0, 4.0, 1.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-60.25, -58.32958984375, -56.4091796875, -54.48876953125, -52.568359375, -50.64794921875, -48.7275390625, -46.80712890625, -44.88671875, -42.96630859375, -41.0458984375, -39.12548828125, -37.205078125, -35.28466796875, -33.3642578125, -31.44384765625, -29.5234375, -27.60302734375, -25.6826171875, -23.76220703125, -21.841796875, -19.92138671875, -18.0009765625, -16.08056640625, -14.16015625, -12.23974609375, -10.3193359375, -8.39892578125, -6.478515625, -4.55810546875, -2.6376953125, -0.71728515625, 1.203125, 3.12353515625, 5.0439453125, 6.96435546875, 8.884765625, 10.80517578125, 12.7255859375, 14.64599609375, 16.56640625, 18.48681640625, 20.4072265625, 22.32763671875, 24.248046875, 26.16845703125, 28.0888671875, 30.00927734375, 31.9296875, 33.85009765625, 35.7705078125, 37.69091796875, 39.611328125, 41.53173828125, 43.4521484375, 45.37255859375, 47.29296875, 49.21337890625, 51.1337890625, 53.05419921875, 54.974609375, 56.89501953125, 58.8154296875, 60.73583984375, 62.65625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 3.0, 16.0, 25.0, 22.0, 43.0, 83.0, 97.0, 172.0, 251.0, 442.0, 695.0, 1101.0, 1666.0, 2532.0, 4058.0, 6341.0, 9935.0, 15322.0, 24697.0, 38299.0, 60766.0, 95421.0, 148210.0, 222687.0, 319264.0, 467347.0, 3515863.0, 437152.0, 310837.0, 215159.0, 141451.0, 91593.0, 57698.0, 36633.0, 23601.0, 15198.0, 9602.0, 6113.0, 3918.0, 2620.0, 1733.0, 1069.0, 666.0, 371.0, 252.0, 142.0, 106.0, 58.0, 38.0, 29.0, 18.0, 5.0, 14.0, 6.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.6826171875, -1.6273651123046875, -1.572113037109375, -1.5168609619140625, -1.46160888671875, -1.4063568115234375, -1.351104736328125, -1.2958526611328125, -1.2406005859375, -1.1853485107421875, -1.130096435546875, -1.0748443603515625, -1.01959228515625, -0.9643402099609375, -0.909088134765625, -0.8538360595703125, -0.798583984375, -0.7433319091796875, -0.688079833984375, -0.6328277587890625, -0.57757568359375, -0.5223236083984375, -0.467071533203125, -0.4118194580078125, -0.3565673828125, -0.3013153076171875, -0.246063232421875, -0.1908111572265625, -0.13555908203125, -0.0803070068359375, -0.025054931640625, 0.0301971435546875, 0.08544921875, 0.1407012939453125, 0.195953369140625, 0.2512054443359375, 0.30645751953125, 0.3617095947265625, 0.416961669921875, 0.4722137451171875, 0.5274658203125, 0.5827178955078125, 0.637969970703125, 0.6932220458984375, 0.74847412109375, 0.8037261962890625, 0.858978271484375, 0.9142303466796875, 0.969482421875, 1.0247344970703125, 1.079986572265625, 1.1352386474609375, 1.19049072265625, 1.2457427978515625, 1.300994873046875, 1.3562469482421875, 1.4114990234375, 1.4667510986328125, 1.522003173828125, 1.5772552490234375, 1.63250732421875, 1.6877593994140625, 1.743011474609375, 1.7982635498046875, 1.853515625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 7.0, 2.0, 11.0, 11.0, 5.0, 9.0, 11.0, 16.0, 11.0, 20.0, 14.0, 23.0, 31.0, 30.0, 28.0, 25.0, 42.0, 45.0, 38.0, 50.0, 36.0, 42.0, 1037.0, 55.0, 50.0, 33.0, 45.0, 34.0, 28.0, 32.0, 28.0, 24.0, 22.0, 22.0, 25.0, 12.0, 17.0, 12.0, 12.0, 13.0, 6.0, 6.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.75, -43.28662109375, -41.8232421875, -40.35986328125, -38.896484375, -37.43310546875, -35.9697265625, -34.50634765625, -33.04296875, -31.57958984375, -30.1162109375, -28.65283203125, -27.189453125, -25.72607421875, -24.2626953125, -22.79931640625, -21.3359375, -19.87255859375, -18.4091796875, -16.94580078125, -15.482421875, -14.01904296875, -12.5556640625, -11.09228515625, -9.62890625, -8.16552734375, -6.7021484375, -5.23876953125, -3.775390625, -2.31201171875, -0.8486328125, 0.61474609375, 2.078125, 3.54150390625, 5.0048828125, 6.46826171875, 7.931640625, 9.39501953125, 10.8583984375, 12.32177734375, 13.78515625, 15.24853515625, 16.7119140625, 18.17529296875, 19.638671875, 21.10205078125, 22.5654296875, 24.02880859375, 25.4921875, 26.95556640625, 28.4189453125, 29.88232421875, 31.345703125, 32.80908203125, 34.2724609375, 35.73583984375, 37.19921875, 38.66259765625, 40.1259765625, 41.58935546875, 43.052734375, 44.51611328125, 45.9794921875, 47.44287109375, 48.90625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 5.0, 4.0, 7.0, 19.0, 8.0, 16.0, 34.0, 31.0, 54.0, 52.0, 74.0, 87.0, 122.0, 197.0, 299.0, 540.0, 864.0, 1750.0, 4314.0, 13810.0, 69257.0, 5911839.0, 237554.0, 35492.0, 8691.0, 2964.0, 1346.0, 644.0, 440.0, 274.0, 193.0, 120.0, 78.0, 80.0, 62.0, 39.0, 20.0, 12.0, 15.0, 9.0, 4.0, 1.0, 7.0, 6.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-17.890625, -17.4046630859375, -16.918701171875, -16.4327392578125, -15.94677734375, -15.4608154296875, -14.974853515625, -14.4888916015625, -14.0029296875, -13.5169677734375, -13.031005859375, -12.5450439453125, -12.05908203125, -11.5731201171875, -11.087158203125, -10.6011962890625, -10.115234375, -9.6292724609375, -9.143310546875, -8.6573486328125, -8.17138671875, -7.6854248046875, -7.199462890625, -6.7135009765625, -6.2275390625, -5.7415771484375, -5.255615234375, -4.7696533203125, -4.28369140625, -3.7977294921875, -3.311767578125, -2.8258056640625, -2.33984375, -1.8538818359375, -1.367919921875, -0.8819580078125, -0.39599609375, 0.0899658203125, 0.575927734375, 1.0618896484375, 1.5478515625, 2.0338134765625, 2.519775390625, 3.0057373046875, 3.49169921875, 3.9776611328125, 4.463623046875, 4.9495849609375, 5.435546875, 5.9215087890625, 6.407470703125, 6.8934326171875, 7.37939453125, 7.8653564453125, 8.351318359375, 8.8372802734375, 9.3232421875, 9.8092041015625, 10.295166015625, 10.7811279296875, 11.26708984375, 11.7530517578125, 12.239013671875, 12.7249755859375, 13.2109375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 8.0, 9.0, 11.0, 10.0, 20.0, 7.0, 15.0, 20.0, 13.0, 27.0, 25.0, 34.0, 26.0, 27.0, 41.0, 34.0, 49.0, 36.0, 48.0, 1030.0, 78.0, 44.0, 49.0, 47.0, 43.0, 26.0, 39.0, 28.0, 29.0, 21.0, 28.0, 28.0, 16.0, 24.0, 6.0, 10.0, 3.0, 5.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.96875, -39.59033203125, -38.2119140625, -36.83349609375, -35.455078125, -34.07666015625, -32.6982421875, -31.31982421875, -29.94140625, -28.56298828125, -27.1845703125, -25.80615234375, -24.427734375, -23.04931640625, -21.6708984375, -20.29248046875, -18.9140625, -17.53564453125, -16.1572265625, -14.77880859375, -13.400390625, -12.02197265625, -10.6435546875, -9.26513671875, -7.88671875, -6.50830078125, -5.1298828125, -3.75146484375, -2.373046875, -0.99462890625, 0.3837890625, 1.76220703125, 3.140625, 4.51904296875, 5.8974609375, 7.27587890625, 8.654296875, 10.03271484375, 11.4111328125, 12.78955078125, 14.16796875, 15.54638671875, 16.9248046875, 18.30322265625, 19.681640625, 21.06005859375, 22.4384765625, 23.81689453125, 25.1953125, 26.57373046875, 27.9521484375, 29.33056640625, 30.708984375, 32.08740234375, 33.4658203125, 34.84423828125, 36.22265625, 37.60107421875, 38.9794921875, 40.35791015625, 41.736328125, 43.11474609375, 44.4931640625, 45.87158203125, 47.25]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 9.0, 22.0, 138.0, 746.0, 67.0, 17.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-671.114990234375, -658.53173828125, -645.9484252929688, -633.3651123046875, -620.7818603515625, -608.1986083984375, -595.6152954101562, -583.031982421875, -570.44873046875, -557.865478515625, -545.2821655273438, -532.6988525390625, -520.1156005859375, -507.5323181152344, -494.94903564453125, -482.3657531738281, -469.782470703125, -457.1991882324219, -444.61590576171875, -432.0326232910156, -419.4493408203125, -406.8660583496094, -394.28277587890625, -381.6994934082031, -369.1162109375, -356.5329284667969, -343.94964599609375, -331.3663635253906, -318.7830810546875, -306.1997985839844, -293.61651611328125, -281.0332336425781, -268.449951171875, -255.86666870117188, -243.28338623046875, -230.70010375976562, -218.1168212890625, -205.53353881835938, -192.95025634765625, -180.36697387695312, -167.78367614746094, -155.2003936767578, -142.6171112060547, -130.03382873535156, -117.45054626464844, -104.86726379394531, -92.28398132324219, -79.70069885253906, -67.11741638183594, -54.53413391113281, -41.95085144042969, -29.367568969726562, -16.784286499023438, -4.2010040283203125, 8.382278442382812, 20.965560913085938, 33.54884338378906, 46.13212585449219, 58.71540832519531, 71.29869079589844, 83.88197326660156, 96.46525573730469, 109.04853820800781, 121.63182067871094, 134.21510314941406]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 12.0, 19.0, 20.0, 19.0, 22.0, 36.0, 45.0, 41.0, 48.0, 46.0, 56.0, 63.0, 39.0, 51.0, 64.0, 51.0, 54.0, 46.0, 47.0, 39.0, 32.0, 22.0, 28.0, 20.0, 20.0, 9.0, 10.0, 12.0, 5.0, 2.0, 3.0, 6.0, 4.0, 0.0, 4.0], "bins": [-152.04510498046875, -148.44219970703125, -144.8393096923828, -141.2364044189453, -137.63351440429688, -134.03060913085938, -130.42770385742188, -126.82481384277344, -123.22190856933594, -119.61901092529297, -116.01611328125, -112.4132080078125, -108.81031036376953, -105.20741271972656, -101.6045150756836, -98.00161743164062, -94.39871215820312, -90.79581451416016, -87.19291687011719, -83.59001159667969, -79.98711395263672, -76.38421630859375, -72.78131866455078, -69.17842102050781, -65.57552337646484, -61.972625732421875, -58.36972427368164, -54.76682662963867, -51.16392517089844, -47.56102752685547, -43.9581298828125, -40.355228424072266, -36.75232696533203, -33.14942932128906, -29.546527862548828, -25.94363021850586, -22.340728759765625, -18.737831115722656, -15.134931564331055, -11.532032012939453, -7.929132461547852, -4.32623291015625, -0.7233338356018066, 2.8795652389526367, 6.482464790344238, 10.085363388061523, 13.688262939453125, 17.291162490844727, 20.894062042236328, 24.49696159362793, 28.09986114501953, 31.7027587890625, 35.305660247802734, 38.9085578918457, 42.51145935058594, 46.114356994628906, 49.717254638671875, 53.320152282714844, 56.92305374145508, 60.52595138549805, 64.12885284423828, 67.73175048828125, 71.33464813232422, 74.93754577636719, 78.54045104980469]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 5.0, 6.0, 6.0, 12.0, 15.0, 22.0, 29.0, 39.0, 55.0, 88.0, 87.0, 125.0, 181.0, 322.0, 512.0, 979.0, 1934.0, 5563.0, 51609.0, 4041125.0, 78853.0, 7920.0, 2417.0, 1055.0, 557.0, 305.0, 136.0, 105.0, 64.0, 45.0, 42.0, 9.0, 7.0, 17.0, 5.0, 3.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.403076171875, -0.3917388916015625, -0.380401611328125, -0.3690643310546875, -0.35772705078125, -0.3463897705078125, -0.335052490234375, -0.3237152099609375, -0.3123779296875, -0.3010406494140625, -0.289703369140625, -0.2783660888671875, -0.26702880859375, -0.2556915283203125, -0.244354248046875, -0.2330169677734375, -0.2216796875, -0.2103424072265625, -0.199005126953125, -0.1876678466796875, -0.17633056640625, -0.1649932861328125, -0.153656005859375, -0.1423187255859375, -0.1309814453125, -0.1196441650390625, -0.108306884765625, -0.0969696044921875, -0.08563232421875, -0.0742950439453125, -0.062957763671875, -0.0516204833984375, -0.040283203125, -0.0289459228515625, -0.017608642578125, -0.0062713623046875, 0.00506591796875, 0.0164031982421875, 0.027740478515625, 0.0390777587890625, 0.0504150390625, 0.0617523193359375, 0.073089599609375, 0.0844268798828125, 0.09576416015625, 0.1071014404296875, 0.118438720703125, 0.1297760009765625, 0.14111328125, 0.1524505615234375, 0.163787841796875, 0.1751251220703125, 0.18646240234375, 0.1977996826171875, 0.209136962890625, 0.2204742431640625, 0.2318115234375, 0.2431488037109375, 0.254486083984375, 0.2658233642578125, 0.27716064453125, 0.2884979248046875, 0.299835205078125, 0.3111724853515625, 0.322509765625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 1.0, 5.0, 5.0, 2.0, 7.0, 13.0, 9.0, 14.0, 12.0, 13.0, 148.0, 648.0, 18.0, 10.0, 20.0, 9.0, 12.0, 6.0, 7.0, 6.0, 3.0, 6.0, 0.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.283203125, -0.2753429412841797, -0.2674827575683594, -0.25962257385253906, -0.25176239013671875, -0.24390220642089844, -0.23604202270507812, -0.2281818389892578, -0.2203216552734375, -0.2124614715576172, -0.20460128784179688, -0.19674110412597656, -0.18888092041015625, -0.18102073669433594, -0.17316055297851562, -0.1653003692626953, -0.157440185546875, -0.1495800018310547, -0.14171981811523438, -0.13385963439941406, -0.12599945068359375, -0.11813926696777344, -0.11027908325195312, -0.10241889953613281, -0.0945587158203125, -0.08669853210449219, -0.07883834838867188, -0.07097816467285156, -0.06311798095703125, -0.05525779724121094, -0.047397613525390625, -0.03953742980957031, -0.03167724609375, -0.023817062377929688, -0.015956878662109375, -0.008096694946289062, -0.00023651123046875, 0.0076236724853515625, 0.015483856201171875, 0.023344039916992188, 0.0312042236328125, 0.03906440734863281, 0.046924591064453125, 0.05478477478027344, 0.06264495849609375, 0.07050514221191406, 0.07836532592773438, 0.08622550964355469, 0.094085693359375, 0.10194587707519531, 0.10980606079101562, 0.11766624450683594, 0.12552642822265625, 0.13338661193847656, 0.14124679565429688, 0.1491069793701172, 0.1569671630859375, 0.1648273468017578, 0.17268753051757812, 0.18054771423339844, 0.18840789794921875, 0.19626808166503906, 0.20412826538085938, 0.2119884490966797, 0.2198486328125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 9.0, 6.0, 13.0, 14.0, 18.0, 15.0, 43.0, 38.0, 63.0, 92.0, 126.0, 225.0, 371.0, 741.0, 1474.0, 3397.0, 10685.0, 58401.0, 3940914.0, 153768.0, 16145.0, 4424.0, 1736.0, 733.0, 335.0, 216.0, 89.0, 63.0, 33.0, 28.0, 18.0, 9.0, 13.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.461669921875, -0.447540283203125, -0.43341064453125, -0.419281005859375, -0.4051513671875, -0.391021728515625, -0.37689208984375, -0.362762451171875, -0.3486328125, -0.334503173828125, -0.32037353515625, -0.306243896484375, -0.2921142578125, -0.277984619140625, -0.26385498046875, -0.249725341796875, -0.235595703125, -0.221466064453125, -0.20733642578125, -0.193206787109375, -0.1790771484375, -0.164947509765625, -0.15081787109375, -0.136688232421875, -0.12255859375, -0.108428955078125, -0.09429931640625, -0.080169677734375, -0.0660400390625, -0.051910400390625, -0.03778076171875, -0.023651123046875, -0.009521484375, 0.004608154296875, 0.01873779296875, 0.032867431640625, 0.0469970703125, 0.061126708984375, 0.07525634765625, 0.089385986328125, 0.103515625, 0.117645263671875, 0.13177490234375, 0.145904541015625, 0.1600341796875, 0.174163818359375, 0.18829345703125, 0.202423095703125, 0.216552734375, 0.230682373046875, 0.24481201171875, 0.258941650390625, 0.2730712890625, 0.287200927734375, 0.30133056640625, 0.315460205078125, 0.32958984375, 0.343719482421875, 0.35784912109375, 0.371978759765625, 0.3861083984375, 0.400238037109375, 0.41436767578125, 0.428497314453125, 0.442626953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 6.0, 8.0, 12.0, 13.0, 22.0, 22.0, 35.0, 51.0, 119.0, 428.0, 2087.0, 891.0, 201.0, 54.0, 36.0, 23.0, 16.0, 13.0, 9.0, 5.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.323486328125, -0.31572723388671875, -0.3079681396484375, -0.30020904541015625, -0.292449951171875, -0.28469085693359375, -0.2769317626953125, -0.26917266845703125, -0.26141357421875, -0.25365447998046875, -0.2458953857421875, -0.23813629150390625, -0.230377197265625, -0.22261810302734375, -0.2148590087890625, -0.20709991455078125, -0.1993408203125, -0.19158172607421875, -0.1838226318359375, -0.17606353759765625, -0.168304443359375, -0.16054534912109375, -0.1527862548828125, -0.14502716064453125, -0.13726806640625, -0.12950897216796875, -0.1217498779296875, -0.11399078369140625, -0.106231689453125, -0.09847259521484375, -0.0907135009765625, -0.08295440673828125, -0.0751953125, -0.06743621826171875, -0.0596771240234375, -0.05191802978515625, -0.044158935546875, -0.03639984130859375, -0.0286407470703125, -0.02088165283203125, -0.01312255859375, -0.00536346435546875, 0.0023956298828125, 0.01015472412109375, 0.017913818359375, 0.02567291259765625, 0.0334320068359375, 0.04119110107421875, 0.0489501953125, 0.05670928955078125, 0.0644683837890625, 0.07222747802734375, 0.079986572265625, 0.08774566650390625, 0.0955047607421875, 0.10326385498046875, 0.11102294921875, 0.11878204345703125, 0.1265411376953125, 0.13430023193359375, 0.142059326171875, 0.14981842041015625, 0.1575775146484375, 0.16533660888671875, 0.173095703125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 10.0, 22.0, 80.0, 282.0, 448.0, 110.0, 21.0, 6.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3055990934371948, -1.2664577960968018, -1.2273164987564087, -1.1881752014160156, -1.1490339040756226, -1.1098926067352295, -1.0707513093948364, -1.0316100120544434, -0.9924687147140503, -0.9533274173736572, -0.9141861200332642, -0.8750448226928711, -0.835903525352478, -0.796762228012085, -0.7576209306716919, -0.7184796333312988, -0.6793383359909058, -0.6401970386505127, -0.6010557413101196, -0.5619144439697266, -0.5227731466293335, -0.48363184928894043, -0.44449055194854736, -0.4053492546081543, -0.36620795726776123, -0.32706665992736816, -0.2879253625869751, -0.24878406524658203, -0.20964276790618896, -0.1705014705657959, -0.13136017322540283, -0.09221887588500977, -0.05307745933532715, -0.013936161994934082, 0.025205135345458984, 0.06434643268585205, 0.10348773002624512, 0.14262902736663818, 0.18177032470703125, 0.22091162204742432, 0.2600529193878174, 0.29919421672821045, 0.3383355140686035, 0.3774768114089966, 0.41661810874938965, 0.4557594060897827, 0.4949007034301758, 0.5340420007705688, 0.5731832981109619, 0.612324595451355, 0.651465892791748, 0.6906071901321411, 0.7297484874725342, 0.7688897848129272, 0.8080310821533203, 0.8471723794937134, 0.8863136768341064, 0.9254549741744995, 0.9645962715148926, 1.0037375688552856, 1.0428788661956787, 1.0820201635360718, 1.1211614608764648, 1.160302758216858, 1.199444055557251]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 6.0, 11.0, 17.0, 25.0, 25.0, 29.0, 44.0, 48.0, 43.0, 51.0, 67.0, 69.0, 70.0, 66.0, 79.0, 72.0, 58.0, 37.0, 35.0, 27.0, 29.0, 26.0, 16.0, 10.0, 8.0, 7.0, 3.0, 3.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6217141151428223, -0.5980504751205444, -0.5743868350982666, -0.5507232546806335, -0.5270596146583557, -0.5033959746360779, -0.47973233461380005, -0.4560687243938446, -0.43240511417388916, -0.40874147415161133, -0.3850778639316559, -0.36141422390937805, -0.3377506136894226, -0.3140869736671448, -0.29042333364486694, -0.2667597234249115, -0.24309608340263367, -0.21943245828151703, -0.1957688331604004, -0.17210519313812256, -0.14844158291816711, -0.12477795034646988, -0.10111431777477264, -0.077450692653656, -0.05378706753253937, -0.03012344054877758, -0.006459813565015793, 0.017203815281391144, 0.04086744040250778, 0.06453106552362442, 0.08819469809532166, 0.1118583232164383, 0.13552194833755493, 0.15918557345867157, 0.1828491985797882, 0.20651283860206604, 0.23017644882202148, 0.2538400888442993, 0.27750372886657715, 0.3011673390865326, 0.32483094930648804, 0.34849458932876587, 0.3721581995487213, 0.39582183957099915, 0.4194854497909546, 0.4431490898132324, 0.46681272983551025, 0.4904763400554657, 0.5141400098800659, 0.5378036499023438, 0.5614672899246216, 0.5851308703422546, 0.6087945103645325, 0.6324581503868103, 0.6561217904090881, 0.6797853708267212, 0.703449010848999, 0.7271126508712769, 0.7507762908935547, 0.7744398713111877, 0.7981035113334656, 0.8217671513557434, 0.8454307913780212, 0.8690943717956543, 0.8927580118179321]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 9.0, 9.0, 15.0, 13.0, 23.0, 33.0, 34.0, 59.0, 85.0, 107.0, 168.0, 219.0, 318.0, 516.0, 719.0, 1047.0, 1613.0, 2559.0, 4126.0, 7082.0, 14318.0, 33588.0, 885583.0, 53723.0, 19386.0, 9263.0, 5119.0, 3016.0, 1934.0, 1214.0, 815.0, 534.0, 381.0, 274.0, 182.0, 131.0, 95.0, 68.0, 55.0, 33.0, 24.0, 13.0, 19.0, 7.0, 6.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.095703125, -1.058807373046875, -1.02191162109375, -0.985015869140625, -0.9481201171875, -0.911224365234375, -0.87432861328125, -0.837432861328125, -0.800537109375, -0.763641357421875, -0.72674560546875, -0.689849853515625, -0.6529541015625, -0.616058349609375, -0.57916259765625, -0.542266845703125, -0.50537109375, -0.468475341796875, -0.43157958984375, -0.394683837890625, -0.3577880859375, -0.320892333984375, -0.28399658203125, -0.247100830078125, -0.210205078125, -0.173309326171875, -0.13641357421875, -0.099517822265625, -0.0626220703125, -0.025726318359375, 0.01116943359375, 0.048065185546875, 0.0849609375, 0.121856689453125, 0.15875244140625, 0.195648193359375, 0.2325439453125, 0.269439697265625, 0.30633544921875, 0.343231201171875, 0.380126953125, 0.417022705078125, 0.45391845703125, 0.490814208984375, 0.5277099609375, 0.564605712890625, 0.60150146484375, 0.638397216796875, 0.67529296875, 0.712188720703125, 0.74908447265625, 0.785980224609375, 0.8228759765625, 0.859771728515625, 0.89666748046875, 0.933563232421875, 0.970458984375, 1.007354736328125, 1.04425048828125, 1.081146240234375, 1.1180419921875, 1.154937744140625, 1.19183349609375, 1.228729248046875, 1.265625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 3.0, 2.0, 4.0, 0.0, 5.0, 1.0, 6.0, 4.0, 3.0, 9.0, 11.0, 11.0, 14.0, 11.0, 18.0, 593.0, 201.0, 15.0, 14.0, 14.0, 11.0, 14.0, 4.0, 7.0, 3.0, 6.0, 4.0, 0.0, 6.0, 3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.277587890625, -0.26983642578125, -0.2620849609375, -0.25433349609375, -0.24658203125, -0.23883056640625, -0.2310791015625, -0.22332763671875, -0.215576171875, -0.20782470703125, -0.2000732421875, -0.19232177734375, -0.1845703125, -0.17681884765625, -0.1690673828125, -0.16131591796875, -0.153564453125, -0.14581298828125, -0.1380615234375, -0.13031005859375, -0.12255859375, -0.11480712890625, -0.1070556640625, -0.09930419921875, -0.091552734375, -0.08380126953125, -0.0760498046875, -0.06829833984375, -0.060546875, -0.05279541015625, -0.0450439453125, -0.03729248046875, -0.029541015625, -0.02178955078125, -0.0140380859375, -0.00628662109375, 0.00146484375, 0.00921630859375, 0.0169677734375, 0.02471923828125, 0.032470703125, 0.04022216796875, 0.0479736328125, 0.05572509765625, 0.0634765625, 0.07122802734375, 0.0789794921875, 0.08673095703125, 0.094482421875, 0.10223388671875, 0.1099853515625, 0.11773681640625, 0.12548828125, 0.13323974609375, 0.1409912109375, 0.14874267578125, 0.156494140625, 0.16424560546875, 0.1719970703125, 0.17974853515625, 0.1875, 0.19525146484375, 0.2030029296875, 0.21075439453125, 0.218505859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 7.0, 7.0, 7.0, 5.0, 6.0, 10.0, 18.0, 21.0, 32.0, 24.0, 39.0, 60.0, 59.0, 97.0, 125.0, 152.0, 226.0, 350.0, 501.0, 906.0, 1562.0, 3143.0, 6368.0, 14731.0, 38512.0, 128966.0, 482791.0, 261562.0, 66057.0, 22770.0, 9490.0, 4484.0, 2116.0, 1172.0, 702.0, 440.0, 264.0, 181.0, 150.0, 98.0, 72.0, 70.0, 29.0, 31.0, 41.0, 22.0, 20.0, 18.0, 17.0, 9.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.50439453125, -0.48743438720703125, -0.4704742431640625, -0.45351409912109375, -0.436553955078125, -0.41959381103515625, -0.4026336669921875, -0.38567352294921875, -0.36871337890625, -0.35175323486328125, -0.3347930908203125, -0.31783294677734375, -0.300872802734375, -0.28391265869140625, -0.2669525146484375, -0.24999237060546875, -0.2330322265625, -0.21607208251953125, -0.1991119384765625, -0.18215179443359375, -0.165191650390625, -0.14823150634765625, -0.1312713623046875, -0.11431121826171875, -0.09735107421875, -0.08039093017578125, -0.0634307861328125, -0.04647064208984375, -0.029510498046875, -0.01255035400390625, 0.0044097900390625, 0.02136993408203125, 0.038330078125, 0.05529022216796875, 0.0722503662109375, 0.08921051025390625, 0.106170654296875, 0.12313079833984375, 0.1400909423828125, 0.15705108642578125, 0.17401123046875, 0.19097137451171875, 0.2079315185546875, 0.22489166259765625, 0.241851806640625, 0.25881195068359375, 0.2757720947265625, 0.29273223876953125, 0.3096923828125, 0.32665252685546875, 0.3436126708984375, 0.36057281494140625, 0.377532958984375, 0.39449310302734375, 0.4114532470703125, 0.42841339111328125, 0.44537353515625, 0.46233367919921875, 0.4792938232421875, 0.49625396728515625, 0.513214111328125, 0.5301742553710938, 0.5471343994140625, 0.5640945434570312, 0.5810546875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 8.0, 3.0, 4.0, 10.0, 11.0, 10.0, 16.0, 16.0, 15.0, 25.0, 21.0, 29.0, 29.0, 30.0, 34.0, 42.0, 38.0, 31.0, 40.0, 32.0, 27.0, 32.0, 34.0, 37.0, 44.0, 38.0, 31.0, 28.0, 34.0, 30.0, 30.0, 24.0, 28.0, 16.0, 24.0, 21.0, 7.0, 13.0, 9.0, 8.0, 5.0, 9.0, 9.0, 4.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.69775390625, -0.6742095947265625, -0.650665283203125, -0.6271209716796875, -0.60357666015625, -0.5800323486328125, -0.556488037109375, -0.5329437255859375, -0.5093994140625, -0.4858551025390625, -0.462310791015625, -0.4387664794921875, -0.41522216796875, -0.3916778564453125, -0.368133544921875, -0.3445892333984375, -0.321044921875, -0.2975006103515625, -0.273956298828125, -0.2504119873046875, -0.22686767578125, -0.2033233642578125, -0.179779052734375, -0.1562347412109375, -0.1326904296875, -0.1091461181640625, -0.085601806640625, -0.0620574951171875, -0.03851318359375, -0.0149688720703125, 0.008575439453125, 0.0321197509765625, 0.0556640625, 0.0792083740234375, 0.102752685546875, 0.1262969970703125, 0.14984130859375, 0.1733856201171875, 0.196929931640625, 0.2204742431640625, 0.2440185546875, 0.2675628662109375, 0.291107177734375, 0.3146514892578125, 0.33819580078125, 0.3617401123046875, 0.385284423828125, 0.4088287353515625, 0.432373046875, 0.4559173583984375, 0.479461669921875, 0.5030059814453125, 0.52655029296875, 0.5500946044921875, 0.573638916015625, 0.5971832275390625, 0.6207275390625, 0.6442718505859375, 0.667816162109375, 0.6913604736328125, 0.71490478515625, 0.7384490966796875, 0.761993408203125, 0.7855377197265625, 0.80908203125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 9.0, 11.0, 23.0, 40.0, 63.0, 147.0, 505.0, 4221.0, 1027217.0, 15149.0, 801.0, 222.0, 65.0, 32.0, 15.0, 15.0, 7.0, 5.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.25, -2.1972503662109375, -2.144500732421875, -2.0917510986328125, -2.03900146484375, -1.9862518310546875, -1.933502197265625, -1.8807525634765625, -1.8280029296875, -1.7752532958984375, -1.722503662109375, -1.6697540283203125, -1.61700439453125, -1.5642547607421875, -1.511505126953125, -1.4587554931640625, -1.406005859375, -1.3532562255859375, -1.300506591796875, -1.2477569580078125, -1.19500732421875, -1.1422576904296875, -1.089508056640625, -1.0367584228515625, -0.9840087890625, -0.9312591552734375, -0.878509521484375, -0.8257598876953125, -0.77301025390625, -0.7202606201171875, -0.667510986328125, -0.6147613525390625, -0.56201171875, -0.5092620849609375, -0.456512451171875, -0.4037628173828125, -0.35101318359375, -0.2982635498046875, -0.245513916015625, -0.1927642822265625, -0.1400146484375, -0.0872650146484375, -0.034515380859375, 0.0182342529296875, 0.07098388671875, 0.1237335205078125, 0.176483154296875, 0.2292327880859375, 0.281982421875, 0.3347320556640625, 0.387481689453125, 0.4402313232421875, 0.49298095703125, 0.5457305908203125, 0.598480224609375, 0.6512298583984375, 0.7039794921875, 0.7567291259765625, 0.809478759765625, 0.8622283935546875, 0.91497802734375, 0.9677276611328125, 1.020477294921875, 1.0732269287109375, 1.1259765625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 7.0, 5.0, 6.0, 14.0, 28.0, 43.0, 73.0, 83.0, 103.0, 112.0, 103.0, 113.0, 93.0, 50.0, 49.0, 32.0, 23.0, 13.0, 11.0, 13.0, 7.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.568960189819336e-05, -2.5013461709022522e-05, -2.4337321519851685e-05, -2.3661181330680847e-05, -2.298504114151001e-05, -2.2308900952339172e-05, -2.1632760763168335e-05, -2.0956620573997498e-05, -2.028048038482666e-05, -1.9604340195655823e-05, -1.8928200006484985e-05, -1.8252059817314148e-05, -1.757591962814331e-05, -1.6899779438972473e-05, -1.6223639249801636e-05, -1.55474990606308e-05, -1.4871358871459961e-05, -1.4195218682289124e-05, -1.3519078493118286e-05, -1.2842938303947449e-05, -1.2166798114776611e-05, -1.1490657925605774e-05, -1.0814517736434937e-05, -1.0138377547264099e-05, -9.462237358093262e-06, -8.786097168922424e-06, -8.109956979751587e-06, -7.4338167905807495e-06, -6.757676601409912e-06, -6.081536412239075e-06, -5.405396223068237e-06, -4.7292560338974e-06, -4.0531158447265625e-06, -3.376975655555725e-06, -2.7008354663848877e-06, -2.0246952772140503e-06, -1.3485550880432129e-06, -6.724148988723755e-07, 3.725290298461914e-09, 6.798654794692993e-07, 1.3560056686401367e-06, 2.032145857810974e-06, 2.7082860469818115e-06, 3.384426236152649e-06, 4.060566425323486e-06, 4.736706614494324e-06, 5.412846803665161e-06, 6.0889869928359985e-06, 6.765127182006836e-06, 7.441267371177673e-06, 8.11740756034851e-06, 8.793547749519348e-06, 9.469687938690186e-06, 1.0145828127861023e-05, 1.082196831703186e-05, 1.1498108506202698e-05, 1.2174248695373535e-05, 1.2850388884544373e-05, 1.352652907371521e-05, 1.4202669262886047e-05, 1.4878809452056885e-05, 1.5554949641227722e-05, 1.623108983039856e-05, 1.6907230019569397e-05, 1.7583370208740234e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 9.0, 14.0, 24.0, 23.0, 54.0, 78.0, 160.0, 534.0, 2064.0, 28692.0, 997232.0, 17349.0, 1604.0, 393.0, 151.0, 70.0, 43.0, 29.0, 13.0, 11.0, 6.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1904296875, -1.1609878540039062, -1.1315460205078125, -1.1021041870117188, -1.072662353515625, -1.0432205200195312, -1.0137786865234375, -0.9843368530273438, -0.95489501953125, -0.9254531860351562, -0.8960113525390625, -0.8665695190429688, -0.837127685546875, -0.8076858520507812, -0.7782440185546875, -0.7488021850585938, -0.7193603515625, -0.6899185180664062, -0.6604766845703125, -0.6310348510742188, -0.601593017578125, -0.5721511840820312, -0.5427093505859375, -0.5132675170898438, -0.48382568359375, -0.45438385009765625, -0.4249420166015625, -0.39550018310546875, -0.366058349609375, -0.33661651611328125, -0.3071746826171875, -0.27773284912109375, -0.248291015625, -0.21884918212890625, -0.1894073486328125, -0.15996551513671875, -0.130523681640625, -0.10108184814453125, -0.0716400146484375, -0.04219818115234375, -0.01275634765625, 0.01668548583984375, 0.0461273193359375, 0.07556915283203125, 0.105010986328125, 0.13445281982421875, 0.1638946533203125, 0.19333648681640625, 0.2227783203125, 0.25222015380859375, 0.2816619873046875, 0.31110382080078125, 0.340545654296875, 0.36998748779296875, 0.3994293212890625, 0.42887115478515625, 0.45831298828125, 0.48775482177734375, 0.5171966552734375, 0.5466384887695312, 0.576080322265625, 0.6055221557617188, 0.6349639892578125, 0.6644058227539062, 0.69384765625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 6.0, 5.0, 16.0, 33.0, 42.0, 92.0, 182.0, 268.0, 170.0, 83.0, 55.0, 21.0, 15.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.060546875, -1.0336685180664062, -1.0067901611328125, -0.9799118041992188, -0.953033447265625, -0.9261550903320312, -0.8992767333984375, -0.8723983764648438, -0.84552001953125, -0.8186416625976562, -0.7917633056640625, -0.7648849487304688, -0.738006591796875, -0.7111282348632812, -0.6842498779296875, -0.6573715209960938, -0.6304931640625, -0.6036148071289062, -0.5767364501953125, -0.5498580932617188, -0.522979736328125, -0.49610137939453125, -0.4692230224609375, -0.44234466552734375, -0.41546630859375, -0.38858795166015625, -0.3617095947265625, -0.33483123779296875, -0.307952880859375, -0.28107452392578125, -0.2541961669921875, -0.22731781005859375, -0.200439453125, -0.17356109619140625, -0.1466827392578125, -0.11980438232421875, -0.092926025390625, -0.06604766845703125, -0.0391693115234375, -0.01229095458984375, 0.01458740234375, 0.04146575927734375, 0.0683441162109375, 0.09522247314453125, 0.122100830078125, 0.14897918701171875, 0.1758575439453125, 0.20273590087890625, 0.2296142578125, 0.25649261474609375, 0.2833709716796875, 0.31024932861328125, 0.337127685546875, 0.36400604248046875, 0.3908843994140625, 0.41776275634765625, 0.44464111328125, 0.47151947021484375, 0.4983978271484375, 0.5252761840820312, 0.552154541015625, 0.5790328979492188, 0.6059112548828125, 0.6327896118164062, 0.65966796875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 9.0, 46.0, 366.0, 501.0, 55.0, 17.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.407510757446289, -13.690621376037598, -12.973732948303223, -12.256843566894531, -11.539955139160156, -10.823065757751465, -10.106176376342773, -9.389287948608398, -8.672398567199707, -7.955509662628174, -7.238620758056641, -6.521731376647949, -5.804842472076416, -5.087953567504883, -4.371064186096191, -3.654175281524658, -2.937286376953125, -2.220397472381592, -1.5035083293914795, -0.7866191864013672, -0.06973028182983398, 0.6471586227416992, 1.3640480041503906, 2.080936908721924, 2.797825813293457, 3.5147147178649902, 4.231603622436523, 4.948493003845215, 5.665381908416748, 6.382270812988281, 7.099160194396973, 7.816049098968506, 8.532936096191406, 9.249825477600098, 9.966713905334473, 10.683603286743164, 11.400491714477539, 12.11738109588623, 12.834270477294922, 13.551158905029297, 14.268048286437988, 14.98493766784668, 15.701826095581055, 16.418716430664062, 17.135604858398438, 17.852493286132812, 18.569381713867188, 19.286272048950195, 20.00316047668457, 20.720048904418945, 21.436939239501953, 22.153827667236328, 22.870716094970703, 23.587604522705078, 24.304494857788086, 25.02138328552246, 25.73827362060547, 26.455162048339844, 27.17205238342285, 27.888940811157227, 28.6058292388916, 29.32271957397461, 30.039608001708984, 30.75649642944336, 31.473384857177734]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 8.0, 7.0, 8.0, 7.0, 19.0, 14.0, 36.0, 42.0, 73.0, 133.0, 137.0, 164.0, 124.0, 82.0, 51.0, 25.0, 15.0, 11.0, 10.0, 6.0, 6.0, 7.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.19681739807129, -16.58119773864746, -15.96557903289795, -15.349960327148438, -14.73434066772461, -14.118721961975098, -13.503103256225586, -12.887483596801758, -12.27186393737793, -11.656245231628418, -11.04062557220459, -10.425006866455078, -9.80938720703125, -9.193768501281738, -8.578149795532227, -7.962530136108398, -7.346911430358887, -6.731292247772217, -6.115673065185547, -5.500054359436035, -4.884434700012207, -4.268815994262695, -3.6531968116760254, -3.0375776290893555, -2.4219584465026855, -1.8063392639160156, -1.1907202005386353, -0.5751011371612549, 0.04051804542541504, 0.656137228012085, 1.2717561721801758, 1.8873753547668457, 2.5029945373535156, 3.1186137199401855, 3.7342329025268555, 4.349851608276367, 4.965471267700195, 5.581089973449707, 6.196709156036377, 6.812328338623047, 7.427947521209717, 8.043566703796387, 8.659185409545898, 9.274805068969727, 9.890423774719238, 10.506043434143066, 11.121662139892578, 11.737281799316406, 12.352900505065918, 12.96851921081543, 13.584138870239258, 14.19975757598877, 14.815377235412598, 15.43099594116211, 16.046615600585938, 16.662235260009766, 17.27785301208496, 17.89347267150879, 18.509090423583984, 19.124710083007812, 19.74032974243164, 20.35594940185547, 20.971567153930664, 21.587186813354492, 22.20280647277832]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 7.0, 3.0, 7.0, 12.0, 9.0, 14.0, 26.0, 20.0, 16.0, 39.0, 42.0, 56.0, 77.0, 105.0, 170.0, 248.0, 330.0, 523.0, 871.0, 1481.0, 2614.0, 5366.0, 12591.0, 42075.0, 3847089.0, 239244.0, 24718.0, 8500.0, 3727.0, 1874.0, 1039.0, 542.0, 325.0, 209.0, 132.0, 62.0, 46.0, 19.0, 22.0, 14.0, 11.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6796875, -1.635284423828125, -1.59088134765625, -1.546478271484375, -1.5020751953125, -1.457672119140625, -1.41326904296875, -1.368865966796875, -1.324462890625, -1.280059814453125, -1.23565673828125, -1.191253662109375, -1.1468505859375, -1.102447509765625, -1.05804443359375, -1.013641357421875, -0.96923828125, -0.924835205078125, -0.88043212890625, -0.836029052734375, -0.7916259765625, -0.747222900390625, -0.70281982421875, -0.658416748046875, -0.614013671875, -0.569610595703125, -0.52520751953125, -0.480804443359375, -0.4364013671875, -0.391998291015625, -0.34759521484375, -0.303192138671875, -0.2587890625, -0.214385986328125, -0.16998291015625, -0.125579833984375, -0.0811767578125, -0.036773681640625, 0.00762939453125, 0.052032470703125, 0.096435546875, 0.140838623046875, 0.18524169921875, 0.229644775390625, 0.2740478515625, 0.318450927734375, 0.36285400390625, 0.407257080078125, 0.45166015625, 0.496063232421875, 0.54046630859375, 0.584869384765625, 0.6292724609375, 0.673675537109375, 0.71807861328125, 0.762481689453125, 0.806884765625, 0.851287841796875, 0.89569091796875, 0.940093994140625, 0.9844970703125, 1.028900146484375, 1.07330322265625, 1.117706298828125, 1.162109375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 11.0, 5.0, 5.0, 14.0, 11.0, 9.0, 12.0, 47.0, 312.0, 400.0, 57.0, 23.0, 14.0, 7.0, 10.0, 7.0, 12.0, 4.0, 5.0, 2.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.2511253356933594, -0.24468231201171875, -0.23823928833007812, -0.2317962646484375, -0.22535324096679688, -0.21891021728515625, -0.21246719360351562, -0.206024169921875, -0.19958114624023438, -0.19313812255859375, -0.18669509887695312, -0.1802520751953125, -0.17380905151367188, -0.16736602783203125, -0.16092300415039062, -0.15447998046875, -0.14803695678710938, -0.14159393310546875, -0.13515090942382812, -0.1287078857421875, -0.12226486206054688, -0.11582183837890625, -0.10937881469726562, -0.102935791015625, -0.09649276733398438, -0.09004974365234375, -0.08360671997070312, -0.0771636962890625, -0.07072067260742188, -0.06427764892578125, -0.057834625244140625, -0.0513916015625, -0.044948577880859375, -0.03850555419921875, -0.032062530517578125, -0.0256195068359375, -0.019176483154296875, -0.01273345947265625, -0.006290435791015625, 0.000152587890625, 0.006595611572265625, 0.01303863525390625, 0.019481658935546875, 0.0259246826171875, 0.032367706298828125, 0.03881072998046875, 0.045253753662109375, 0.05169677734375, 0.058139801025390625, 0.06458282470703125, 0.07102584838867188, 0.0774688720703125, 0.08391189575195312, 0.09035491943359375, 0.09679794311523438, 0.103240966796875, 0.10968399047851562, 0.11612701416015625, 0.12257003784179688, 0.1290130615234375, 0.13545608520507812, 0.14189910888671875, 0.14834213256835938, 0.15478515625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 10.0, 4.0, 5.0, 16.0, 19.0, 29.0, 37.0, 50.0, 84.0, 134.0, 268.0, 519.0, 1272.0, 3357.0, 12609.0, 68390.0, 3533231.0, 523532.0, 38475.0, 7904.0, 2421.0, 922.0, 385.0, 195.0, 108.0, 87.0, 58.0, 41.0, 31.0, 18.0, 8.0, 17.0, 8.0, 6.0, 10.0, 5.0, 7.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.90673828125, -0.8753128051757812, -0.8438873291015625, -0.8124618530273438, -0.781036376953125, -0.7496109008789062, -0.7181854248046875, -0.6867599487304688, -0.65533447265625, -0.6239089965820312, -0.5924835205078125, -0.5610580444335938, -0.529632568359375, -0.49820709228515625, -0.4667816162109375, -0.43535614013671875, -0.4039306640625, -0.37250518798828125, -0.3410797119140625, -0.30965423583984375, -0.278228759765625, -0.24680328369140625, -0.2153778076171875, -0.18395233154296875, -0.15252685546875, -0.12110137939453125, -0.0896759033203125, -0.05825042724609375, -0.026824951171875, 0.00460052490234375, 0.0360260009765625, 0.06745147705078125, 0.098876953125, 0.13030242919921875, 0.1617279052734375, 0.19315338134765625, 0.224578857421875, 0.25600433349609375, 0.2874298095703125, 0.31885528564453125, 0.35028076171875, 0.38170623779296875, 0.4131317138671875, 0.44455718994140625, 0.475982666015625, 0.5074081420898438, 0.5388336181640625, 0.5702590942382812, 0.6016845703125, 0.6331100463867188, 0.6645355224609375, 0.6959609985351562, 0.727386474609375, 0.7588119506835938, 0.7902374267578125, 0.8216629028320312, 0.85308837890625, 0.8845138549804688, 0.9159393310546875, 0.9473648071289062, 0.978790283203125, 1.0102157592773438, 1.0416412353515625, 1.0730667114257812, 1.1044921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 5.0, 18.0, 17.0, 20.0, 25.0, 24.0, 29.0, 41.0, 55.0, 84.0, 147.0, 283.0, 744.0, 1638.0, 386.0, 136.0, 101.0, 68.0, 48.0, 50.0, 29.0, 21.0, 20.0, 19.0, 9.0, 7.0, 4.0, 4.0, 4.0, 10.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1690673828125, -0.16382598876953125, -0.1585845947265625, -0.15334320068359375, -0.148101806640625, -0.14286041259765625, -0.1376190185546875, -0.13237762451171875, -0.12713623046875, -0.12189483642578125, -0.1166534423828125, -0.11141204833984375, -0.106170654296875, -0.10092926025390625, -0.0956878662109375, -0.09044647216796875, -0.085205078125, -0.07996368408203125, -0.0747222900390625, -0.06948089599609375, -0.064239501953125, -0.05899810791015625, -0.0537567138671875, -0.04851531982421875, -0.04327392578125, -0.03803253173828125, -0.0327911376953125, -0.02754974365234375, -0.022308349609375, -0.01706695556640625, -0.0118255615234375, -0.00658416748046875, -0.0013427734375, 0.00389862060546875, 0.0091400146484375, 0.01438140869140625, 0.019622802734375, 0.02486419677734375, 0.0301055908203125, 0.03534698486328125, 0.04058837890625, 0.04582977294921875, 0.0510711669921875, 0.05631256103515625, 0.061553955078125, 0.06679534912109375, 0.0720367431640625, 0.07727813720703125, 0.08251953125, 0.08776092529296875, 0.0930023193359375, 0.09824371337890625, 0.103485107421875, 0.10872650146484375, 0.1139678955078125, 0.11920928955078125, 0.12445068359375, 0.12969207763671875, 0.1349334716796875, 0.14017486572265625, 0.145416259765625, 0.15065765380859375, 0.1558990478515625, 0.16114044189453125, 0.1663818359375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 31.0, 449.0, 494.0, 9.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.35866928100586, -11.14477825164795, -10.930887222290039, -10.716995239257812, -10.503104209899902, -10.289213180541992, -10.075322151184082, -9.861431121826172, -9.647539138793945, -9.433648109436035, -9.219757080078125, -9.005865097045898, -8.791974067687988, -8.578083038330078, -8.364192008972168, -8.150300979614258, -7.936409950256348, -7.7225189208984375, -7.508627414703369, -7.294736385345459, -7.080844879150391, -6.8669538497924805, -6.65306282043457, -6.43917179107666, -6.225280284881592, -6.011389255523682, -5.797497749328613, -5.583606719970703, -5.369715690612793, -5.155824184417725, -4.9419331550598145, -4.728041648864746, -4.514151096343994, -4.300260066986084, -4.086368560791016, -3.8724775314331055, -3.658586263656616, -3.444694995880127, -3.230803966522217, -3.0169126987457275, -2.8030214309692383, -2.589130163192749, -2.3752388954162598, -2.1613478660583496, -1.9474565982818604, -1.733565330505371, -1.5196741819381714, -1.3057830333709717, -1.0918917655944824, -0.8780005574226379, -0.6641093492507935, -0.450218141078949, -0.2363269329071045, -0.022435665130615234, 0.19145548343658447, 0.4053466320037842, 0.6192378997802734, 0.8331291079521179, 1.0470203161239624, 1.260911464691162, 1.4748027324676514, 1.6886940002441406, 1.9025851488113403, 2.11647629737854, 2.3303675651550293]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 2.0, 8.0, 3.0, 10.0, 15.0, 14.0, 21.0, 35.0, 38.0, 52.0, 42.0, 57.0, 73.0, 68.0, 79.0, 78.0, 71.0, 66.0, 65.0, 52.0, 37.0, 29.0, 17.0, 15.0, 13.0, 9.0, 16.0, 4.0, 3.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0885677337646484, -1.0422866344451904, -0.9960055947303772, -0.949724555015564, -0.9034435153007507, -0.8571624755859375, -0.8108813762664795, -0.7646003365516663, -0.718319296836853, -0.6720382571220398, -0.6257571578025818, -0.5794761180877686, -0.5331950783729553, -0.4869140088558197, -0.4406329393386841, -0.39435189962387085, -0.34807080030441284, -0.3017897307872772, -0.255508691072464, -0.20922762155532837, -0.16294656693935394, -0.11666551232337952, -0.0703844428062439, -0.024103403091430664, 0.022177666425704956, 0.06845872104167938, 0.1147397831082344, 0.16102084517478943, 0.20730189979076385, 0.2535829544067383, 0.2998640239238739, 0.34614506363868713, 0.39242613315582275, 0.4387072026729584, 0.4849882423877716, 0.5312693119049072, 0.5775503516197205, 0.6238313913345337, 0.6701124906539917, 0.7163935303688049, 0.7626745700836182, 0.8089556097984314, 0.8552367091178894, 0.9015177488327026, 0.9477987885475159, 0.9940798282623291, 1.040360927581787, 1.0866420269012451, 1.1329231262207031, 1.1792042255401611, 1.2254852056503296, 1.2717663049697876, 1.3180474042892456, 1.364328384399414, 1.410609483718872, 1.45689058303833, 1.5031715631484985, 1.5494526624679565, 1.595733642578125, 1.642014741897583, 1.688295841217041, 1.7345768213272095, 1.7808579206466675, 1.827138900756836, 1.873420000076294]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 2.0, 10.0, 19.0, 25.0, 35.0, 39.0, 61.0, 117.0, 155.0, 283.0, 523.0, 998.0, 2081.0, 4807.0, 12302.0, 46058.0, 883319.0, 71708.0, 15169.0, 5678.0, 2556.0, 1137.0, 570.0, 306.0, 198.0, 128.0, 76.0, 76.0, 28.0, 30.0, 15.0, 14.0, 4.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7265625, -1.6735992431640625, -1.620635986328125, -1.5676727294921875, -1.51470947265625, -1.4617462158203125, -1.408782958984375, -1.3558197021484375, -1.3028564453125, -1.2498931884765625, -1.196929931640625, -1.1439666748046875, -1.09100341796875, -1.0380401611328125, -0.985076904296875, -0.9321136474609375, -0.879150390625, -0.8261871337890625, -0.773223876953125, -0.7202606201171875, -0.66729736328125, -0.6143341064453125, -0.561370849609375, -0.5084075927734375, -0.4554443359375, -0.4024810791015625, -0.349517822265625, -0.2965545654296875, -0.24359130859375, -0.1906280517578125, -0.137664794921875, -0.0847015380859375, -0.03173828125, 0.0212249755859375, 0.074188232421875, 0.1271514892578125, 0.18011474609375, 0.2330780029296875, 0.286041259765625, 0.3390045166015625, 0.3919677734375, 0.4449310302734375, 0.497894287109375, 0.5508575439453125, 0.60382080078125, 0.6567840576171875, 0.709747314453125, 0.7627105712890625, 0.815673828125, 0.8686370849609375, 0.921600341796875, 0.9745635986328125, 1.02752685546875, 1.0804901123046875, 1.133453369140625, 1.1864166259765625, 1.2393798828125, 1.2923431396484375, 1.345306396484375, 1.3982696533203125, 1.45123291015625, 1.5041961669921875, 1.557159423828125, 1.6101226806640625, 1.6630859375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 5.0, 5.0, 4.0, 7.0, 7.0, 12.0, 14.0, 7.0, 24.0, 52.0, 176.0, 321.0, 198.0, 72.0, 17.0, 19.0, 13.0, 7.0, 5.0, 8.0, 6.0, 6.0, 3.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263671875, -0.2573070526123047, -0.2509422302246094, -0.24457740783691406, -0.23821258544921875, -0.23184776306152344, -0.22548294067382812, -0.2191181182861328, -0.2127532958984375, -0.2063884735107422, -0.20002365112304688, -0.19365882873535156, -0.18729400634765625, -0.18092918395996094, -0.17456436157226562, -0.1681995391845703, -0.161834716796875, -0.1554698944091797, -0.14910507202148438, -0.14274024963378906, -0.13637542724609375, -0.13001060485839844, -0.12364578247070312, -0.11728096008300781, -0.1109161376953125, -0.10455131530761719, -0.09818649291992188, -0.09182167053222656, -0.08545684814453125, -0.07909202575683594, -0.07272720336914062, -0.06636238098144531, -0.05999755859375, -0.05363273620605469, -0.047267913818359375, -0.04090309143066406, -0.03453826904296875, -0.028173446655273438, -0.021808624267578125, -0.015443801879882812, -0.0090789794921875, -0.0027141571044921875, 0.003650665283203125, 0.010015487670898438, 0.01638031005859375, 0.022745132446289062, 0.029109954833984375, 0.03547477722167969, 0.041839599609375, 0.04820442199707031, 0.054569244384765625, 0.06093406677246094, 0.06729888916015625, 0.07366371154785156, 0.08002853393554688, 0.08639335632324219, 0.0927581787109375, 0.09912300109863281, 0.10548782348632812, 0.11185264587402344, 0.11821746826171875, 0.12458229064941406, 0.13094711303710938, 0.1373119354248047, 0.1436767578125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 5.0, 6.0, 8.0, 6.0, 11.0, 16.0, 18.0, 14.0, 20.0, 23.0, 25.0, 45.0, 45.0, 68.0, 108.0, 155.0, 249.0, 503.0, 946.0, 2466.0, 8383.0, 35829.0, 233846.0, 632126.0, 106437.0, 19132.0, 4765.0, 1573.0, 701.0, 370.0, 177.0, 143.0, 76.0, 56.0, 37.0, 43.0, 24.0, 22.0, 13.0, 14.0, 13.0, 6.0, 7.0, 3.0, 5.0, 4.0, 4.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.783203125, -0.7581939697265625, -0.733184814453125, -0.7081756591796875, -0.68316650390625, -0.6581573486328125, -0.633148193359375, -0.6081390380859375, -0.5831298828125, -0.5581207275390625, -0.533111572265625, -0.5081024169921875, -0.48309326171875, -0.4580841064453125, -0.433074951171875, -0.4080657958984375, -0.383056640625, -0.3580474853515625, -0.333038330078125, -0.3080291748046875, -0.28302001953125, -0.2580108642578125, -0.233001708984375, -0.2079925537109375, -0.1829833984375, -0.1579742431640625, -0.132965087890625, -0.1079559326171875, -0.08294677734375, -0.0579376220703125, -0.032928466796875, -0.0079193115234375, 0.01708984375, 0.0420989990234375, 0.067108154296875, 0.0921173095703125, 0.11712646484375, 0.1421356201171875, 0.167144775390625, 0.1921539306640625, 0.2171630859375, 0.2421722412109375, 0.267181396484375, 0.2921905517578125, 0.31719970703125, 0.3422088623046875, 0.367218017578125, 0.3922271728515625, 0.417236328125, 0.4422454833984375, 0.467254638671875, 0.4922637939453125, 0.51727294921875, 0.5422821044921875, 0.567291259765625, 0.5923004150390625, 0.6173095703125, 0.6423187255859375, 0.667327880859375, 0.6923370361328125, 0.71734619140625, 0.7423553466796875, 0.767364501953125, 0.7923736572265625, 0.8173828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 4.0, 4.0, 7.0, 6.0, 10.0, 15.0, 11.0, 8.0, 18.0, 11.0, 23.0, 20.0, 20.0, 20.0, 32.0, 25.0, 33.0, 44.0, 32.0, 44.0, 55.0, 32.0, 29.0, 32.0, 43.0, 45.0, 37.0, 31.0, 29.0, 45.0, 28.0, 21.0, 22.0, 19.0, 24.0, 19.0, 19.0, 18.0, 15.0, 11.0, 9.0, 6.0, 4.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.420654296875, -0.4067726135253906, -0.39289093017578125, -0.3790092468261719, -0.3651275634765625, -0.3512458801269531, -0.33736419677734375, -0.3234825134277344, -0.309600830078125, -0.2957191467285156, -0.28183746337890625, -0.2679557800292969, -0.2540740966796875, -0.24019241333007812, -0.22631072998046875, -0.21242904663085938, -0.19854736328125, -0.18466567993164062, -0.17078399658203125, -0.15690231323242188, -0.1430206298828125, -0.12913894653320312, -0.11525726318359375, -0.10137557983398438, -0.087493896484375, -0.07361221313476562, -0.05973052978515625, -0.045848846435546875, -0.0319671630859375, -0.018085479736328125, -0.00420379638671875, 0.009677886962890625, 0.0235595703125, 0.037441253662109375, 0.05132293701171875, 0.06520462036132812, 0.0790863037109375, 0.09296798706054688, 0.10684967041015625, 0.12073135375976562, 0.134613037109375, 0.14849472045898438, 0.16237640380859375, 0.17625808715820312, 0.1901397705078125, 0.20402145385742188, 0.21790313720703125, 0.23178482055664062, 0.24566650390625, 0.2595481872558594, 0.27342987060546875, 0.2873115539550781, 0.3011932373046875, 0.3150749206542969, 0.32895660400390625, 0.3428382873535156, 0.356719970703125, 0.3706016540527344, 0.38448333740234375, 0.3983650207519531, 0.4122467041015625, 0.4261283874511719, 0.44001007080078125, 0.4538917541503906, 0.4677734375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 11.0, 21.0, 40.0, 78.0, 191.0, 484.0, 2750.0, 876621.0, 165636.0, 2021.0, 377.0, 143.0, 69.0, 43.0, 18.0, 9.0, 13.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.921875, -2.8553619384765625, -2.788848876953125, -2.7223358154296875, -2.65582275390625, -2.5893096923828125, -2.522796630859375, -2.4562835693359375, -2.3897705078125, -2.3232574462890625, -2.256744384765625, -2.1902313232421875, -2.12371826171875, -2.0572052001953125, -1.990692138671875, -1.9241790771484375, -1.857666015625, -1.7911529541015625, -1.724639892578125, -1.6581268310546875, -1.59161376953125, -1.5251007080078125, -1.458587646484375, -1.3920745849609375, -1.3255615234375, -1.2590484619140625, -1.192535400390625, -1.1260223388671875, -1.05950927734375, -0.9929962158203125, -0.926483154296875, -0.8599700927734375, -0.79345703125, -0.7269439697265625, -0.660430908203125, -0.5939178466796875, -0.52740478515625, -0.4608917236328125, -0.394378662109375, -0.3278656005859375, -0.2613525390625, -0.1948394775390625, -0.128326416015625, -0.0618133544921875, 0.00469970703125, 0.0712127685546875, 0.137725830078125, 0.2042388916015625, 0.270751953125, 0.3372650146484375, 0.403778076171875, 0.4702911376953125, 0.53680419921875, 0.6033172607421875, 0.669830322265625, 0.7363433837890625, 0.8028564453125, 0.8693695068359375, 0.935882568359375, 1.0023956298828125, 1.06890869140625, 1.1354217529296875, 1.201934814453125, 1.2684478759765625, 1.3349609375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 3.0, 11.0, 8.0, 19.0, 44.0, 179.0, 347.0, 241.0, 70.0, 21.0, 14.0, 8.0, 8.0, 1.0, 3.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00010085105895996094, -9.755697101354599e-05, -9.426288306713104e-05, -9.09687951207161e-05, -8.767470717430115e-05, -8.43806192278862e-05, -8.108653128147125e-05, -7.77924433350563e-05, -7.449835538864136e-05, -7.120426744222641e-05, -6.791017949581146e-05, -6.461609154939651e-05, -6.132200360298157e-05, -5.802791565656662e-05, -5.473382771015167e-05, -5.1439739763736725e-05, -4.814565181732178e-05, -4.485156387090683e-05, -4.155747592449188e-05, -3.8263387978076935e-05, -3.496930003166199e-05, -3.167521208524704e-05, -2.8381124138832092e-05, -2.5087036192417145e-05, -2.1792948246002197e-05, -1.849886029958725e-05, -1.5204772353172302e-05, -1.1910684406757355e-05, -8.616596460342407e-06, -5.32250851392746e-06, -2.028420567512512e-06, 1.2656673789024353e-06, 4.559755325317383e-06, 7.85384327173233e-06, 1.1147931218147278e-05, 1.4442019164562225e-05, 1.7736107110977173e-05, 2.103019505739212e-05, 2.4324283003807068e-05, 2.7618370950222015e-05, 3.091245889663696e-05, 3.420654684305191e-05, 3.750063478946686e-05, 4.0794722735881805e-05, 4.408881068229675e-05, 4.73828986287117e-05, 5.067698657512665e-05, 5.3971074521541595e-05, 5.726516246795654e-05, 6.055925041437149e-05, 6.385333836078644e-05, 6.714742630720139e-05, 7.044151425361633e-05, 7.373560220003128e-05, 7.702969014644623e-05, 8.032377809286118e-05, 8.361786603927612e-05, 8.691195398569107e-05, 9.020604193210602e-05, 9.350012987852097e-05, 9.679421782493591e-05, 0.00010008830577135086, 0.00010338239371776581, 0.00010667648166418076, 0.0001099705696105957]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 20.0, 38.0, 69.0, 156.0, 340.0, 1309.0, 36790.0, 1005385.0, 3802.0, 419.0, 122.0, 48.0, 16.0, 16.0, 10.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.0859375, -3.0206298828125, -2.955322265625, -2.8900146484375, -2.82470703125, -2.7593994140625, -2.694091796875, -2.6287841796875, -2.5634765625, -2.4981689453125, -2.432861328125, -2.3675537109375, -2.30224609375, -2.2369384765625, -2.171630859375, -2.1063232421875, -2.041015625, -1.9757080078125, -1.910400390625, -1.8450927734375, -1.77978515625, -1.7144775390625, -1.649169921875, -1.5838623046875, -1.5185546875, -1.4532470703125, -1.387939453125, -1.3226318359375, -1.25732421875, -1.1920166015625, -1.126708984375, -1.0614013671875, -0.99609375, -0.9307861328125, -0.865478515625, -0.8001708984375, -0.73486328125, -0.6695556640625, -0.604248046875, -0.5389404296875, -0.4736328125, -0.4083251953125, -0.343017578125, -0.2777099609375, -0.21240234375, -0.1470947265625, -0.081787109375, -0.0164794921875, 0.048828125, 0.1141357421875, 0.179443359375, 0.2447509765625, 0.31005859375, 0.3753662109375, 0.440673828125, 0.5059814453125, 0.5712890625, 0.6365966796875, 0.701904296875, 0.7672119140625, 0.83251953125, 0.8978271484375, 0.963134765625, 1.0284423828125, 1.09375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 23.0, 44.0, 95.0, 204.0, 281.0, 190.0, 85.0, 35.0, 19.0, 10.0, 5.0, 1.0, 1.0, 3.0, 1.0], "bins": [-1.4345703125, -1.40777587890625, -1.3809814453125, -1.35418701171875, -1.327392578125, -1.30059814453125, -1.2738037109375, -1.24700927734375, -1.22021484375, -1.19342041015625, -1.1666259765625, -1.13983154296875, -1.113037109375, -1.08624267578125, -1.0594482421875, -1.03265380859375, -1.005859375, -0.97906494140625, -0.9522705078125, -0.92547607421875, -0.898681640625, -0.87188720703125, -0.8450927734375, -0.81829833984375, -0.79150390625, -0.76470947265625, -0.7379150390625, -0.71112060546875, -0.684326171875, -0.65753173828125, -0.6307373046875, -0.60394287109375, -0.5771484375, -0.55035400390625, -0.5235595703125, -0.49676513671875, -0.469970703125, -0.44317626953125, -0.4163818359375, -0.38958740234375, -0.36279296875, -0.33599853515625, -0.3092041015625, -0.28240966796875, -0.255615234375, -0.22882080078125, -0.2020263671875, -0.17523193359375, -0.1484375, -0.12164306640625, -0.0948486328125, -0.06805419921875, -0.041259765625, -0.01446533203125, 0.0123291015625, 0.03912353515625, 0.06591796875, 0.09271240234375, 0.1195068359375, 0.14630126953125, 0.173095703125, 0.19989013671875, 0.2266845703125, 0.25347900390625, 0.2802734375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 8.0, 25.0, 47.0, 150.0, 401.0, 259.0, 75.0, 18.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.841560363769531, -11.599265098571777, -11.356968879699707, -11.114673614501953, -10.872377395629883, -10.630082130432129, -10.387785911560059, -10.145490646362305, -9.903194427490234, -9.66089916229248, -9.41860294342041, -9.176307678222656, -8.934011459350586, -8.691716194152832, -8.449419975280762, -8.207124710083008, -7.964828968048096, -7.722533226013184, -7.4802374839782715, -7.237941741943359, -6.995645999908447, -6.753350257873535, -6.511054992675781, -6.268758773803711, -6.026463508605957, -5.784167766571045, -5.541872024536133, -5.299576282501221, -5.057280540466309, -4.8149847984313965, -4.572689056396484, -4.3303937911987305, -4.08809757232666, -3.845801830291748, -3.603506088256836, -3.361210346221924, -3.1189146041870117, -2.8766188621520996, -2.6343233585357666, -2.3920276165008545, -2.1497321128845215, -1.9074363708496094, -1.6651406288146973, -1.4228450059890747, -1.1805492639541626, -0.9382535219192505, -0.6959578990936279, -0.4536621570587158, -0.2113664150238037, 0.03092929720878601, 0.27322500944137573, 0.5155206918716431, 0.7578164339065552, 1.0001121759414673, 1.2424077987670898, 1.484703540802002, 1.726999282836914, 1.9692950248718262, 2.2115907669067383, 2.4538865089416504, 2.6961822509765625, 2.9384779930114746, 3.1807734966278076, 3.4230692386627197, 3.665364980697632]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 4.0, 7.0, 9.0, 9.0, 12.0, 5.0, 20.0, 21.0, 37.0, 62.0, 73.0, 77.0, 94.0, 95.0, 101.0, 87.0, 80.0, 61.0, 40.0, 32.0, 18.0, 14.0, 12.0, 10.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.269471168518066, -7.0550079345703125, -6.840544700622559, -6.626081466674805, -6.411618232727051, -6.197154998779297, -5.982691764831543, -5.768228530883789, -5.553765296936035, -5.339302062988281, -5.124838829040527, -4.910375595092773, -4.6959123611450195, -4.481449127197266, -4.266985893249512, -4.052522659301758, -3.838059902191162, -3.623596668243408, -3.4091334342956543, -3.1946702003479004, -2.9802069664001465, -2.7657437324523926, -2.5512807369232178, -2.336817502975464, -2.12235426902771, -1.907891035079956, -1.6934278011322021, -1.4789646863937378, -1.2645014524459839, -1.05003821849823, -0.8355751037597656, -0.6211118698120117, -0.4066486358642578, -0.1921854317188263, 0.022277772426605225, 0.23674094676971436, 0.45120418071746826, 0.6656674146652222, 0.8801305294036865, 1.0945937633514404, 1.3090569972991943, 1.5235202312469482, 1.7379834651947021, 1.9524465799331665, 2.166909694671631, 2.3813729286193848, 2.5958361625671387, 2.8102993965148926, 3.0247626304626465, 3.2392258644104004, 3.4536890983581543, 3.668152332305908, 3.882615566253662, 4.097078800201416, 4.311541557312012, 4.526004791259766, 4.7404680252075195, 4.954931259155273, 5.169394493103027, 5.383857727050781, 5.598320960998535, 5.812784194946289, 6.027247428894043, 6.241710662841797, 6.456173896789551]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 4.0, 9.0, 7.0, 6.0, 7.0, 13.0, 7.0, 24.0, 24.0, 34.0, 31.0, 43.0, 63.0, 70.0, 103.0, 178.0, 266.0, 499.0, 985.0, 1788.0, 3919.0, 16587.0, 4064396.0, 93586.0, 7207.0, 2207.0, 1035.0, 526.0, 291.0, 156.0, 90.0, 52.0, 31.0, 13.0, 10.0, 6.0, 8.0, 3.0, 1.0, 5.0], "bins": [-5.359375, -5.2447662353515625, -5.130157470703125, -5.0155487060546875, -4.90093994140625, -4.7863311767578125, -4.671722412109375, -4.5571136474609375, -4.4425048828125, -4.3278961181640625, -4.213287353515625, -4.0986785888671875, -3.98406982421875, -3.8694610595703125, -3.754852294921875, -3.6402435302734375, -3.525634765625, -3.4110260009765625, -3.296417236328125, -3.1818084716796875, -3.06719970703125, -2.9525909423828125, -2.837982177734375, -2.7233734130859375, -2.6087646484375, -2.4941558837890625, -2.379547119140625, -2.2649383544921875, -2.15032958984375, -2.0357208251953125, -1.921112060546875, -1.8065032958984375, -1.69189453125, -1.5772857666015625, -1.462677001953125, -1.3480682373046875, -1.23345947265625, -1.1188507080078125, -1.004241943359375, -0.8896331787109375, -0.7750244140625, -0.6604156494140625, -0.545806884765625, -0.4311981201171875, -0.31658935546875, -0.2019805908203125, -0.087371826171875, 0.0272369384765625, 0.141845703125, 0.2564544677734375, 0.371063232421875, 0.4856719970703125, 0.60028076171875, 0.7148895263671875, 0.829498291015625, 0.9441070556640625, 1.0587158203125, 1.1733245849609375, 1.287933349609375, 1.4025421142578125, 1.51715087890625, 1.6317596435546875, 1.746368408203125, 1.8609771728515625, 1.9755859375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 5.0, 8.0, 4.0, 11.0, 5.0, 15.0, 9.0, 15.0, 30.0, 84.0, 209.0, 298.0, 158.0, 55.0, 24.0, 20.0, 9.0, 9.0, 9.0, 4.0, 7.0, 5.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0], "bins": [-0.260986328125, -0.25533199310302734, -0.2496776580810547, -0.24402332305908203, -0.23836898803710938, -0.23271465301513672, -0.22706031799316406, -0.2214059829711914, -0.21575164794921875, -0.2100973129272461, -0.20444297790527344, -0.19878864288330078, -0.19313430786132812, -0.18747997283935547, -0.1818256378173828, -0.17617130279541016, -0.1705169677734375, -0.16486263275146484, -0.1592082977294922, -0.15355396270751953, -0.14789962768554688, -0.14224529266357422, -0.13659095764160156, -0.1309366226196289, -0.12528228759765625, -0.1196279525756836, -0.11397361755371094, -0.10831928253173828, -0.10266494750976562, -0.09701061248779297, -0.09135627746582031, -0.08570194244384766, -0.080047607421875, -0.07439327239990234, -0.06873893737792969, -0.06308460235595703, -0.057430267333984375, -0.05177593231201172, -0.04612159729003906, -0.040467262268066406, -0.03481292724609375, -0.029158592224121094, -0.023504257202148438, -0.01784992218017578, -0.012195587158203125, -0.006541252136230469, -0.0008869171142578125, 0.004767417907714844, 0.0104217529296875, 0.016076087951660156, 0.021730422973632812, 0.02738475799560547, 0.033039093017578125, 0.03869342803955078, 0.04434776306152344, 0.050002098083496094, 0.05565643310546875, 0.061310768127441406, 0.06696510314941406, 0.07261943817138672, 0.07827377319335938, 0.08392810821533203, 0.08958244323730469, 0.09523677825927734, 0.10089111328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 12.0, 14.0, 20.0, 33.0, 59.0, 135.0, 283.0, 1371.0, 20289.0, 4139710.0, 30159.0, 1530.0, 330.0, 154.0, 81.0, 23.0, 18.0, 19.0, 10.0, 3.0, 10.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.587890625, -3.466461181640625, -3.34503173828125, -3.223602294921875, -3.1021728515625, -2.980743408203125, -2.85931396484375, -2.737884521484375, -2.616455078125, -2.495025634765625, -2.37359619140625, -2.252166748046875, -2.1307373046875, -2.009307861328125, -1.88787841796875, -1.766448974609375, -1.64501953125, -1.523590087890625, -1.40216064453125, -1.280731201171875, -1.1593017578125, -1.037872314453125, -0.91644287109375, -0.795013427734375, -0.673583984375, -0.552154541015625, -0.43072509765625, -0.309295654296875, -0.1878662109375, -0.066436767578125, 0.05499267578125, 0.176422119140625, 0.2978515625, 0.419281005859375, 0.54071044921875, 0.662139892578125, 0.7835693359375, 0.904998779296875, 1.02642822265625, 1.147857666015625, 1.269287109375, 1.390716552734375, 1.51214599609375, 1.633575439453125, 1.7550048828125, 1.876434326171875, 1.99786376953125, 2.119293212890625, 2.24072265625, 2.362152099609375, 2.48358154296875, 2.605010986328125, 2.7264404296875, 2.847869873046875, 2.96929931640625, 3.090728759765625, 3.212158203125, 3.333587646484375, 3.45501708984375, 3.576446533203125, 3.6978759765625, 3.819305419921875, 3.94073486328125, 4.062164306640625, 4.18359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 6.0, 2.0, 7.0, 15.0, 17.0, 34.0, 37.0, 66.0, 164.0, 725.0, 2407.0, 352.0, 99.0, 58.0, 29.0, 18.0, 12.0, 8.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3876953125, -0.3760414123535156, -0.36438751220703125, -0.3527336120605469, -0.3410797119140625, -0.3294258117675781, -0.31777191162109375, -0.3061180114746094, -0.294464111328125, -0.2828102111816406, -0.27115631103515625, -0.2595024108886719, -0.2478485107421875, -0.23619461059570312, -0.22454071044921875, -0.21288681030273438, -0.20123291015625, -0.18957901000976562, -0.17792510986328125, -0.16627120971679688, -0.1546173095703125, -0.14296340942382812, -0.13130950927734375, -0.11965560913085938, -0.108001708984375, -0.09634780883789062, -0.08469390869140625, -0.07304000854492188, -0.0613861083984375, -0.049732208251953125, -0.03807830810546875, -0.026424407958984375, -0.0147705078125, -0.003116607666015625, 0.00853729248046875, 0.020191192626953125, 0.0318450927734375, 0.043498992919921875, 0.05515289306640625, 0.06680679321289062, 0.078460693359375, 0.09011459350585938, 0.10176849365234375, 0.11342239379882812, 0.1250762939453125, 0.13673019409179688, 0.14838409423828125, 0.16003799438476562, 0.17169189453125, 0.18334579467773438, 0.19499969482421875, 0.20665359497070312, 0.2183074951171875, 0.22996139526367188, 0.24161529541015625, 0.2532691955566406, 0.264923095703125, 0.2765769958496094, 0.28823089599609375, 0.2998847961425781, 0.3115386962890625, 0.3231925964355469, 0.33484649658203125, 0.3465003967285156, 0.358154296875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 5.0, 13.0, 30.0, 209.0, 553.0, 160.0, 18.0, 8.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3447232246398926, -2.2490410804748535, -2.1533589363098145, -2.0576767921447754, -1.9619946479797363, -1.8663125038146973, -1.7706303596496582, -1.6749482154846191, -1.57926607131958, -1.483583927154541, -1.387901782989502, -1.292219638824463, -1.1965374946594238, -1.1008553504943848, -1.0051732063293457, -0.9094910025596619, -0.813808798789978, -0.718126654624939, -0.6224445104598999, -0.5267623662948608, -0.4310801923274994, -0.3353980481624603, -0.23971587419509888, -0.14403373003005981, -0.04835158586502075, 0.04733056575059891, 0.14301271736621857, 0.23869487643241882, 0.3343770205974579, 0.43005916476249695, 0.5257413387298584, 0.6214234828948975, 0.7171056270599365, 0.8127877712249756, 0.9084699153900146, 1.0041520595550537, 1.0998342037200928, 1.1955163478851318, 1.291198492050171, 1.38688063621521, 1.482562780380249, 1.578244924545288, 1.6739270687103271, 1.7696092128753662, 1.8652913570404053, 1.9609735012054443, 2.0566556453704834, 2.1523377895355225, 2.2480201721191406, 2.3437023162841797, 2.4393844604492188, 2.535066604614258, 2.630748748779297, 2.726430892944336, 2.822113037109375, 2.917795181274414, 3.013477325439453, 3.109159469604492, 3.2048416137695312, 3.3005237579345703, 3.3962059020996094, 3.4918880462646484, 3.5875701904296875, 3.6832523345947266, 3.7789344787597656]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 7.0, 6.0, 11.0, 14.0, 10.0, 20.0, 20.0, 39.0, 40.0, 46.0, 58.0, 66.0, 72.0, 80.0, 71.0, 76.0, 72.0, 51.0, 51.0, 34.0, 45.0, 21.0, 24.0, 14.0, 9.0, 7.0, 5.0, 4.0, 6.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1454839706420898, -1.1123164892196655, -1.0791491270065308, -1.0459816455841064, -1.0128141641616821, -0.9796468019485474, -0.946479320526123, -0.9133118987083435, -0.880144476890564, -0.8469770550727844, -0.8138095736503601, -0.7806421518325806, -0.747474730014801, -0.7143073081970215, -0.6811398267745972, -0.6479724049568176, -0.6148049235343933, -0.5816375017166138, -0.5484700202941895, -0.5153025984764099, -0.48213517665863037, -0.44896772503852844, -0.4158002734184265, -0.382632851600647, -0.34946539998054504, -0.3162979483604431, -0.2831305265426636, -0.24996307492256165, -0.2167956382036209, -0.18362820148468018, -0.15046074986457825, -0.11729331314563751, -0.08412587642669678, -0.050958435982465744, -0.01779099553823471, 0.015376448631286621, 0.048543885350227356, 0.08171132206916809, 0.11487877368927002, 0.14804621040821075, 0.1812136471271515, 0.21438108384609222, 0.24754852056503296, 0.2807159721851349, 0.3138834238052368, 0.34705084562301636, 0.3802182972431183, 0.4133857488632202, 0.44655317068099976, 0.4797206223011017, 0.5128880739212036, 0.5460554957389832, 0.5792229175567627, 0.612390398979187, 0.6455578207969666, 0.6787252426147461, 0.7118927240371704, 0.74506014585495, 0.7782276272773743, 0.8113950490951538, 0.8445624709129333, 0.8777298927307129, 0.9108973741531372, 0.9440647959709167, 0.9772322177886963]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 4.0, 10.0, 15.0, 22.0, 20.0, 17.0, 54.0, 69.0, 104.0, 135.0, 238.0, 410.0, 753.0, 1637.0, 4226.0, 16044.0, 256202.0, 733373.0, 25397.0, 5566.0, 1949.0, 960.0, 484.0, 292.0, 159.0, 118.0, 79.0, 55.0, 39.0, 36.0, 24.0, 17.0, 11.0, 11.0, 6.0, 4.0, 5.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5966796875, -1.545379638671875, -1.49407958984375, -1.442779541015625, -1.3914794921875, -1.340179443359375, -1.28887939453125, -1.237579345703125, -1.186279296875, -1.134979248046875, -1.08367919921875, -1.032379150390625, -0.9810791015625, -0.929779052734375, -0.87847900390625, -0.827178955078125, -0.77587890625, -0.724578857421875, -0.67327880859375, -0.621978759765625, -0.5706787109375, -0.519378662109375, -0.46807861328125, -0.416778564453125, -0.365478515625, -0.314178466796875, -0.26287841796875, -0.211578369140625, -0.1602783203125, -0.108978271484375, -0.05767822265625, -0.006378173828125, 0.044921875, 0.096221923828125, 0.14752197265625, 0.198822021484375, 0.2501220703125, 0.301422119140625, 0.35272216796875, 0.404022216796875, 0.455322265625, 0.506622314453125, 0.55792236328125, 0.609222412109375, 0.6605224609375, 0.711822509765625, 0.76312255859375, 0.814422607421875, 0.86572265625, 0.917022705078125, 0.96832275390625, 1.019622802734375, 1.0709228515625, 1.122222900390625, 1.17352294921875, 1.224822998046875, 1.276123046875, 1.327423095703125, 1.37872314453125, 1.430023193359375, 1.4813232421875, 1.532623291015625, 1.58392333984375, 1.635223388671875, 1.6865234375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 6.0, 7.0, 6.0, 14.0, 25.0, 49.0, 92.0, 184.0, 266.0, 163.0, 88.0, 39.0, 17.0, 12.0, 8.0, 10.0, 2.0, 4.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.263427734375, -0.25785160064697266, -0.2522754669189453, -0.24669933319091797, -0.24112319946289062, -0.23554706573486328, -0.22997093200683594, -0.2243947982788086, -0.21881866455078125, -0.2132425308227539, -0.20766639709472656, -0.20209026336669922, -0.19651412963867188, -0.19093799591064453, -0.1853618621826172, -0.17978572845458984, -0.1742095947265625, -0.16863346099853516, -0.1630573272705078, -0.15748119354248047, -0.15190505981445312, -0.14632892608642578, -0.14075279235839844, -0.1351766586303711, -0.12960052490234375, -0.1240243911743164, -0.11844825744628906, -0.11287212371826172, -0.10729598999023438, -0.10171985626220703, -0.09614372253417969, -0.09056758880615234, -0.084991455078125, -0.07941532135009766, -0.07383918762207031, -0.06826305389404297, -0.06268692016601562, -0.05711078643798828, -0.05153465270996094, -0.045958518981933594, -0.04038238525390625, -0.034806251525878906, -0.029230117797851562, -0.02365398406982422, -0.018077850341796875, -0.012501716613769531, -0.0069255828857421875, -0.0013494491577148438, 0.0042266845703125, 0.009802818298339844, 0.015378952026367188, 0.02095508575439453, 0.026531219482421875, 0.03210735321044922, 0.03768348693847656, 0.043259620666503906, 0.04883575439453125, 0.054411888122558594, 0.05998802185058594, 0.06556415557861328, 0.07114028930664062, 0.07671642303466797, 0.08229255676269531, 0.08786869049072266, 0.09344482421875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 6.0, 8.0, 12.0, 12.0, 26.0, 21.0, 40.0, 46.0, 78.0, 98.0, 153.0, 242.0, 395.0, 574.0, 1038.0, 1985.0, 5309.0, 20313.0, 125023.0, 651073.0, 201035.0, 28849.0, 6872.0, 2407.0, 1109.0, 629.0, 421.0, 255.0, 162.0, 101.0, 84.0, 48.0, 28.0, 22.0, 17.0, 14.0, 11.0, 9.0, 11.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8525390625, -0.8255767822265625, -0.798614501953125, -0.7716522216796875, -0.74468994140625, -0.7177276611328125, -0.690765380859375, -0.6638031005859375, -0.6368408203125, -0.6098785400390625, -0.582916259765625, -0.5559539794921875, -0.52899169921875, -0.5020294189453125, -0.475067138671875, -0.4481048583984375, -0.421142578125, -0.3941802978515625, -0.367218017578125, -0.3402557373046875, -0.31329345703125, -0.2863311767578125, -0.259368896484375, -0.2324066162109375, -0.2054443359375, -0.1784820556640625, -0.151519775390625, -0.1245574951171875, -0.09759521484375, -0.0706329345703125, -0.043670654296875, -0.0167083740234375, 0.01025390625, 0.0372161865234375, 0.064178466796875, 0.0911407470703125, 0.11810302734375, 0.1450653076171875, 0.172027587890625, 0.1989898681640625, 0.2259521484375, 0.2529144287109375, 0.279876708984375, 0.3068389892578125, 0.33380126953125, 0.3607635498046875, 0.387725830078125, 0.4146881103515625, 0.441650390625, 0.4686126708984375, 0.495574951171875, 0.5225372314453125, 0.54949951171875, 0.5764617919921875, 0.603424072265625, 0.6303863525390625, 0.6573486328125, 0.6843109130859375, 0.711273193359375, 0.7382354736328125, 0.76519775390625, 0.7921600341796875, 0.819122314453125, 0.8460845947265625, 0.873046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 5.0, 3.0, 7.0, 5.0, 11.0, 13.0, 13.0, 13.0, 23.0, 16.0, 15.0, 28.0, 27.0, 23.0, 27.0, 29.0, 34.0, 49.0, 35.0, 39.0, 51.0, 38.0, 40.0, 35.0, 34.0, 23.0, 47.0, 45.0, 22.0, 34.0, 27.0, 34.0, 22.0, 19.0, 12.0, 20.0, 13.0, 13.0, 6.0, 6.0, 6.0, 7.0, 6.0, 7.0, 10.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.36572265625, -0.35418701171875, -0.3426513671875, -0.33111572265625, -0.319580078125, -0.30804443359375, -0.2965087890625, -0.28497314453125, -0.2734375, -0.26190185546875, -0.2503662109375, -0.23883056640625, -0.227294921875, -0.21575927734375, -0.2042236328125, -0.19268798828125, -0.18115234375, -0.16961669921875, -0.1580810546875, -0.14654541015625, -0.135009765625, -0.12347412109375, -0.1119384765625, -0.10040283203125, -0.0888671875, -0.07733154296875, -0.0657958984375, -0.05426025390625, -0.042724609375, -0.03118896484375, -0.0196533203125, -0.00811767578125, 0.00341796875, 0.01495361328125, 0.0264892578125, 0.03802490234375, 0.049560546875, 0.06109619140625, 0.0726318359375, 0.08416748046875, 0.095703125, 0.10723876953125, 0.1187744140625, 0.13031005859375, 0.141845703125, 0.15338134765625, 0.1649169921875, 0.17645263671875, 0.18798828125, 0.19952392578125, 0.2110595703125, 0.22259521484375, 0.234130859375, 0.24566650390625, 0.2572021484375, 0.26873779296875, 0.2802734375, 0.29180908203125, 0.3033447265625, 0.31488037109375, 0.326416015625, 0.33795166015625, 0.3494873046875, 0.36102294921875, 0.37255859375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 7.0, 4.0, 6.0, 11.0, 22.0, 25.0, 56.0, 106.0, 228.0, 479.0, 1470.0, 7478.0, 154738.0, 854315.0, 25183.0, 2989.0, 769.0, 320.0, 160.0, 75.0, 42.0, 18.0, 15.0, 4.0, 15.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75390625, -0.7289810180664062, -0.7040557861328125, -0.6791305541992188, -0.654205322265625, -0.6292800903320312, -0.6043548583984375, -0.5794296264648438, -0.55450439453125, -0.5295791625976562, -0.5046539306640625, -0.47972869873046875, -0.454803466796875, -0.42987823486328125, -0.4049530029296875, -0.38002777099609375, -0.3551025390625, -0.33017730712890625, -0.3052520751953125, -0.28032684326171875, -0.255401611328125, -0.23047637939453125, -0.2055511474609375, -0.18062591552734375, -0.15570068359375, -0.13077545166015625, -0.1058502197265625, -0.08092498779296875, -0.055999755859375, -0.03107452392578125, -0.0061492919921875, 0.01877593994140625, 0.043701171875, 0.06862640380859375, 0.0935516357421875, 0.11847686767578125, 0.143402099609375, 0.16832733154296875, 0.1932525634765625, 0.21817779541015625, 0.24310302734375, 0.26802825927734375, 0.2929534912109375, 0.31787872314453125, 0.342803955078125, 0.36772918701171875, 0.3926544189453125, 0.41757965087890625, 0.4425048828125, 0.46743011474609375, 0.4923553466796875, 0.5172805786132812, 0.542205810546875, 0.5671310424804688, 0.5920562744140625, 0.6169815063476562, 0.64190673828125, 0.6668319702148438, 0.6917572021484375, 0.7166824340820312, 0.741607666015625, 0.7665328979492188, 0.7914581298828125, 0.8163833618164062, 0.84130859375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 8.0, 7.0, 17.0, 23.0, 30.0, 44.0, 71.0, 72.0, 110.0, 161.0, 127.0, 100.0, 51.0, 47.0, 44.0, 30.0, 20.0, 16.0, 9.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018513202667236328, -0.00017572380602359772, -0.00016631558537483215, -0.0001569073647260666, -0.00014749914407730103, -0.00013809092342853546, -0.0001286827027797699, -0.00011927448213100433, -0.00010986626148223877, -0.0001004580408334732, -9.104982018470764e-05, -8.164159953594208e-05, -7.223337888717651e-05, -6.282515823841095e-05, -5.3416937589645386e-05, -4.400871694087982e-05, -3.460049629211426e-05, -2.5192275643348694e-05, -1.578405499458313e-05, -6.375834345817566e-06, 3.032386302947998e-06, 1.2440606951713562e-05, 2.1848827600479126e-05, 3.125704824924469e-05, 4.0665268898010254e-05, 5.007348954677582e-05, 5.948171019554138e-05, 6.888993084430695e-05, 7.829815149307251e-05, 8.770637214183807e-05, 9.711459279060364e-05, 0.0001065228134393692, 0.00011593103408813477, 0.00012533925473690033, 0.0001347474753856659, 0.00014415569603443146, 0.00015356391668319702, 0.00016297213733196259, 0.00017238035798072815, 0.0001817885786294937, 0.00019119679927825928, 0.00020060501992702484, 0.0002100132405757904, 0.00021942146122455597, 0.00022882968187332153, 0.0002382379025220871, 0.00024764612317085266, 0.0002570543438196182, 0.0002664625644683838, 0.00027587078511714935, 0.0002852790057659149, 0.0002946872264146805, 0.00030409544706344604, 0.0003135036677122116, 0.00032291188836097717, 0.00033232010900974274, 0.0003417283296585083, 0.00035113655030727386, 0.00036054477095603943, 0.000369952991604805, 0.00037936121225357056, 0.0003887694329023361, 0.0003981776535511017, 0.00040758587419986725, 0.0004169940948486328]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 4.0, 6.0, 4.0, 12.0, 19.0, 37.0, 43.0, 83.0, 132.0, 257.0, 641.0, 1592.0, 6205.0, 67037.0, 888778.0, 74567.0, 6367.0, 1563.0, 591.0, 245.0, 143.0, 77.0, 56.0, 16.0, 15.0, 22.0, 11.0, 7.0, 6.0, 4.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97509765625, -0.948394775390625, -0.92169189453125, -0.894989013671875, -0.8682861328125, -0.841583251953125, -0.81488037109375, -0.788177490234375, -0.761474609375, -0.734771728515625, -0.70806884765625, -0.681365966796875, -0.6546630859375, -0.627960205078125, -0.60125732421875, -0.574554443359375, -0.5478515625, -0.521148681640625, -0.49444580078125, -0.467742919921875, -0.4410400390625, -0.414337158203125, -0.38763427734375, -0.360931396484375, -0.334228515625, -0.307525634765625, -0.28082275390625, -0.254119873046875, -0.2274169921875, -0.200714111328125, -0.17401123046875, -0.147308349609375, -0.12060546875, -0.093902587890625, -0.06719970703125, -0.040496826171875, -0.0137939453125, 0.012908935546875, 0.03961181640625, 0.066314697265625, 0.093017578125, 0.119720458984375, 0.14642333984375, 0.173126220703125, 0.1998291015625, 0.226531982421875, 0.25323486328125, 0.279937744140625, 0.306640625, 0.333343505859375, 0.36004638671875, 0.386749267578125, 0.4134521484375, 0.440155029296875, 0.46685791015625, 0.493560791015625, 0.520263671875, 0.546966552734375, 0.57366943359375, 0.600372314453125, 0.6270751953125, 0.653778076171875, 0.68048095703125, 0.707183837890625, 0.73388671875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 7.0, 6.0, 17.0, 17.0, 34.0, 42.0, 52.0, 65.0, 118.0, 148.0, 148.0, 104.0, 68.0, 59.0, 29.0, 29.0, 16.0, 9.0, 10.0, 13.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6728515625, -0.6575355529785156, -0.6422195434570312, -0.6269035339355469, -0.6115875244140625, -0.5962715148925781, -0.5809555053710938, -0.5656394958496094, -0.550323486328125, -0.5350074768066406, -0.5196914672851562, -0.5043754577636719, -0.4890594482421875, -0.4737434387207031, -0.45842742919921875, -0.4431114196777344, -0.42779541015625, -0.4124794006347656, -0.39716339111328125, -0.3818473815917969, -0.3665313720703125, -0.3512153625488281, -0.33589935302734375, -0.3205833435058594, -0.305267333984375, -0.2899513244628906, -0.27463531494140625, -0.2593193054199219, -0.2440032958984375, -0.22868728637695312, -0.21337127685546875, -0.19805526733398438, -0.1827392578125, -0.16742324829101562, -0.15210723876953125, -0.13679122924804688, -0.1214752197265625, -0.10615921020507812, -0.09084320068359375, -0.07552719116210938, -0.060211181640625, -0.044895172119140625, -0.02957916259765625, -0.014263153076171875, 0.0010528564453125, 0.016368865966796875, 0.03168487548828125, 0.047000885009765625, 0.06231689453125, 0.07763290405273438, 0.09294891357421875, 0.10826492309570312, 0.1235809326171875, 0.13889694213867188, 0.15421295166015625, 0.16952896118164062, 0.184844970703125, 0.20016098022460938, 0.21547698974609375, 0.23079299926757812, 0.2461090087890625, 0.2614250183105469, 0.27674102783203125, 0.2920570373535156, 0.307373046875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 6.0, 31.0, 328.0, 581.0, 51.0, 4.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.163188934326172, -25.557373046875, -24.95155906677246, -24.345745086669922, -23.73992919921875, -23.134113311767578, -22.52829933166504, -21.9224853515625, -21.316669464111328, -20.710853576660156, -20.105039596557617, -19.499225616455078, -18.893409729003906, -18.287593841552734, -17.681779861450195, -17.075965881347656, -16.470149993896484, -15.864335060119629, -15.258520126342773, -14.652705192565918, -14.046890258789062, -13.441075325012207, -12.835260391235352, -12.229445457458496, -11.62363052368164, -11.017815589904785, -10.41200065612793, -9.806185722351074, -9.200370788574219, -8.594555854797363, -7.988740921020508, -7.382925987243652, -6.777109146118164, -6.171294212341309, -5.565479278564453, -4.959664344787598, -4.353849411010742, -3.7480344772338867, -3.1422195434570312, -2.536404609680176, -1.9305896759033203, -1.3247747421264648, -0.7189598083496094, -0.1131448745727539, 0.49267005920410156, 1.098484992980957, 1.7042999267578125, 2.310114860534668, 2.9159297943115234, 3.521744728088379, 4.127559661865234, 4.73337459564209, 5.339189529418945, 5.945004463195801, 6.550819396972656, 7.156634330749512, 7.762449264526367, 8.368264198303223, 8.974079132080078, 9.579894065856934, 10.185708999633789, 10.791523933410645, 11.3973388671875, 12.003153800964355, 12.608968734741211]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 7.0, 6.0, 6.0, 8.0, 11.0, 8.0, 15.0, 24.0, 31.0, 25.0, 37.0, 32.0, 46.0, 51.0, 50.0, 53.0, 59.0, 63.0, 61.0, 59.0, 47.0, 49.0, 47.0, 28.0, 43.0, 30.0, 27.0, 18.0, 15.0, 10.0, 12.0, 0.0, 3.0, 6.0, 8.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.1264801025390625, -4.003203392028809, -3.8799262046813965, -3.7566492557525635, -3.6333723068237305, -3.5100955963134766, -3.3868186473846436, -3.2635416984558105, -3.1402647495269775, -3.0169878005981445, -2.8937108516693115, -2.7704339027404785, -2.6471571922302246, -2.5238800048828125, -2.4006032943725586, -2.2773263454437256, -2.1540493965148926, -2.0307724475860596, -1.9074954986572266, -1.784218668937683, -1.66094172000885, -1.537664771080017, -1.4143879413604736, -1.2911109924316406, -1.1678340435028076, -1.0445570945739746, -0.9212802052497864, -0.7980033159255981, -0.6747263669967651, -0.5514494180679321, -0.4281725287437439, -0.30489563941955566, -0.18161869049072266, -0.058341771364212036, 0.06493514776229858, 0.1882120668888092, 0.3114889860153198, 0.43476593494415283, 0.5580428242683411, 0.6813197135925293, 0.8045966625213623, 0.9278736114501953, 1.0511505603790283, 1.1744273900985718, 1.2977043390274048, 1.4209812879562378, 1.5442581176757812, 1.6675350666046143, 1.7908120155334473, 1.9140889644622803, 2.0373659133911133, 2.1606428623199463, 2.2839198112487793, 2.407196521759033, 2.530473470687866, 2.653750419616699, 2.7770273685455322, 2.9003043174743652, 3.0235812664031982, 3.1468582153320312, 3.270134925842285, 3.3934121131896973, 3.516688823699951, 3.639965772628784, 3.763242721557617]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 7.0, 11.0, 16.0, 23.0, 48.0, 72.0, 153.0, 447.0, 1835.0, 232926.0, 3956656.0, 1652.0, 292.0, 78.0, 25.0, 12.0, 9.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.96875, -10.73052978515625, -10.4923095703125, -10.25408935546875, -10.015869140625, -9.77764892578125, -9.5394287109375, -9.30120849609375, -9.06298828125, -8.82476806640625, -8.5865478515625, -8.34832763671875, -8.110107421875, -7.87188720703125, -7.6336669921875, -7.39544677734375, -7.1572265625, -6.91900634765625, -6.6807861328125, -6.44256591796875, -6.204345703125, -5.96612548828125, -5.7279052734375, -5.48968505859375, -5.25146484375, -5.01324462890625, -4.7750244140625, -4.53680419921875, -4.298583984375, -4.06036376953125, -3.8221435546875, -3.58392333984375, -3.345703125, -3.10748291015625, -2.8692626953125, -2.63104248046875, -2.392822265625, -2.15460205078125, -1.9163818359375, -1.67816162109375, -1.43994140625, -1.20172119140625, -0.9635009765625, -0.72528076171875, -0.487060546875, -0.24884033203125, -0.0106201171875, 0.22760009765625, 0.4658203125, 0.70404052734375, 0.9422607421875, 1.18048095703125, 1.418701171875, 1.65692138671875, 1.8951416015625, 2.13336181640625, 2.37158203125, 2.60980224609375, 2.8480224609375, 3.08624267578125, 3.324462890625, 3.56268310546875, 3.8009033203125, 4.03912353515625, 4.27734375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 4.0, 10.0, 23.0, 32.0, 66.0, 127.0, 225.0, 217.0, 135.0, 79.0, 27.0, 13.0, 10.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.3017578125, -0.2953205108642578, -0.2888832092285156, -0.28244590759277344, -0.27600860595703125, -0.26957130432128906, -0.2631340026855469, -0.2566967010498047, -0.2502593994140625, -0.2438220977783203, -0.23738479614257812, -0.23094749450683594, -0.22451019287109375, -0.21807289123535156, -0.21163558959960938, -0.2051982879638672, -0.198760986328125, -0.1923236846923828, -0.18588638305664062, -0.17944908142089844, -0.17301177978515625, -0.16657447814941406, -0.16013717651367188, -0.1536998748779297, -0.1472625732421875, -0.1408252716064453, -0.13438796997070312, -0.12795066833496094, -0.12151336669921875, -0.11507606506347656, -0.10863876342773438, -0.10220146179199219, -0.09576416015625, -0.08932685852050781, -0.08288955688476562, -0.07645225524902344, -0.07001495361328125, -0.06357765197753906, -0.057140350341796875, -0.05070304870605469, -0.0442657470703125, -0.03782844543457031, -0.031391143798828125, -0.024953842163085938, -0.01851654052734375, -0.012079238891601562, -0.005641937255859375, 0.0007953643798828125, 0.007232666015625, 0.013669967651367188, 0.020107269287109375, 0.026544570922851562, 0.03298187255859375, 0.03941917419433594, 0.045856475830078125, 0.05229377746582031, 0.0587310791015625, 0.06516838073730469, 0.07160568237304688, 0.07804298400878906, 0.08448028564453125, 0.09091758728027344, 0.09735488891601562, 0.10379219055175781, 0.1102294921875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 15.0, 22.0, 26.0, 60.0, 95.0, 237.0, 593.0, 2056.0, 12048.0, 258150.0, 3882584.0, 32841.0, 3999.0, 928.0, 300.0, 142.0, 74.0, 42.0, 24.0, 17.0, 11.0, 7.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.244140625, -2.1909637451171875, -2.137786865234375, -2.0846099853515625, -2.03143310546875, -1.9782562255859375, -1.925079345703125, -1.8719024658203125, -1.8187255859375, -1.7655487060546875, -1.712371826171875, -1.6591949462890625, -1.60601806640625, -1.5528411865234375, -1.499664306640625, -1.4464874267578125, -1.393310546875, -1.3401336669921875, -1.286956787109375, -1.2337799072265625, -1.18060302734375, -1.1274261474609375, -1.074249267578125, -1.0210723876953125, -0.9678955078125, -0.9147186279296875, -0.861541748046875, -0.8083648681640625, -0.75518798828125, -0.7020111083984375, -0.648834228515625, -0.5956573486328125, -0.54248046875, -0.4893035888671875, -0.436126708984375, -0.3829498291015625, -0.32977294921875, -0.2765960693359375, -0.223419189453125, -0.1702423095703125, -0.1170654296875, -0.0638885498046875, -0.010711669921875, 0.0424652099609375, 0.09564208984375, 0.1488189697265625, 0.201995849609375, 0.2551727294921875, 0.308349609375, 0.3615264892578125, 0.414703369140625, 0.4678802490234375, 0.52105712890625, 0.5742340087890625, 0.627410888671875, 0.6805877685546875, 0.7337646484375, 0.7869415283203125, 0.840118408203125, 0.8932952880859375, 0.94647216796875, 0.9996490478515625, 1.052825927734375, 1.1060028076171875, 1.1591796875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 9.0, 6.0, 9.0, 9.0, 11.0, 29.0, 37.0, 48.0, 110.0, 311.0, 1529.0, 1346.0, 281.0, 127.0, 71.0, 44.0, 33.0, 15.0, 17.0, 8.0, 3.0, 5.0, 4.0, 3.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2381591796875, -0.2304668426513672, -0.22277450561523438, -0.21508216857910156, -0.20738983154296875, -0.19969749450683594, -0.19200515747070312, -0.1843128204345703, -0.1766204833984375, -0.1689281463623047, -0.16123580932617188, -0.15354347229003906, -0.14585113525390625, -0.13815879821777344, -0.13046646118164062, -0.12277412414550781, -0.115081787109375, -0.10738945007324219, -0.09969711303710938, -0.09200477600097656, -0.08431243896484375, -0.07662010192871094, -0.06892776489257812, -0.06123542785644531, -0.0535430908203125, -0.04585075378417969, -0.038158416748046875, -0.030466079711914062, -0.02277374267578125, -0.015081405639648438, -0.007389068603515625, 0.0003032684326171875, 0.00799560546875, 0.015687942504882812, 0.023380279541015625, 0.031072616577148438, 0.03876495361328125, 0.04645729064941406, 0.054149627685546875, 0.06184196472167969, 0.0695343017578125, 0.07722663879394531, 0.08491897583007812, 0.09261131286621094, 0.10030364990234375, 0.10799598693847656, 0.11568832397460938, 0.12338066101074219, 0.131072998046875, 0.1387653350830078, 0.14645767211914062, 0.15415000915527344, 0.16184234619140625, 0.16953468322753906, 0.17722702026367188, 0.1849193572998047, 0.1926116943359375, 0.2003040313720703, 0.20799636840820312, 0.21568870544433594, 0.22338104248046875, 0.23107337951660156, 0.23876571655273438, 0.2464580535888672, 0.254150390625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 11.0, 87.0, 648.0, 242.0, 16.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.866507053375244, -4.717939853668213, -4.569372177124023, -4.420804977416992, -4.272237777709961, -4.1236701011657715, -3.9751029014587402, -3.82653546333313, -3.6779680252075195, -3.529400587081909, -3.380833148956299, -3.2322659492492676, -3.0836985111236572, -2.935131072998047, -2.7865638732910156, -2.6379964351654053, -2.489428997039795, -2.3408615589141846, -2.192294120788574, -2.043726921081543, -1.8951594829559326, -1.7465920448303223, -1.5980247259140015, -1.4494574069976807, -1.3008899688720703, -1.15232253074646, -1.0037552118301392, -0.8551878333091736, -0.706620454788208, -0.5580530762672424, -0.40948569774627686, -0.26091837882995605, -0.1123514175415039, 0.03621596097946167, 0.18478333950042725, 0.3333507180213928, 0.4819180965423584, 0.630485475063324, 0.7790528535842896, 0.9276201725006104, 1.0761876106262207, 1.224755048751831, 1.3733223676681519, 1.5218896865844727, 1.670457124710083, 1.8190245628356934, 1.9675918817520142, 2.116159200668335, 2.2647266387939453, 2.4132940769195557, 2.561861515045166, 2.7104287147521973, 2.8589961528778076, 3.007563591003418, 3.156130790710449, 3.3046982288360596, 3.45326566696167, 3.6018331050872803, 3.7504005432128906, 3.898967742919922, 4.047534942626953, 4.196102619171143, 4.344669818878174, 4.493237495422363, 4.6418046951293945]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 4.0, 9.0, 11.0, 13.0, 16.0, 11.0, 24.0, 24.0, 30.0, 33.0, 41.0, 33.0, 43.0, 49.0, 46.0, 67.0, 49.0, 57.0, 53.0, 50.0, 53.0, 50.0, 39.0, 40.0, 31.0, 22.0, 24.0, 11.0, 13.0, 8.0, 9.0, 8.0, 7.0, 3.0, 2.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8123870491981506, -0.7890617251396179, -0.7657364010810852, -0.7424110770225525, -0.7190857529640198, -0.6957604289054871, -0.6724351048469543, -0.6491097807884216, -0.6257844567298889, -0.6024591326713562, -0.5791338086128235, -0.5558084845542908, -0.5324831604957581, -0.5091578364372253, -0.4858325123786926, -0.4625071883201599, -0.4391818642616272, -0.4158565402030945, -0.39253121614456177, -0.36920589208602905, -0.34588056802749634, -0.3225552439689636, -0.2992299199104309, -0.2759045958518982, -0.2525792717933655, -0.22925394773483276, -0.20592862367630005, -0.18260329961776733, -0.15927797555923462, -0.1359526515007019, -0.11262732744216919, -0.08930200338363647, -0.06597673892974854, -0.04265141487121582, -0.019326090812683105, 0.003999233245849609, 0.027324557304382324, 0.05064988136291504, 0.07397520542144775, 0.09730052947998047, 0.12062585353851318, 0.1439511775970459, 0.1672765016555786, 0.19060182571411133, 0.21392714977264404, 0.23725247383117676, 0.2605777978897095, 0.2839031219482422, 0.3072284460067749, 0.3305537700653076, 0.35387909412384033, 0.37720441818237305, 0.40052974224090576, 0.4238550662994385, 0.4471803903579712, 0.4705057144165039, 0.4938310384750366, 0.5171563625335693, 0.540481686592102, 0.5638070106506348, 0.5871323347091675, 0.6104576587677002, 0.6337829828262329, 0.6571083068847656, 0.6804336309432983]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 9.0, 8.0, 3.0, 9.0, 13.0, 18.0, 30.0, 51.0, 54.0, 73.0, 118.0, 166.0, 259.0, 494.0, 894.0, 1826.0, 5834.0, 32452.0, 661137.0, 318344.0, 19203.0, 4135.0, 1558.0, 691.0, 396.0, 239.0, 172.0, 97.0, 70.0, 63.0, 59.0, 21.0, 17.0, 17.0, 15.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3037109375, -1.266326904296875, -1.22894287109375, -1.191558837890625, -1.1541748046875, -1.116790771484375, -1.07940673828125, -1.042022705078125, -1.004638671875, -0.967254638671875, -0.92987060546875, -0.892486572265625, -0.8551025390625, -0.817718505859375, -0.78033447265625, -0.742950439453125, -0.70556640625, -0.668182373046875, -0.63079833984375, -0.593414306640625, -0.5560302734375, -0.518646240234375, -0.48126220703125, -0.443878173828125, -0.406494140625, -0.369110107421875, -0.33172607421875, -0.294342041015625, -0.2569580078125, -0.219573974609375, -0.18218994140625, -0.144805908203125, -0.107421875, -0.070037841796875, -0.03265380859375, 0.004730224609375, 0.0421142578125, 0.079498291015625, 0.11688232421875, 0.154266357421875, 0.191650390625, 0.229034423828125, 0.26641845703125, 0.303802490234375, 0.3411865234375, 0.378570556640625, 0.41595458984375, 0.453338623046875, 0.49072265625, 0.528106689453125, 0.56549072265625, 0.602874755859375, 0.6402587890625, 0.677642822265625, 0.71502685546875, 0.752410888671875, 0.789794921875, 0.827178955078125, 0.86456298828125, 0.901947021484375, 0.9393310546875, 0.976715087890625, 1.01409912109375, 1.051483154296875, 1.0888671875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 16.0, 14.0, 42.0, 70.0, 134.0, 202.0, 203.0, 147.0, 84.0, 33.0, 18.0, 10.0, 4.0, 2.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.292724609375, -0.28661632537841797, -0.28050804138183594, -0.2743997573852539, -0.2682914733886719, -0.26218318939208984, -0.2560749053955078, -0.24996662139892578, -0.24385833740234375, -0.23775005340576172, -0.2316417694091797, -0.22553348541259766, -0.21942520141601562, -0.2133169174194336, -0.20720863342285156, -0.20110034942626953, -0.1949920654296875, -0.18888378143310547, -0.18277549743652344, -0.1766672134399414, -0.17055892944335938, -0.16445064544677734, -0.1583423614501953, -0.15223407745361328, -0.14612579345703125, -0.14001750946044922, -0.1339092254638672, -0.12780094146728516, -0.12169265747070312, -0.1155843734741211, -0.10947608947753906, -0.10336780548095703, -0.097259521484375, -0.09115123748779297, -0.08504295349121094, -0.0789346694946289, -0.07282638549804688, -0.06671810150146484, -0.06060981750488281, -0.05450153350830078, -0.04839324951171875, -0.04228496551513672, -0.03617668151855469, -0.030068397521972656, -0.023960113525390625, -0.017851829528808594, -0.011743545532226562, -0.005635261535644531, 0.0004730224609375, 0.006581306457519531, 0.012689590454101562, 0.018797874450683594, 0.024906158447265625, 0.031014442443847656, 0.03712272644042969, 0.04323101043701172, 0.04933929443359375, 0.05544757843017578, 0.06155586242675781, 0.06766414642333984, 0.07377243041992188, 0.0798807144165039, 0.08598899841308594, 0.09209728240966797, 0.09820556640625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 5.0, 3.0, 10.0, 17.0, 20.0, 27.0, 30.0, 52.0, 83.0, 119.0, 214.0, 349.0, 645.0, 1287.0, 2910.0, 7844.0, 29371.0, 163698.0, 588359.0, 202672.0, 35210.0, 9248.0, 3309.0, 1365.0, 718.0, 360.0, 204.0, 144.0, 74.0, 56.0, 38.0, 38.0, 22.0, 17.0, 9.0, 11.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5849609375, -0.5629348754882812, -0.5409088134765625, -0.5188827514648438, -0.496856689453125, -0.47483062744140625, -0.4528045654296875, -0.43077850341796875, -0.40875244140625, -0.38672637939453125, -0.3647003173828125, -0.34267425537109375, -0.320648193359375, -0.29862213134765625, -0.2765960693359375, -0.25457000732421875, -0.2325439453125, -0.21051788330078125, -0.1884918212890625, -0.16646575927734375, -0.144439697265625, -0.12241363525390625, -0.1003875732421875, -0.07836151123046875, -0.05633544921875, -0.03430938720703125, -0.0122833251953125, 0.00974273681640625, 0.031768798828125, 0.05379486083984375, 0.0758209228515625, 0.09784698486328125, 0.119873046875, 0.14189910888671875, 0.1639251708984375, 0.18595123291015625, 0.207977294921875, 0.23000335693359375, 0.2520294189453125, 0.27405548095703125, 0.29608154296875, 0.31810760498046875, 0.3401336669921875, 0.36215972900390625, 0.384185791015625, 0.40621185302734375, 0.4282379150390625, 0.45026397705078125, 0.4722900390625, 0.49431610107421875, 0.5163421630859375, 0.5383682250976562, 0.560394287109375, 0.5824203491210938, 0.6044464111328125, 0.6264724731445312, 0.64849853515625, 0.6705245971679688, 0.6925506591796875, 0.7145767211914062, 0.736602783203125, 0.7586288452148438, 0.7806549072265625, 0.8026809692382812, 0.82470703125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 4.0, 7.0, 10.0, 10.0, 16.0, 13.0, 17.0, 17.0, 22.0, 32.0, 39.0, 30.0, 36.0, 41.0, 49.0, 44.0, 34.0, 36.0, 45.0, 36.0, 36.0, 44.0, 47.0, 35.0, 28.0, 35.0, 33.0, 28.0, 18.0, 14.0, 26.0, 15.0, 19.0, 21.0, 12.0, 11.0, 11.0, 7.0, 2.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38427734375, -0.37104034423828125, -0.3578033447265625, -0.34456634521484375, -0.331329345703125, -0.31809234619140625, -0.3048553466796875, -0.29161834716796875, -0.27838134765625, -0.26514434814453125, -0.2519073486328125, -0.23867034912109375, -0.225433349609375, -0.21219635009765625, -0.1989593505859375, -0.18572235107421875, -0.1724853515625, -0.15924835205078125, -0.1460113525390625, -0.13277435302734375, -0.119537353515625, -0.10630035400390625, -0.0930633544921875, -0.07982635498046875, -0.06658935546875, -0.05335235595703125, -0.0401153564453125, -0.02687835693359375, -0.013641357421875, -0.00040435791015625, 0.0128326416015625, 0.02606964111328125, 0.039306640625, 0.05254364013671875, 0.0657806396484375, 0.07901763916015625, 0.092254638671875, 0.10549163818359375, 0.1187286376953125, 0.13196563720703125, 0.14520263671875, 0.15843963623046875, 0.1716766357421875, 0.18491363525390625, 0.198150634765625, 0.21138763427734375, 0.2246246337890625, 0.23786163330078125, 0.2510986328125, 0.26433563232421875, 0.2775726318359375, 0.29080963134765625, 0.304046630859375, 0.31728363037109375, 0.3305206298828125, 0.34375762939453125, 0.35699462890625, 0.37023162841796875, 0.3834686279296875, 0.39670562744140625, 0.409942626953125, 0.42317962646484375, 0.4364166259765625, 0.44965362548828125, 0.462890625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 10.0, 11.0, 18.0, 29.0, 40.0, 78.0, 118.0, 171.0, 412.0, 1033.0, 3190.0, 14557.0, 158774.0, 813243.0, 46541.0, 7047.0, 1902.0, 707.0, 315.0, 137.0, 81.0, 45.0, 18.0, 14.0, 18.0, 11.0, 9.0, 2.0, 7.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8359375, -0.810821533203125, -0.78570556640625, -0.760589599609375, -0.7354736328125, -0.710357666015625, -0.68524169921875, -0.660125732421875, -0.635009765625, -0.609893798828125, -0.58477783203125, -0.559661865234375, -0.5345458984375, -0.509429931640625, -0.48431396484375, -0.459197998046875, -0.43408203125, -0.408966064453125, -0.38385009765625, -0.358734130859375, -0.3336181640625, -0.308502197265625, -0.28338623046875, -0.258270263671875, -0.233154296875, -0.208038330078125, -0.18292236328125, -0.157806396484375, -0.1326904296875, -0.107574462890625, -0.08245849609375, -0.057342529296875, -0.0322265625, -0.007110595703125, 0.01800537109375, 0.043121337890625, 0.0682373046875, 0.093353271484375, 0.11846923828125, 0.143585205078125, 0.168701171875, 0.193817138671875, 0.21893310546875, 0.244049072265625, 0.2691650390625, 0.294281005859375, 0.31939697265625, 0.344512939453125, 0.36962890625, 0.394744873046875, 0.41986083984375, 0.444976806640625, 0.4700927734375, 0.495208740234375, 0.52032470703125, 0.545440673828125, 0.570556640625, 0.595672607421875, 0.62078857421875, 0.645904541015625, 0.6710205078125, 0.696136474609375, 0.72125244140625, 0.746368408203125, 0.771484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 6.0, 6.0, 15.0, 18.0, 24.0, 30.0, 38.0, 49.0, 56.0, 73.0, 105.0, 164.0, 106.0, 73.0, 61.0, 48.0, 32.0, 26.0, 17.0, 15.0, 5.0, 9.0, 6.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001996755599975586, -0.00019390136003494263, -0.00018812716007232666, -0.0001823529601097107, -0.00017657876014709473, -0.00017080456018447876, -0.0001650303602218628, -0.00015925616025924683, -0.00015348196029663086, -0.0001477077603340149, -0.00014193356037139893, -0.00013615936040878296, -0.000130385160446167, -0.00012461096048355103, -0.00011883676052093506, -0.00011306256055831909, -0.00010728836059570312, -0.00010151416063308716, -9.573996067047119e-05, -8.996576070785522e-05, -8.419156074523926e-05, -7.841736078262329e-05, -7.264316082000732e-05, -6.686896085739136e-05, -6.109476089477539e-05, -5.5320560932159424e-05, -4.954636096954346e-05, -4.377216100692749e-05, -3.7997961044311523e-05, -3.222376108169556e-05, -2.644956111907959e-05, -2.0675361156463623e-05, -1.4901161193847656e-05, -9.12696123123169e-06, -3.3527612686157227e-06, 2.421438694000244e-06, 8.195638656616211e-06, 1.3969838619232178e-05, 1.9744038581848145e-05, 2.551823854446411e-05, 3.129243850708008e-05, 3.7066638469696045e-05, 4.284083843231201e-05, 4.861503839492798e-05, 5.4389238357543945e-05, 6.016343832015991e-05, 6.593763828277588e-05, 7.171183824539185e-05, 7.748603820800781e-05, 8.326023817062378e-05, 8.903443813323975e-05, 9.480863809585571e-05, 0.00010058283805847168, 0.00010635703802108765, 0.00011213123798370361, 0.00011790543794631958, 0.00012367963790893555, 0.00012945383787155151, 0.00013522803783416748, 0.00014100223779678345, 0.00014677643775939941, 0.00015255063772201538, 0.00015832483768463135, 0.00016409903764724731, 0.00016987323760986328]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 6.0, 8.0, 13.0, 24.0, 33.0, 55.0, 91.0, 173.0, 342.0, 843.0, 2669.0, 11886.0, 125395.0, 844874.0, 52248.0, 6870.0, 1746.0, 622.0, 283.0, 128.0, 90.0, 47.0, 29.0, 18.0, 21.0, 7.0, 7.0, 1.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95361328125, -0.9199752807617188, -0.8863372802734375, -0.8526992797851562, -0.819061279296875, -0.7854232788085938, -0.7517852783203125, -0.7181472778320312, -0.68450927734375, -0.6508712768554688, -0.6172332763671875, -0.5835952758789062, -0.549957275390625, -0.5163192749023438, -0.4826812744140625, -0.44904327392578125, -0.4154052734375, -0.38176727294921875, -0.3481292724609375, -0.31449127197265625, -0.280853271484375, -0.24721527099609375, -0.2135772705078125, -0.17993927001953125, -0.14630126953125, -0.11266326904296875, -0.0790252685546875, -0.04538726806640625, -0.011749267578125, 0.02188873291015625, 0.0555267333984375, 0.08916473388671875, 0.122802734375, 0.15644073486328125, 0.1900787353515625, 0.22371673583984375, 0.257354736328125, 0.29099273681640625, 0.3246307373046875, 0.35826873779296875, 0.39190673828125, 0.42554473876953125, 0.4591827392578125, 0.49282073974609375, 0.526458740234375, 0.5600967407226562, 0.5937347412109375, 0.6273727416992188, 0.6610107421875, 0.6946487426757812, 0.7282867431640625, 0.7619247436523438, 0.795562744140625, 0.8292007446289062, 0.8628387451171875, 0.8964767456054688, 0.93011474609375, 0.9637527465820312, 0.9973907470703125, 1.0310287475585938, 1.064666748046875, 1.0983047485351562, 1.1319427490234375, 1.1655807495117188, 1.19921875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 6.0, 5.0, 8.0, 14.0, 14.0, 20.0, 24.0, 25.0, 44.0, 50.0, 82.0, 120.0, 134.0, 127.0, 92.0, 60.0, 47.0, 37.0, 23.0, 22.0, 12.0, 11.0, 9.0, 7.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6318359375, -0.6089630126953125, -0.586090087890625, -0.5632171630859375, -0.54034423828125, -0.5174713134765625, -0.494598388671875, -0.4717254638671875, -0.4488525390625, -0.4259796142578125, -0.403106689453125, -0.3802337646484375, -0.35736083984375, -0.3344879150390625, -0.311614990234375, -0.2887420654296875, -0.265869140625, -0.2429962158203125, -0.220123291015625, -0.1972503662109375, -0.17437744140625, -0.1515045166015625, -0.128631591796875, -0.1057586669921875, -0.0828857421875, -0.0600128173828125, -0.037139892578125, -0.0142669677734375, 0.00860595703125, 0.0314788818359375, 0.054351806640625, 0.0772247314453125, 0.10009765625, 0.1229705810546875, 0.145843505859375, 0.1687164306640625, 0.19158935546875, 0.2144622802734375, 0.237335205078125, 0.2602081298828125, 0.2830810546875, 0.3059539794921875, 0.328826904296875, 0.3516998291015625, 0.37457275390625, 0.3974456787109375, 0.420318603515625, 0.4431915283203125, 0.466064453125, 0.4889373779296875, 0.511810302734375, 0.5346832275390625, 0.55755615234375, 0.5804290771484375, 0.603302001953125, 0.6261749267578125, 0.6490478515625, 0.6719207763671875, 0.694793701171875, 0.7176666259765625, 0.74053955078125, 0.7634124755859375, 0.786285400390625, 0.8091583251953125, 0.83203125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 25.0, 142.0, 632.0, 169.0, 14.0, 16.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.485965728759766, -27.90035057067871, -27.314735412597656, -26.729122161865234, -26.14350700378418, -25.557891845703125, -24.972278594970703, -24.38666343688965, -23.801048278808594, -23.21543312072754, -22.629817962646484, -22.044204711914062, -21.458589553833008, -20.872974395751953, -20.28736114501953, -19.701745986938477, -19.116130828857422, -18.530515670776367, -17.944900512695312, -17.35928726196289, -16.773672103881836, -16.18805694580078, -15.602442741394043, -15.016828536987305, -14.43121337890625, -13.845598220825195, -13.259984016418457, -12.674369812011719, -12.088754653930664, -11.50313949584961, -10.917525291442871, -10.331911087036133, -9.746297836303711, -9.160682678222656, -8.575068473815918, -7.9894537925720215, -7.403839111328125, -6.8182244300842285, -6.232609748840332, -5.6469950675964355, -5.061380386352539, -4.475765705108643, -3.890151023864746, -3.3045363426208496, -2.718921661376953, -2.1333069801330566, -1.5476922988891602, -0.9620776176452637, -0.3764629364013672, 0.2091517448425293, 0.7947664260864258, 1.3803811073303223, 1.9659957885742188, 2.5516104698181152, 3.1372251510620117, 3.722839832305908, 4.308454513549805, 4.894069194793701, 5.479683876037598, 6.065298557281494, 6.650913238525391, 7.236527919769287, 7.822142601013184, 8.407756805419922, 8.993371963500977]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 5.0, 5.0, 9.0, 20.0, 15.0, 20.0, 17.0, 47.0, 23.0, 35.0, 30.0, 38.0, 45.0, 43.0, 61.0, 55.0, 67.0, 52.0, 55.0, 47.0, 42.0, 38.0, 33.0, 35.0, 34.0, 28.0, 22.0, 17.0, 9.0, 10.0, 16.0, 6.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-4.420712947845459, -4.3009161949157715, -4.181119441986084, -4.0613226890563965, -3.941525936126709, -3.8217291831970215, -3.701932430267334, -3.5821356773376465, -3.462338924407959, -3.3425421714782715, -3.222745418548584, -3.1029486656188965, -2.983151912689209, -2.8633551597595215, -2.743558406829834, -2.6237616539001465, -2.503964900970459, -2.3841681480407715, -2.264371395111084, -2.1445746421813965, -2.024777889251709, -1.9049811363220215, -1.785184383392334, -1.6653876304626465, -1.545590877532959, -1.4257941246032715, -1.305997371673584, -1.1862006187438965, -1.066403865814209, -0.9466071128845215, -0.826810359954834, -0.7070136070251465, -0.587216854095459, -0.4674201011657715, -0.347623348236084, -0.22782659530639648, -0.10802984237670898, 0.011766910552978516, 0.13156366348266602, 0.2513604164123535, 0.371157169342041, 0.4909539222717285, 0.610750675201416, 0.7305474281311035, 0.850344181060791, 0.9701409339904785, 1.089937686920166, 1.2097344398498535, 1.329531192779541, 1.4493279457092285, 1.569124698638916, 1.6889214515686035, 1.808718204498291, 1.9285149574279785, 2.048311710357666, 2.1681084632873535, 2.287905216217041, 2.4077019691467285, 2.527498722076416, 2.6472954750061035, 2.767092227935791, 2.8868889808654785, 3.006685733795166, 3.1264824867248535, 3.246279239654541]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 1.0, 3.0, 3.0, 6.0, 5.0, 5.0, 9.0, 7.0, 7.0, 25.0, 24.0, 25.0, 38.0, 43.0, 69.0, 83.0, 95.0, 205.0, 371.0, 649.0, 1354.0, 3273.0, 12811.0, 255788.0, 3888839.0, 23337.0, 4415.0, 1503.0, 616.0, 295.0, 157.0, 83.0, 52.0, 27.0, 20.0, 9.0, 13.0, 9.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.8974609375, -1.8544921875, -1.8115234375, -1.7685546875, -1.7255859375, -1.6826171875, -1.6396484375, -1.5966796875, -1.5537109375, -1.5107421875, -1.4677734375, -1.4248046875, -1.3818359375, -1.3388671875, -1.2958984375, -1.2529296875, -1.2099609375, -1.1669921875, -1.1240234375, -1.0810546875, -1.0380859375, -0.9951171875, -0.9521484375, -0.9091796875, -0.8662109375, -0.8232421875, -0.7802734375, -0.7373046875, -0.6943359375, -0.6513671875, -0.6083984375, -0.5654296875, -0.5224609375, -0.4794921875, -0.4365234375, -0.3935546875, -0.3505859375, -0.3076171875, -0.2646484375, -0.2216796875, -0.1787109375, -0.1357421875, -0.0927734375, -0.0498046875, -0.0068359375, 0.0361328125, 0.0791015625, 0.1220703125, 0.1650390625, 0.2080078125, 0.2509765625, 0.2939453125, 0.3369140625, 0.3798828125, 0.4228515625, 0.4658203125, 0.5087890625, 0.5517578125, 0.5947265625, 0.6376953125, 0.6806640625, 0.7236328125, 0.7666015625, 0.8095703125, 0.8525390625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 7.0, 15.0, 25.0, 38.0, 72.0, 98.0, 138.0, 143.0, 142.0, 125.0, 72.0, 50.0, 29.0, 13.0, 7.0, 10.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0], "bins": [-0.27978515625, -0.2738943099975586, -0.2680034637451172, -0.2621126174926758, -0.2562217712402344, -0.25033092498779297, -0.24444007873535156, -0.23854923248291016, -0.23265838623046875, -0.22676753997802734, -0.22087669372558594, -0.21498584747314453, -0.20909500122070312, -0.20320415496826172, -0.1973133087158203, -0.1914224624633789, -0.1855316162109375, -0.1796407699584961, -0.1737499237060547, -0.16785907745361328, -0.16196823120117188, -0.15607738494873047, -0.15018653869628906, -0.14429569244384766, -0.13840484619140625, -0.13251399993896484, -0.12662315368652344, -0.12073230743408203, -0.11484146118164062, -0.10895061492919922, -0.10305976867675781, -0.0971689224243164, -0.091278076171875, -0.0853872299194336, -0.07949638366699219, -0.07360553741455078, -0.06771469116210938, -0.06182384490966797, -0.05593299865722656, -0.050042152404785156, -0.04415130615234375, -0.038260459899902344, -0.03236961364746094, -0.02647876739501953, -0.020587921142578125, -0.014697074890136719, -0.008806228637695312, -0.0029153823852539062, 0.0029754638671875, 0.008866310119628906, 0.014757156372070312, 0.02064800262451172, 0.026538848876953125, 0.03242969512939453, 0.03832054138183594, 0.044211387634277344, 0.05010223388671875, 0.055993080139160156, 0.06188392639160156, 0.06777477264404297, 0.07366561889648438, 0.07955646514892578, 0.08544731140136719, 0.0913381576538086, 0.09722900390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 1.0, 5.0, 3.0, 10.0, 12.0, 16.0, 33.0, 47.0, 89.0, 168.0, 363.0, 806.0, 2119.0, 7246.0, 41005.0, 3817428.0, 302189.0, 16878.0, 3689.0, 1257.0, 453.0, 216.0, 108.0, 52.0, 26.0, 14.0, 17.0, 6.0, 5.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2236328125, -1.1903762817382812, -1.1571197509765625, -1.1238632202148438, -1.090606689453125, -1.0573501586914062, -1.0240936279296875, -0.9908370971679688, -0.95758056640625, -0.9243240356445312, -0.8910675048828125, -0.8578109741210938, -0.824554443359375, -0.7912979125976562, -0.7580413818359375, -0.7247848510742188, -0.6915283203125, -0.6582717895507812, -0.6250152587890625, -0.5917587280273438, -0.558502197265625, -0.5252456665039062, -0.4919891357421875, -0.45873260498046875, -0.42547607421875, -0.39221954345703125, -0.3589630126953125, -0.32570648193359375, -0.292449951171875, -0.25919342041015625, -0.2259368896484375, -0.19268035888671875, -0.159423828125, -0.12616729736328125, -0.0929107666015625, -0.05965423583984375, -0.026397705078125, 0.00685882568359375, 0.0401153564453125, 0.07337188720703125, 0.10662841796875, 0.13988494873046875, 0.1731414794921875, 0.20639801025390625, 0.239654541015625, 0.27291107177734375, 0.3061676025390625, 0.33942413330078125, 0.3726806640625, 0.40593719482421875, 0.4391937255859375, 0.47245025634765625, 0.505706787109375, 0.5389633178710938, 0.5722198486328125, 0.6054763793945312, 0.63873291015625, 0.6719894409179688, 0.7052459716796875, 0.7385025024414062, 0.771759033203125, 0.8050155639648438, 0.8382720947265625, 0.8715286254882812, 0.90478515625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 10.0, 10.0, 7.0, 18.0, 20.0, 42.0, 53.0, 130.0, 264.0, 1091.0, 1706.0, 388.0, 156.0, 58.0, 47.0, 23.0, 7.0, 12.0, 4.0, 4.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.22412109375, -0.21713638305664062, -0.21015167236328125, -0.20316696166992188, -0.1961822509765625, -0.18919754028320312, -0.18221282958984375, -0.17522811889648438, -0.168243408203125, -0.16125869750976562, -0.15427398681640625, -0.14728927612304688, -0.1403045654296875, -0.13331985473632812, -0.12633514404296875, -0.11935043334960938, -0.11236572265625, -0.10538101196289062, -0.09839630126953125, -0.09141159057617188, -0.0844268798828125, -0.07744216918945312, -0.07045745849609375, -0.06347274780273438, -0.056488037109375, -0.049503326416015625, -0.04251861572265625, -0.035533905029296875, -0.0285491943359375, -0.021564483642578125, -0.01457977294921875, -0.007595062255859375, -0.0006103515625, 0.006374359130859375, 0.01335906982421875, 0.020343780517578125, 0.0273284912109375, 0.034313201904296875, 0.04129791259765625, 0.048282623291015625, 0.055267333984375, 0.062252044677734375, 0.06923675537109375, 0.07622146606445312, 0.0832061767578125, 0.09019088745117188, 0.09717559814453125, 0.10416030883789062, 0.11114501953125, 0.11812973022460938, 0.12511444091796875, 0.13209915161132812, 0.1390838623046875, 0.14606857299804688, 0.15305328369140625, 0.16003799438476562, 0.167022705078125, 0.17400741577148438, 0.18099212646484375, 0.18797683715820312, 0.1949615478515625, 0.20194625854492188, 0.20893096923828125, 0.21591567993164062, 0.222900390625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 11.0, 17.0, 33.0, 131.0, 292.0, 364.0, 118.0, 32.0, 4.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6790753602981567, -1.6150943040847778, -1.551113247871399, -1.4871323108673096, -1.4231512546539307, -1.3591701984405518, -1.2951891422271729, -1.231208086013794, -1.167227029800415, -1.1032459735870361, -1.0392649173736572, -0.9752839207649231, -0.911302924156189, -0.8473218679428101, -0.7833408117294312, -0.7193597555160522, -0.6553788185119629, -0.591397762298584, -0.5274167656898499, -0.46343570947647095, -0.39945468306541443, -0.3354736566543579, -0.271492600440979, -0.20751157402992249, -0.14353054761886597, -0.07954951375722885, -0.015568479895591736, 0.04841256141662598, 0.1123935878276825, 0.176374614238739, 0.24035567045211792, 0.30433669686317444, 0.3683178424835205, 0.432298868894577, 0.49627989530563354, 0.5602609515190125, 0.6242419481277466, 0.6882230043411255, 0.7522040605545044, 0.8161851167678833, 0.8801661133766174, 0.9441471695899963, 1.0081281661987305, 1.0721092224121094, 1.1360902786254883, 1.2000713348388672, 1.264052391052246, 1.3280333280563354, 1.3920143842697144, 1.4559954404830933, 1.5199764966964722, 1.5839574337005615, 1.6479384899139404, 1.7119195461273193, 1.7759006023406982, 1.8398816585540771, 1.903862714767456, 1.967843770980835, 2.031824827194214, 2.0958058834075928, 2.1597869396209717, 2.2237677574157715, 2.2877488136291504, 2.3517298698425293, 2.415710926055908]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 16.0, 7.0, 9.0, 19.0, 23.0, 28.0, 19.0, 36.0, 35.0, 55.0, 47.0, 60.0, 53.0, 63.0, 61.0, 75.0, 61.0, 59.0, 63.0, 38.0, 34.0, 21.0, 22.0, 22.0, 23.0, 12.0, 8.0, 9.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6316056847572327, -0.6094751358032227, -0.5873446464538574, -0.5652140974998474, -0.5430835485458374, -0.5209530591964722, -0.49882251024246216, -0.47669199109077454, -0.4545614719390869, -0.4324309527873993, -0.41030043363571167, -0.38816988468170166, -0.36603936553001404, -0.3439088463783264, -0.3217782974243164, -0.2996477782726288, -0.27751725912094116, -0.25538673996925354, -0.23325620591640472, -0.2111256718635559, -0.1889951527118683, -0.16686463356018066, -0.14473409950733185, -0.12260356545448303, -0.10047304630279541, -0.07834251970052719, -0.05621199309825897, -0.03408146649599075, -0.011950939893722534, 0.010179586708545685, 0.032310113310813904, 0.05444064736366272, 0.07657116651535034, 0.09870169311761856, 0.12083221971988678, 0.1429627537727356, 0.16509327292442322, 0.18722379207611084, 0.20935432612895966, 0.23148486018180847, 0.2536153793334961, 0.2757458984851837, 0.29787641763687134, 0.32000696659088135, 0.34213748574256897, 0.3642680048942566, 0.3863985538482666, 0.4085290729999542, 0.43065959215164185, 0.45279011130332947, 0.4749206304550171, 0.4970511794090271, 0.5191817283630371, 0.5413122177124023, 0.5634427666664124, 0.5855733156204224, 0.6077038049697876, 0.6298343539237976, 0.6519648432731628, 0.6740953922271729, 0.6962258815765381, 0.7183564305305481, 0.7404869794845581, 0.7626174688339233, 0.7847480177879333]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 9.0, 3.0, 12.0, 15.0, 13.0, 25.0, 34.0, 43.0, 44.0, 73.0, 79.0, 136.0, 170.0, 269.0, 472.0, 818.0, 1583.0, 3998.0, 15649.0, 165296.0, 743042.0, 98501.0, 11422.0, 3321.0, 1386.0, 780.0, 434.0, 288.0, 194.0, 135.0, 83.0, 68.0, 35.0, 35.0, 15.0, 16.0, 23.0, 10.0, 6.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.703125, -0.6792144775390625, -0.655303955078125, -0.6313934326171875, -0.60748291015625, -0.5835723876953125, -0.559661865234375, -0.5357513427734375, -0.5118408203125, -0.4879302978515625, -0.464019775390625, -0.4401092529296875, -0.41619873046875, -0.3922882080078125, -0.368377685546875, -0.3444671630859375, -0.320556640625, -0.2966461181640625, -0.272735595703125, -0.2488250732421875, -0.22491455078125, -0.2010040283203125, -0.177093505859375, -0.1531829833984375, -0.1292724609375, -0.1053619384765625, -0.081451416015625, -0.0575408935546875, -0.03363037109375, -0.0097198486328125, 0.014190673828125, 0.0381011962890625, 0.06201171875, 0.0859222412109375, 0.109832763671875, 0.1337432861328125, 0.15765380859375, 0.1815643310546875, 0.205474853515625, 0.2293853759765625, 0.2532958984375, 0.2772064208984375, 0.301116943359375, 0.3250274658203125, 0.34893798828125, 0.3728485107421875, 0.396759033203125, 0.4206695556640625, 0.444580078125, 0.4684906005859375, 0.492401123046875, 0.5163116455078125, 0.54022216796875, 0.5641326904296875, 0.588043212890625, 0.6119537353515625, 0.6358642578125, 0.6597747802734375, 0.683685302734375, 0.7075958251953125, 0.73150634765625, 0.7554168701171875, 0.779327392578125, 0.8032379150390625, 0.8271484375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 1.0, 2.0, 5.0, 12.0, 13.0, 25.0, 59.0, 79.0, 123.0, 131.0, 144.0, 146.0, 93.0, 68.0, 39.0, 24.0, 9.0, 8.0, 8.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.25830078125, -0.2527008056640625, -0.247100830078125, -0.2415008544921875, -0.23590087890625, -0.2303009033203125, -0.224700927734375, -0.2191009521484375, -0.2135009765625, -0.2079010009765625, -0.202301025390625, -0.1967010498046875, -0.19110107421875, -0.1855010986328125, -0.179901123046875, -0.1743011474609375, -0.168701171875, -0.1631011962890625, -0.157501220703125, -0.1519012451171875, -0.14630126953125, -0.1407012939453125, -0.135101318359375, -0.1295013427734375, -0.1239013671875, -0.1183013916015625, -0.112701416015625, -0.1071014404296875, -0.10150146484375, -0.0959014892578125, -0.090301513671875, -0.0847015380859375, -0.0791015625, -0.0735015869140625, -0.067901611328125, -0.0623016357421875, -0.05670166015625, -0.0511016845703125, -0.045501708984375, -0.0399017333984375, -0.0343017578125, -0.0287017822265625, -0.023101806640625, -0.0175018310546875, -0.01190185546875, -0.0063018798828125, -0.000701904296875, 0.0048980712890625, 0.010498046875, 0.0160980224609375, 0.021697998046875, 0.0272979736328125, 0.03289794921875, 0.0384979248046875, 0.044097900390625, 0.0496978759765625, 0.0552978515625, 0.0608978271484375, 0.066497802734375, 0.0720977783203125, 0.07769775390625, 0.0832977294921875, 0.088897705078125, 0.0944976806640625, 0.10009765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 14.0, 11.0, 16.0, 23.0, 29.0, 51.0, 68.0, 127.0, 178.0, 276.0, 460.0, 815.0, 1759.0, 3831.0, 10175.0, 31803.0, 121149.0, 420985.0, 334006.0, 85202.0, 23198.0, 7898.0, 3143.0, 1474.0, 720.0, 382.0, 256.0, 145.0, 101.0, 70.0, 67.0, 34.0, 23.0, 16.0, 12.0, 5.0, 12.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.486328125, -0.47153472900390625, -0.4567413330078125, -0.44194793701171875, -0.427154541015625, -0.41236114501953125, -0.3975677490234375, -0.38277435302734375, -0.36798095703125, -0.35318756103515625, -0.3383941650390625, -0.32360076904296875, -0.308807373046875, -0.29401397705078125, -0.2792205810546875, -0.26442718505859375, -0.2496337890625, -0.23484039306640625, -0.2200469970703125, -0.20525360107421875, -0.190460205078125, -0.17566680908203125, -0.1608734130859375, -0.14608001708984375, -0.13128662109375, -0.11649322509765625, -0.1016998291015625, -0.08690643310546875, -0.072113037109375, -0.05731964111328125, -0.0425262451171875, -0.02773284912109375, -0.012939453125, 0.00185394287109375, 0.0166473388671875, 0.03144073486328125, 0.046234130859375, 0.06102752685546875, 0.0758209228515625, 0.09061431884765625, 0.10540771484375, 0.12020111083984375, 0.1349945068359375, 0.14978790283203125, 0.164581298828125, 0.17937469482421875, 0.1941680908203125, 0.20896148681640625, 0.2237548828125, 0.23854827880859375, 0.2533416748046875, 0.26813507080078125, 0.282928466796875, 0.29772186279296875, 0.3125152587890625, 0.32730865478515625, 0.34210205078125, 0.35689544677734375, 0.3716888427734375, 0.38648223876953125, 0.401275634765625, 0.41606903076171875, 0.4308624267578125, 0.44565582275390625, 0.46044921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 3.0, 4.0, 5.0, 6.0, 4.0, 12.0, 18.0, 15.0, 24.0, 24.0, 14.0, 33.0, 26.0, 29.0, 45.0, 32.0, 36.0, 31.0, 58.0, 39.0, 47.0, 43.0, 35.0, 35.0, 52.0, 42.0, 45.0, 24.0, 32.0, 27.0, 26.0, 22.0, 19.0, 18.0, 14.0, 13.0, 8.0, 9.0, 5.0, 11.0, 3.0, 6.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.381591796875, -0.3689002990722656, -0.35620880126953125, -0.3435173034667969, -0.3308258056640625, -0.3181343078613281, -0.30544281005859375, -0.2927513122558594, -0.280059814453125, -0.2673683166503906, -0.25467681884765625, -0.24198532104492188, -0.2292938232421875, -0.21660232543945312, -0.20391082763671875, -0.19121932983398438, -0.17852783203125, -0.16583633422851562, -0.15314483642578125, -0.14045333862304688, -0.1277618408203125, -0.11507034301757812, -0.10237884521484375, -0.08968734741210938, -0.076995849609375, -0.06430435180664062, -0.05161285400390625, -0.038921356201171875, -0.0262298583984375, -0.013538360595703125, -0.00084686279296875, 0.011844635009765625, 0.0245361328125, 0.037227630615234375, 0.04991912841796875, 0.06261062622070312, 0.0753021240234375, 0.08799362182617188, 0.10068511962890625, 0.11337661743164062, 0.126068115234375, 0.13875961303710938, 0.15145111083984375, 0.16414260864257812, 0.1768341064453125, 0.18952560424804688, 0.20221710205078125, 0.21490859985351562, 0.22760009765625, 0.24029159545898438, 0.25298309326171875, 0.2656745910644531, 0.2783660888671875, 0.2910575866699219, 0.30374908447265625, 0.3164405822753906, 0.329132080078125, 0.3418235778808594, 0.35451507568359375, 0.3672065734863281, 0.3798980712890625, 0.3925895690917969, 0.40528106689453125, 0.4179725646972656, 0.4306640625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 6.0, 8.0, 13.0, 21.0, 23.0, 31.0, 54.0, 94.0, 142.0, 207.0, 332.0, 573.0, 1080.0, 2271.0, 5845.0, 20521.0, 136193.0, 719391.0, 130907.0, 20248.0, 5769.0, 2302.0, 1068.0, 548.0, 300.0, 187.0, 116.0, 80.0, 74.0, 32.0, 38.0, 21.0, 10.0, 8.0, 7.0, 6.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.271484375, -0.26258087158203125, -0.2536773681640625, -0.24477386474609375, -0.235870361328125, -0.22696685791015625, -0.2180633544921875, -0.20915985107421875, -0.20025634765625, -0.19135284423828125, -0.1824493408203125, -0.17354583740234375, -0.164642333984375, -0.15573883056640625, -0.1468353271484375, -0.13793182373046875, -0.1290283203125, -0.12012481689453125, -0.1112213134765625, -0.10231781005859375, -0.093414306640625, -0.08451080322265625, -0.0756072998046875, -0.06670379638671875, -0.05780029296875, -0.04889678955078125, -0.0399932861328125, -0.03108978271484375, -0.022186279296875, -0.01328277587890625, -0.0043792724609375, 0.00452423095703125, 0.013427734375, 0.02233123779296875, 0.0312347412109375, 0.04013824462890625, 0.049041748046875, 0.05794525146484375, 0.0668487548828125, 0.07575225830078125, 0.08465576171875, 0.09355926513671875, 0.1024627685546875, 0.11136627197265625, 0.120269775390625, 0.12917327880859375, 0.1380767822265625, 0.14698028564453125, 0.1558837890625, 0.16478729248046875, 0.1736907958984375, 0.18259429931640625, 0.191497802734375, 0.20040130615234375, 0.2093048095703125, 0.21820831298828125, 0.22711181640625, 0.23601531982421875, 0.2449188232421875, 0.25382232666015625, 0.262725830078125, 0.27162933349609375, 0.2805328369140625, 0.28943634033203125, 0.29833984375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 7.0, 4.0, 8.0, 7.0, 11.0, 15.0, 12.0, 15.0, 23.0, 26.0, 21.0, 28.0, 29.0, 43.0, 54.0, 57.0, 92.0, 106.0, 84.0, 66.0, 51.0, 46.0, 27.0, 31.0, 28.0, 14.0, 17.0, 11.0, 18.0, 6.0, 12.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.565187454223633e-05, -8.27442854642868e-05, -7.983669638633728e-05, -7.692910730838776e-05, -7.402151823043823e-05, -7.111392915248871e-05, -6.820634007453918e-05, -6.529875099658966e-05, -6.239116191864014e-05, -5.948357284069061e-05, -5.657598376274109e-05, -5.3668394684791565e-05, -5.076080560684204e-05, -4.785321652889252e-05, -4.494562745094299e-05, -4.203803837299347e-05, -3.9130449295043945e-05, -3.622286021709442e-05, -3.33152711391449e-05, -3.0407682061195374e-05, -2.750009298324585e-05, -2.4592503905296326e-05, -2.1684914827346802e-05, -1.8777325749397278e-05, -1.5869736671447754e-05, -1.296214759349823e-05, -1.0054558515548706e-05, -7.146969437599182e-06, -4.239380359649658e-06, -1.3317912817001343e-06, 1.5757977962493896e-06, 4.4833868741989136e-06, 7.3909759521484375e-06, 1.0298565030097961e-05, 1.3206154108047485e-05, 1.611374318599701e-05, 1.9021332263946533e-05, 2.1928921341896057e-05, 2.483651041984558e-05, 2.7744099497795105e-05, 3.065168857574463e-05, 3.355927765369415e-05, 3.646686673164368e-05, 3.93744558095932e-05, 4.2282044887542725e-05, 4.518963396549225e-05, 4.809722304344177e-05, 5.1004812121391296e-05, 5.391240119934082e-05, 5.6819990277290344e-05, 5.972757935523987e-05, 6.263516843318939e-05, 6.554275751113892e-05, 6.845034658908844e-05, 7.135793566703796e-05, 7.426552474498749e-05, 7.717311382293701e-05, 8.008070290088654e-05, 8.298829197883606e-05, 8.589588105678558e-05, 8.880347013473511e-05, 9.171105921268463e-05, 9.461864829063416e-05, 9.752623736858368e-05, 0.0001004338264465332]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 20.0, 17.0, 30.0, 34.0, 100.0, 160.0, 330.0, 785.0, 2352.0, 9346.0, 69983.0, 787353.0, 157216.0, 15555.0, 3328.0, 1096.0, 413.0, 179.0, 102.0, 52.0, 33.0, 19.0, 8.0, 8.0, 5.0, 4.0, 5.0, 2.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.422607421875, -0.4083518981933594, -0.39409637451171875, -0.3798408508300781, -0.3655853271484375, -0.3513298034667969, -0.33707427978515625, -0.3228187561035156, -0.308563232421875, -0.2943077087402344, -0.28005218505859375, -0.2657966613769531, -0.2515411376953125, -0.23728561401367188, -0.22303009033203125, -0.20877456665039062, -0.19451904296875, -0.18026351928710938, -0.16600799560546875, -0.15175247192382812, -0.1374969482421875, -0.12324142456054688, -0.10898590087890625, -0.09473037719726562, -0.080474853515625, -0.06621932983398438, -0.05196380615234375, -0.037708282470703125, -0.0234527587890625, -0.009197235107421875, 0.00505828857421875, 0.019313812255859375, 0.0335693359375, 0.047824859619140625, 0.06208038330078125, 0.07633590698242188, 0.0905914306640625, 0.10484695434570312, 0.11910247802734375, 0.13335800170898438, 0.147613525390625, 0.16186904907226562, 0.17612457275390625, 0.19038009643554688, 0.2046356201171875, 0.21889114379882812, 0.23314666748046875, 0.24740219116210938, 0.26165771484375, 0.2759132385253906, 0.29016876220703125, 0.3044242858886719, 0.3186798095703125, 0.3329353332519531, 0.34719085693359375, 0.3614463806152344, 0.375701904296875, 0.3899574279785156, 0.40421295166015625, 0.4184684753417969, 0.4327239990234375, 0.4469795227050781, 0.46123504638671875, 0.4754905700683594, 0.48974609375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 8.0, 12.0, 11.0, 8.0, 12.0, 28.0, 23.0, 33.0, 39.0, 52.0, 64.0, 86.0, 98.0, 96.0, 99.0, 81.0, 52.0, 50.0, 25.0, 22.0, 26.0, 19.0, 12.0, 8.0, 8.0, 4.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2491455078125, -0.2399768829345703, -0.23080825805664062, -0.22163963317871094, -0.21247100830078125, -0.20330238342285156, -0.19413375854492188, -0.1849651336669922, -0.1757965087890625, -0.1666278839111328, -0.15745925903320312, -0.14829063415527344, -0.13912200927734375, -0.12995338439941406, -0.12078475952148438, -0.11161613464355469, -0.102447509765625, -0.09327888488769531, -0.08411026000976562, -0.07494163513183594, -0.06577301025390625, -0.05660438537597656, -0.047435760498046875, -0.03826713562011719, -0.0290985107421875, -0.019929885864257812, -0.010761260986328125, -0.0015926361083984375, 0.00757598876953125, 0.016744613647460938, 0.025913238525390625, 0.03508186340332031, 0.04425048828125, 0.05341911315917969, 0.06258773803710938, 0.07175636291503906, 0.08092498779296875, 0.09009361267089844, 0.09926223754882812, 0.10843086242675781, 0.1175994873046875, 0.1267681121826172, 0.13593673706054688, 0.14510536193847656, 0.15427398681640625, 0.16344261169433594, 0.17261123657226562, 0.1817798614501953, 0.190948486328125, 0.2001171112060547, 0.20928573608398438, 0.21845436096191406, 0.22762298583984375, 0.23679161071777344, 0.24596023559570312, 0.2551288604736328, 0.2642974853515625, 0.2734661102294922, 0.2826347351074219, 0.29180335998535156, 0.30097198486328125, 0.31014060974121094, 0.3193092346191406, 0.3284778594970703, 0.337646484375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 24.0, 281.0, 579.0, 100.0, 18.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.96441650390625, -23.530237197875977, -23.09605598449707, -22.661876678466797, -22.227697372436523, -21.79351806640625, -21.359336853027344, -20.92515754699707, -20.490978240966797, -20.056798934936523, -19.622617721557617, -19.188438415527344, -18.75425910949707, -18.320079803466797, -17.88589859008789, -17.451719284057617, -17.017539978027344, -16.58336067199707, -16.149179458618164, -15.71500015258789, -15.280820846557617, -14.846640586853027, -14.412460327148438, -13.978281021118164, -13.544099807739258, -13.109919548034668, -12.675740242004395, -12.241559982299805, -11.807380676269531, -11.373200416564941, -10.939020156860352, -10.504840850830078, -10.070660591125488, -9.636480331420898, -9.202301025390625, -8.768120765686035, -8.333941459655762, -7.899761199951172, -7.46558141708374, -7.031401634216309, -6.597222328186035, -6.1630425453186035, -5.728862762451172, -5.294682502746582, -4.860503196716309, -4.426322937011719, -3.992143154144287, -3.5579633712768555, -3.1237833499908447, -2.689603567123413, -2.2554235458374023, -1.8212437629699707, -1.387063980102539, -0.9528841972351074, -0.5187041759490967, -0.08452439308166504, 0.3496553897857666, 0.783835232257843, 1.2180150747299194, 1.6521949768066406, 2.0863747596740723, 2.520554542541504, 2.9547345638275146, 3.3889143466949463, 3.823094129562378]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 4.0, 2.0, 11.0, 14.0, 11.0, 6.0, 10.0, 17.0, 19.0, 29.0, 39.0, 40.0, 42.0, 44.0, 44.0, 47.0, 49.0, 57.0, 55.0, 41.0, 48.0, 54.0, 42.0, 45.0, 42.0, 27.0, 24.0, 27.0, 18.0, 18.0, 11.0, 16.0, 13.0, 13.0, 6.0, 8.0, 1.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.730586051940918, -2.643235683441162, -2.5558853149414062, -2.4685347080230713, -2.3811843395233154, -2.2938339710235596, -2.2064836025238037, -2.1191329956054688, -2.031782627105713, -1.944432258605957, -1.8570817708969116, -1.7697314023971558, -1.6823809146881104, -1.5950305461883545, -1.5076801776885986, -1.4203296899795532, -1.3329793214797974, -1.2456289529800415, -1.158278465270996, -1.0709280967712402, -0.9835776090621948, -0.896227240562439, -0.8088768124580383, -0.7215263843536377, -0.6341759562492371, -0.5468255281448364, -0.4594751000404358, -0.37212470173835754, -0.2847742736339569, -0.19742384552955627, -0.11007344722747803, -0.022723019123077393, 0.06462740898132324, 0.15197783708572388, 0.23932825028896332, 0.32667866349220276, 0.4140290915966034, 0.5013794898986816, 0.5887299180030823, 0.6760803461074829, 0.7634307742118835, 0.8507812023162842, 0.9381316304206848, 1.0254820585250854, 1.1128324270248413, 1.2001829147338867, 1.2875332832336426, 1.3748836517333984, 1.4622341394424438, 1.5495845079421997, 1.6369349956512451, 1.724285364151001, 1.8116358518600464, 1.8989862203598022, 1.9863367080688477, 2.0736870765686035, 2.1610374450683594, 2.2483878135681152, 2.335738182067871, 2.423088788986206, 2.510439157485962, 2.5977895259857178, 2.6851398944854736, 2.7724905014038086, 2.8598408699035645]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 3.0, 6.0, 7.0, 4.0, 11.0, 14.0, 18.0, 24.0, 25.0, 40.0, 34.0, 80.0, 97.0, 184.0, 260.0, 464.0, 884.0, 1974.0, 4756.0, 16731.0, 205319.0, 3907735.0, 42825.0, 7859.0, 2621.0, 1090.0, 560.0, 256.0, 155.0, 89.0, 50.0, 38.0, 16.0, 16.0, 4.0, 8.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.96044921875, -0.937713623046875, -0.91497802734375, -0.892242431640625, -0.8695068359375, -0.846771240234375, -0.82403564453125, -0.801300048828125, -0.778564453125, -0.755828857421875, -0.73309326171875, -0.710357666015625, -0.6876220703125, -0.664886474609375, -0.64215087890625, -0.619415283203125, -0.5966796875, -0.573944091796875, -0.55120849609375, -0.528472900390625, -0.5057373046875, -0.483001708984375, -0.46026611328125, -0.437530517578125, -0.414794921875, -0.392059326171875, -0.36932373046875, -0.346588134765625, -0.3238525390625, -0.301116943359375, -0.27838134765625, -0.255645751953125, -0.23291015625, -0.210174560546875, -0.18743896484375, -0.164703369140625, -0.1419677734375, -0.119232177734375, -0.09649658203125, -0.073760986328125, -0.051025390625, -0.028289794921875, -0.00555419921875, 0.017181396484375, 0.0399169921875, 0.062652587890625, 0.08538818359375, 0.108123779296875, 0.130859375, 0.153594970703125, 0.17633056640625, 0.199066162109375, 0.2218017578125, 0.244537353515625, 0.26727294921875, 0.290008544921875, 0.312744140625, 0.335479736328125, 0.35821533203125, 0.380950927734375, 0.4036865234375, 0.426422119140625, 0.44915771484375, 0.471893310546875, 0.49462890625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 8.0, 11.0, 22.0, 28.0, 48.0, 100.0, 125.0, 108.0, 129.0, 124.0, 110.0, 74.0, 42.0, 20.0, 15.0, 8.0, 5.0, 5.0, 6.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2425537109375, -0.2369222640991211, -0.2312908172607422, -0.22565937042236328, -0.22002792358398438, -0.21439647674560547, -0.20876502990722656, -0.20313358306884766, -0.19750213623046875, -0.19187068939208984, -0.18623924255371094, -0.18060779571533203, -0.17497634887695312, -0.16934490203857422, -0.1637134552001953, -0.1580820083618164, -0.1524505615234375, -0.1468191146850586, -0.1411876678466797, -0.13555622100830078, -0.12992477416992188, -0.12429332733154297, -0.11866188049316406, -0.11303043365478516, -0.10739898681640625, -0.10176753997802734, -0.09613609313964844, -0.09050464630126953, -0.08487319946289062, -0.07924175262451172, -0.07361030578613281, -0.0679788589477539, -0.062347412109375, -0.056715965270996094, -0.05108451843261719, -0.04545307159423828, -0.039821624755859375, -0.03419017791748047, -0.028558731079101562, -0.022927284240722656, -0.01729583740234375, -0.011664390563964844, -0.0060329437255859375, -0.00040149688720703125, 0.005229949951171875, 0.010861396789550781, 0.016492843627929688, 0.022124290466308594, 0.0277557373046875, 0.033387184143066406, 0.03901863098144531, 0.04465007781982422, 0.050281524658203125, 0.05591297149658203, 0.06154441833496094, 0.06717586517333984, 0.07280731201171875, 0.07843875885009766, 0.08407020568847656, 0.08970165252685547, 0.09533309936523438, 0.10096454620361328, 0.10659599304199219, 0.1122274398803711, 0.11785888671875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 9.0, 6.0, 22.0, 24.0, 40.0, 71.0, 137.0, 390.0, 1757.0, 13020.0, 751975.0, 3406454.0, 17304.0, 2164.0, 473.0, 185.0, 98.0, 47.0, 38.0, 25.0, 20.0, 7.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91552734375, -0.8850784301757812, -0.8546295166015625, -0.8241806030273438, -0.793731689453125, -0.7632827758789062, -0.7328338623046875, -0.7023849487304688, -0.67193603515625, -0.6414871215820312, -0.6110382080078125, -0.5805892944335938, -0.550140380859375, -0.5196914672851562, -0.4892425537109375, -0.45879364013671875, -0.4283447265625, -0.39789581298828125, -0.3674468994140625, -0.33699798583984375, -0.306549072265625, -0.27610015869140625, -0.2456512451171875, -0.21520233154296875, -0.18475341796875, -0.15430450439453125, -0.1238555908203125, -0.09340667724609375, -0.062957763671875, -0.03250885009765625, -0.0020599365234375, 0.02838897705078125, 0.058837890625, 0.08928680419921875, 0.1197357177734375, 0.15018463134765625, 0.180633544921875, 0.21108245849609375, 0.2415313720703125, 0.27198028564453125, 0.30242919921875, 0.33287811279296875, 0.3633270263671875, 0.39377593994140625, 0.424224853515625, 0.45467376708984375, 0.4851226806640625, 0.5155715942382812, 0.5460205078125, 0.5764694213867188, 0.6069183349609375, 0.6373672485351562, 0.667816162109375, 0.6982650756835938, 0.7287139892578125, 0.7591629028320312, 0.78961181640625, 0.8200607299804688, 0.8505096435546875, 0.8809585571289062, 0.911407470703125, 0.9418563842773438, 0.9723052978515625, 1.0027542114257812, 1.033203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 4.0, 16.0, 20.0, 38.0, 51.0, 154.0, 469.0, 2445.0, 576.0, 158.0, 72.0, 31.0, 15.0, 11.0, 10.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.128173828125, -0.1208648681640625, -0.113555908203125, -0.1062469482421875, -0.09893798828125, -0.0916290283203125, -0.084320068359375, -0.0770111083984375, -0.0697021484375, -0.0623931884765625, -0.055084228515625, -0.0477752685546875, -0.04046630859375, -0.0331573486328125, -0.025848388671875, -0.0185394287109375, -0.01123046875, -0.0039215087890625, 0.003387451171875, 0.0106964111328125, 0.01800537109375, 0.0253143310546875, 0.032623291015625, 0.0399322509765625, 0.0472412109375, 0.0545501708984375, 0.061859130859375, 0.0691680908203125, 0.07647705078125, 0.0837860107421875, 0.091094970703125, 0.0984039306640625, 0.105712890625, 0.1130218505859375, 0.120330810546875, 0.1276397705078125, 0.13494873046875, 0.1422576904296875, 0.149566650390625, 0.1568756103515625, 0.1641845703125, 0.1714935302734375, 0.178802490234375, 0.1861114501953125, 0.19342041015625, 0.2007293701171875, 0.208038330078125, 0.2153472900390625, 0.22265625, 0.2299652099609375, 0.237274169921875, 0.2445831298828125, 0.25189208984375, 0.2592010498046875, 0.266510009765625, 0.2738189697265625, 0.2811279296875, 0.2884368896484375, 0.295745849609375, 0.3030548095703125, 0.31036376953125, 0.3176727294921875, 0.324981689453125, 0.3322906494140625, 0.339599609375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 24.0, 89.0, 263.0, 348.0, 200.0, 60.0, 12.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.3293261528015137, -2.2799885272979736, -2.2306509017944336, -2.1813132762908936, -2.1319756507873535, -2.0826382637023926, -2.0333006381988525, -1.9839630126953125, -1.9346253871917725, -1.8852877616882324, -1.8359501361846924, -1.786612629890442, -1.7372750043869019, -1.6879373788833618, -1.6385997533798218, -1.5892622470855713, -1.5399246215820312, -1.4905869960784912, -1.4412493705749512, -1.3919118642807007, -1.3425742387771606, -1.2932366132736206, -1.2438989877700806, -1.19456148147583, -1.1452237367630005, -1.0958861112594604, -1.0465484857559204, -0.9972109198570251, -0.9478733539581299, -0.8985357284545898, -0.8491981029510498, -0.7998605370521545, -0.7505229711532593, -0.7011853456497192, -0.651847779750824, -0.6025101542472839, -0.5531725883483887, -0.5038349628448486, -0.454497367143631, -0.40515977144241333, -0.3558221757411957, -0.306484580039978, -0.2571469843387604, -0.20780937373638153, -0.15847177803516388, -0.10913418233394623, -0.05979657173156738, -0.010458976030349731, 0.03887861967086792, 0.08821621537208557, 0.13755381107330322, 0.18689142167568207, 0.23622901737689972, 0.28556662797927856, 0.3349042236804962, 0.38424181938171387, 0.4335794150829315, 0.48291701078414917, 0.5322546362876892, 0.5815922021865845, 0.6309298276901245, 0.6802673935890198, 0.7296050190925598, 0.7789425849914551, 0.8282802104949951]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 4.0, 11.0, 11.0, 10.0, 24.0, 22.0, 39.0, 29.0, 31.0, 38.0, 45.0, 56.0, 62.0, 63.0, 69.0, 56.0, 57.0, 63.0, 52.0, 50.0, 32.0, 31.0, 40.0, 28.0, 20.0, 16.0, 11.0, 7.0, 9.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44090574979782104, -0.42397254705429077, -0.4070393443107605, -0.3901061415672302, -0.37317293882369995, -0.3562397360801697, -0.3393065333366394, -0.32237333059310913, -0.30544012784957886, -0.2885069251060486, -0.2715737223625183, -0.25464051961898804, -0.23770731687545776, -0.2207741141319275, -0.20384089648723602, -0.18690769374370575, -0.16997447609901428, -0.153041273355484, -0.13610807061195374, -0.11917486041784286, -0.10224165767431259, -0.08530845493078232, -0.06837524473667145, -0.051442041993141174, -0.0345088392496109, -0.017575634643435478, -0.0006424300372600555, 0.016290776431560516, 0.03322397917509079, 0.05015718191862106, 0.06709039211273193, 0.08402359485626221, 0.10095679759979248, 0.11789000034332275, 0.13482320308685303, 0.1517564058303833, 0.16868960857391357, 0.18562281131744385, 0.20255602896213531, 0.2194892317056656, 0.23642243444919586, 0.25335565209388733, 0.2702888548374176, 0.2872220575809479, 0.30415526032447815, 0.3210884630680084, 0.3380216658115387, 0.35495486855506897, 0.37188807129859924, 0.3888212740421295, 0.4057544767856598, 0.42268767952919006, 0.43962088227272034, 0.4565540850162506, 0.47348731756210327, 0.49042052030563354, 0.5073537230491638, 0.5242869257926941, 0.5412201285362244, 0.5581533312797546, 0.5750865340232849, 0.5920197367668152, 0.6089529395103455, 0.6258861422538757, 0.642819344997406]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 9.0, 5.0, 7.0, 11.0, 19.0, 25.0, 23.0, 43.0, 72.0, 102.0, 151.0, 227.0, 377.0, 670.0, 1513.0, 3905.0, 17382.0, 219267.0, 729979.0, 61697.0, 8224.0, 2400.0, 1037.0, 533.0, 300.0, 181.0, 113.0, 71.0, 55.0, 40.0, 26.0, 28.0, 19.0, 10.0, 12.0, 8.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87451171875, -0.8497238159179688, -0.8249359130859375, -0.8001480102539062, -0.775360107421875, -0.7505722045898438, -0.7257843017578125, -0.7009963989257812, -0.67620849609375, -0.6514205932617188, -0.6266326904296875, -0.6018447875976562, -0.577056884765625, -0.5522689819335938, -0.5274810791015625, -0.5026931762695312, -0.4779052734375, -0.45311737060546875, -0.4283294677734375, -0.40354156494140625, -0.378753662109375, -0.35396575927734375, -0.3291778564453125, -0.30438995361328125, -0.27960205078125, -0.25481414794921875, -0.2300262451171875, -0.20523834228515625, -0.180450439453125, -0.15566253662109375, -0.1308746337890625, -0.10608673095703125, -0.081298828125, -0.05651092529296875, -0.0317230224609375, -0.00693511962890625, 0.017852783203125, 0.04264068603515625, 0.0674285888671875, 0.09221649169921875, 0.11700439453125, 0.14179229736328125, 0.1665802001953125, 0.19136810302734375, 0.216156005859375, 0.24094390869140625, 0.2657318115234375, 0.29051971435546875, 0.3153076171875, 0.34009552001953125, 0.3648834228515625, 0.38967132568359375, 0.414459228515625, 0.43924713134765625, 0.4640350341796875, 0.48882293701171875, 0.51361083984375, 0.5383987426757812, 0.5631866455078125, 0.5879745483398438, 0.612762451171875, 0.6375503540039062, 0.6623382568359375, 0.6871261596679688, 0.7119140625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 6.0, 8.0, 18.0, 26.0, 46.0, 68.0, 114.0, 127.0, 124.0, 123.0, 120.0, 88.0, 58.0, 18.0, 17.0, 14.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2413330078125, -0.23565196990966797, -0.22997093200683594, -0.2242898941040039, -0.21860885620117188, -0.21292781829833984, -0.2072467803955078, -0.20156574249267578, -0.19588470458984375, -0.19020366668701172, -0.1845226287841797, -0.17884159088134766, -0.17316055297851562, -0.1674795150756836, -0.16179847717285156, -0.15611743927001953, -0.1504364013671875, -0.14475536346435547, -0.13907432556152344, -0.1333932876586914, -0.12771224975585938, -0.12203121185302734, -0.11635017395019531, -0.11066913604736328, -0.10498809814453125, -0.09930706024169922, -0.09362602233886719, -0.08794498443603516, -0.08226394653320312, -0.0765829086303711, -0.07090187072753906, -0.06522083282470703, -0.059539794921875, -0.05385875701904297, -0.04817771911621094, -0.042496681213378906, -0.036815643310546875, -0.031134605407714844, -0.025453567504882812, -0.01977252960205078, -0.01409149169921875, -0.008410453796386719, -0.0027294158935546875, 0.0029516220092773438, 0.008632659912109375, 0.014313697814941406, 0.019994735717773438, 0.02567577362060547, 0.0313568115234375, 0.03703784942626953, 0.04271888732910156, 0.048399925231933594, 0.054080963134765625, 0.059762001037597656, 0.06544303894042969, 0.07112407684326172, 0.07680511474609375, 0.08248615264892578, 0.08816719055175781, 0.09384822845458984, 0.09952926635742188, 0.1052103042602539, 0.11089134216308594, 0.11657238006591797, 0.12225341796875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 6.0, 6.0, 9.0, 11.0, 22.0, 18.0, 19.0, 35.0, 61.0, 77.0, 132.0, 169.0, 263.0, 408.0, 596.0, 1118.0, 2002.0, 3953.0, 8618.0, 22254.0, 64646.0, 199504.0, 397657.0, 227784.0, 74585.0, 25128.0, 9924.0, 4286.0, 2150.0, 1107.0, 678.0, 459.0, 283.0, 184.0, 132.0, 96.0, 42.0, 38.0, 28.0, 13.0, 10.0, 16.0, 8.0, 6.0, 1.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.317138671875, -0.30709075927734375, -0.2970428466796875, -0.28699493408203125, -0.276947021484375, -0.26689910888671875, -0.2568511962890625, -0.24680328369140625, -0.23675537109375, -0.22670745849609375, -0.2166595458984375, -0.20661163330078125, -0.196563720703125, -0.18651580810546875, -0.1764678955078125, -0.16641998291015625, -0.1563720703125, -0.14632415771484375, -0.1362762451171875, -0.12622833251953125, -0.116180419921875, -0.10613250732421875, -0.0960845947265625, -0.08603668212890625, -0.07598876953125, -0.06594085693359375, -0.0558929443359375, -0.04584503173828125, -0.035797119140625, -0.02574920654296875, -0.0157012939453125, -0.00565338134765625, 0.00439453125, 0.01444244384765625, 0.0244903564453125, 0.03453826904296875, 0.044586181640625, 0.05463409423828125, 0.0646820068359375, 0.07472991943359375, 0.08477783203125, 0.09482574462890625, 0.1048736572265625, 0.11492156982421875, 0.124969482421875, 0.13501739501953125, 0.1450653076171875, 0.15511322021484375, 0.1651611328125, 0.17520904541015625, 0.1852569580078125, 0.19530487060546875, 0.205352783203125, 0.21540069580078125, 0.2254486083984375, 0.23549652099609375, 0.24554443359375, 0.25559234619140625, 0.2656402587890625, 0.27568817138671875, 0.285736083984375, 0.29578399658203125, 0.3058319091796875, 0.31587982177734375, 0.325927734375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 8.0, 8.0, 13.0, 16.0, 25.0, 12.0, 16.0, 31.0, 35.0, 42.0, 39.0, 33.0, 50.0, 41.0, 44.0, 40.0, 53.0, 50.0, 49.0, 45.0, 36.0, 36.0, 31.0, 35.0, 28.0, 26.0, 25.0, 28.0, 15.0, 14.0, 10.0, 15.0, 7.0, 9.0, 5.0, 6.0, 5.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.421142578125, -0.40863037109375, -0.3961181640625, -0.38360595703125, -0.37109375, -0.35858154296875, -0.3460693359375, -0.33355712890625, -0.321044921875, -0.30853271484375, -0.2960205078125, -0.28350830078125, -0.27099609375, -0.25848388671875, -0.2459716796875, -0.23345947265625, -0.220947265625, -0.20843505859375, -0.1959228515625, -0.18341064453125, -0.1708984375, -0.15838623046875, -0.1458740234375, -0.13336181640625, -0.120849609375, -0.10833740234375, -0.0958251953125, -0.08331298828125, -0.07080078125, -0.05828857421875, -0.0457763671875, -0.03326416015625, -0.020751953125, -0.00823974609375, 0.0042724609375, 0.01678466796875, 0.029296875, 0.04180908203125, 0.0543212890625, 0.06683349609375, 0.079345703125, 0.09185791015625, 0.1043701171875, 0.11688232421875, 0.12939453125, 0.14190673828125, 0.1544189453125, 0.16693115234375, 0.179443359375, 0.19195556640625, 0.2044677734375, 0.21697998046875, 0.2294921875, 0.24200439453125, 0.2545166015625, 0.26702880859375, 0.279541015625, 0.29205322265625, 0.3045654296875, 0.31707763671875, 0.32958984375, 0.34210205078125, 0.3546142578125, 0.36712646484375, 0.379638671875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 0.0, 3.0, 10.0, 11.0, 12.0, 20.0, 36.0, 61.0, 100.0, 244.0, 532.0, 1320.0, 4833.0, 31489.0, 579885.0, 400982.0, 23018.0, 3939.0, 1132.0, 436.0, 237.0, 106.0, 56.0, 32.0, 19.0, 12.0, 8.0, 8.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.334716796875, -0.32513427734375, -0.3155517578125, -0.30596923828125, -0.29638671875, -0.28680419921875, -0.2772216796875, -0.26763916015625, -0.258056640625, -0.24847412109375, -0.2388916015625, -0.22930908203125, -0.2197265625, -0.21014404296875, -0.2005615234375, -0.19097900390625, -0.181396484375, -0.17181396484375, -0.1622314453125, -0.15264892578125, -0.14306640625, -0.13348388671875, -0.1239013671875, -0.11431884765625, -0.104736328125, -0.09515380859375, -0.0855712890625, -0.07598876953125, -0.06640625, -0.05682373046875, -0.0472412109375, -0.03765869140625, -0.028076171875, -0.01849365234375, -0.0089111328125, 0.00067138671875, 0.01025390625, 0.01983642578125, 0.0294189453125, 0.03900146484375, 0.048583984375, 0.05816650390625, 0.0677490234375, 0.07733154296875, 0.0869140625, 0.09649658203125, 0.1060791015625, 0.11566162109375, 0.125244140625, 0.13482666015625, 0.1444091796875, 0.15399169921875, 0.16357421875, 0.17315673828125, 0.1827392578125, 0.19232177734375, 0.201904296875, 0.21148681640625, 0.2210693359375, 0.23065185546875, 0.240234375, 0.24981689453125, 0.2593994140625, 0.26898193359375, 0.278564453125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 2.0, 7.0, 3.0, 8.0, 10.0, 15.0, 16.0, 14.0, 24.0, 19.0, 30.0, 45.0, 47.0, 62.0, 97.0, 120.0, 118.0, 73.0, 42.0, 40.0, 43.0, 21.0, 24.0, 20.0, 17.0, 15.0, 15.0, 8.0, 7.0, 10.0, 5.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012409687042236328, -0.000120529904961586, -0.00011696293950080872, -0.00011339597404003143, -0.00010982900857925415, -0.00010626204311847687, -0.00010269507765769958, -9.91281121969223e-05, -9.556114673614502e-05, -9.199418127536774e-05, -8.842721581459045e-05, -8.486025035381317e-05, -8.129328489303589e-05, -7.77263194322586e-05, -7.415935397148132e-05, -7.059238851070404e-05, -6.702542304992676e-05, -6.345845758914948e-05, -5.989149212837219e-05, -5.632452666759491e-05, -5.275756120681763e-05, -4.9190595746040344e-05, -4.562363028526306e-05, -4.205666482448578e-05, -3.8489699363708496e-05, -3.492273390293121e-05, -3.135576844215393e-05, -2.7788802981376648e-05, -2.4221837520599365e-05, -2.0654872059822083e-05, -1.70879065990448e-05, -1.3520941138267517e-05, -9.953975677490234e-06, -6.387010216712952e-06, -2.820044755935669e-06, 7.469207048416138e-07, 4.3138861656188965e-06, 7.88085162639618e-06, 1.1447817087173462e-05, 1.5014782547950745e-05, 1.8581748008728027e-05, 2.214871346950531e-05, 2.5715678930282593e-05, 2.9282644391059875e-05, 3.284960985183716e-05, 3.641657531261444e-05, 3.9983540773391724e-05, 4.3550506234169006e-05, 4.711747169494629e-05, 5.068443715572357e-05, 5.4251402616500854e-05, 5.781836807727814e-05, 6.138533353805542e-05, 6.49522989988327e-05, 6.851926445960999e-05, 7.208622992038727e-05, 7.565319538116455e-05, 7.922016084194183e-05, 8.278712630271912e-05, 8.63540917634964e-05, 8.992105722427368e-05, 9.348802268505096e-05, 9.705498814582825e-05, 0.00010062195360660553, 0.00010418891906738281]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 9.0, 19.0, 25.0, 36.0, 69.0, 106.0, 165.0, 278.0, 574.0, 1283.0, 4078.0, 20505.0, 217597.0, 715182.0, 74385.0, 9840.0, 2435.0, 963.0, 425.0, 254.0, 139.0, 65.0, 40.0, 24.0, 19.0, 7.0, 7.0, 8.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.32666015625, -0.3168487548828125, -0.307037353515625, -0.2972259521484375, -0.28741455078125, -0.2776031494140625, -0.267791748046875, -0.2579803466796875, -0.2481689453125, -0.2383575439453125, -0.228546142578125, -0.2187347412109375, -0.20892333984375, -0.1991119384765625, -0.189300537109375, -0.1794891357421875, -0.169677734375, -0.1598663330078125, -0.150054931640625, -0.1402435302734375, -0.13043212890625, -0.1206207275390625, -0.110809326171875, -0.1009979248046875, -0.0911865234375, -0.0813751220703125, -0.071563720703125, -0.0617523193359375, -0.05194091796875, -0.0421295166015625, -0.032318115234375, -0.0225067138671875, -0.0126953125, -0.0028839111328125, 0.006927490234375, 0.0167388916015625, 0.02655029296875, 0.0363616943359375, 0.046173095703125, 0.0559844970703125, 0.0657958984375, 0.0756072998046875, 0.085418701171875, 0.0952301025390625, 0.10504150390625, 0.1148529052734375, 0.124664306640625, 0.1344757080078125, 0.144287109375, 0.1540985107421875, 0.163909912109375, 0.1737213134765625, 0.18353271484375, 0.1933441162109375, 0.203155517578125, 0.2129669189453125, 0.2227783203125, 0.2325897216796875, 0.242401123046875, 0.2522125244140625, 0.26202392578125, 0.2718353271484375, 0.281646728515625, 0.2914581298828125, 0.30126953125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 11.0, 8.0, 13.0, 15.0, 28.0, 51.0, 62.0, 80.0, 101.0, 120.0, 131.0, 85.0, 86.0, 57.0, 51.0, 29.0, 26.0, 10.0, 11.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27294921875, -0.2631950378417969, -0.25344085693359375, -0.24368667602539062, -0.2339324951171875, -0.22417831420898438, -0.21442413330078125, -0.20466995239257812, -0.194915771484375, -0.18516159057617188, -0.17540740966796875, -0.16565322875976562, -0.1558990478515625, -0.14614486694335938, -0.13639068603515625, -0.12663650512695312, -0.11688232421875, -0.10712814331054688, -0.09737396240234375, -0.08761978149414062, -0.0778656005859375, -0.06811141967773438, -0.05835723876953125, -0.048603057861328125, -0.038848876953125, -0.029094696044921875, -0.01934051513671875, -0.009586334228515625, 0.0001678466796875, 0.009922027587890625, 0.01967620849609375, 0.029430389404296875, 0.0391845703125, 0.048938751220703125, 0.05869293212890625, 0.06844711303710938, 0.0782012939453125, 0.08795547485351562, 0.09770965576171875, 0.10746383666992188, 0.117218017578125, 0.12697219848632812, 0.13672637939453125, 0.14648056030273438, 0.1562347412109375, 0.16598892211914062, 0.17574310302734375, 0.18549728393554688, 0.19525146484375, 0.20500564575195312, 0.21475982666015625, 0.22451400756835938, 0.2342681884765625, 0.24402236938476562, 0.25377655029296875, 0.2635307312011719, 0.273284912109375, 0.2830390930175781, 0.29279327392578125, 0.3025474548339844, 0.3123016357421875, 0.3220558166503906, 0.33180999755859375, 0.3415641784667969, 0.351318359375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 8.0, 13.0, 86.0, 264.0, 383.0, 162.0, 55.0, 22.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.584945678710938, -10.360420227050781, -10.135893821716309, -9.911368370056152, -9.68684196472168, -9.462316513061523, -9.23779010772705, -9.013264656066895, -8.788738250732422, -8.564212799072266, -8.339686393737793, -8.115160942077637, -7.890634536743164, -7.666109085083008, -7.441583156585693, -7.217057228088379, -6.992531776428223, -6.768005847930908, -6.543479919433594, -6.318953990936279, -6.094428062438965, -5.869902610778809, -5.645376682281494, -5.42085075378418, -5.196324825286865, -4.971798896789551, -4.747272968292236, -4.522747039794922, -4.298221588134766, -4.073695182800293, -3.8491697311401367, -3.6246438026428223, -3.400117874145508, -3.1755919456481934, -2.951066017150879, -2.7265403270721436, -2.502014398574829, -2.2774884700775146, -2.0529627799987793, -1.8284368515014648, -1.6039109230041504, -1.379384994506836, -1.154859185218811, -0.9303333163261414, -0.7058074474334717, -0.4812815189361572, -0.2567557096481323, -0.03222990036010742, 0.19229602813720703, 0.4168218970298767, 0.6413477659225464, 0.8658736348152161, 1.0903995037078857, 1.3149254322052002, 1.539451241493225, 1.76397705078125, 1.9885029792785645, 2.213028907775879, 2.4375548362731934, 2.6620805263519287, 2.886606454849243, 3.1111323833465576, 3.335658073425293, 3.5601840019226074, 3.784709930419922]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 12.0, 12.0, 17.0, 19.0, 31.0, 34.0, 27.0, 46.0, 42.0, 60.0, 58.0, 47.0, 61.0, 65.0, 56.0, 52.0, 65.0, 53.0, 58.0, 45.0, 35.0, 19.0, 18.0, 20.0, 15.0, 12.0, 6.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.5222702026367188, -3.4272208213806152, -3.3321714401245117, -3.237122058868408, -3.1420726776123047, -3.0470235347747803, -2.9519741535186768, -2.8569247722625732, -2.7618753910064697, -2.666826009750366, -2.5717766284942627, -2.476727247238159, -2.3816781044006348, -2.2866287231445312, -2.1915793418884277, -2.096529960632324, -2.0014805793762207, -1.9064311981201172, -1.8113818168640137, -1.7163325548171997, -1.6212831735610962, -1.5262337923049927, -1.4311845302581787, -1.3361351490020752, -1.2410857677459717, -1.1460363864898682, -1.0509870052337646, -0.9559377431869507, -0.8608883619308472, -0.7658389806747437, -0.6707896590232849, -0.5757403373718262, -0.48069095611572266, -0.38564160466194153, -0.2905922532081604, -0.19554290175437927, -0.10049355030059814, -0.005444198846817017, 0.08960515260696411, 0.18465447425842285, 0.27970385551452637, 0.3747532069683075, 0.4698025584220886, 0.5648518800735474, 0.6599012613296509, 0.7549506425857544, 0.8499999642372131, 0.9450492858886719, 1.0400986671447754, 1.135148048400879, 1.2301974296569824, 1.3252466917037964, 1.4202960729599, 1.5153454542160034, 1.6103947162628174, 1.705444097518921, 1.8004934787750244, 1.895542860031128, 1.9905922412872314, 2.085641622543335, 2.1806907653808594, 2.275740146636963, 2.3707895278930664, 2.46583890914917, 2.5608882904052734]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 8.0, 11.0, 6.0, 4.0, 11.0, 18.0, 24.0, 37.0, 47.0, 71.0, 122.0, 172.0, 326.0, 545.0, 1210.0, 3305.0, 11330.0, 142948.0, 3973086.0, 50599.0, 6845.0, 2049.0, 775.0, 350.0, 142.0, 79.0, 50.0, 31.0, 25.0, 15.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.939453125, -0.9155731201171875, -0.891693115234375, -0.8678131103515625, -0.84393310546875, -0.8200531005859375, -0.796173095703125, -0.7722930908203125, -0.7484130859375, -0.7245330810546875, -0.700653076171875, -0.6767730712890625, -0.65289306640625, -0.6290130615234375, -0.605133056640625, -0.5812530517578125, -0.557373046875, -0.5334930419921875, -0.509613037109375, -0.4857330322265625, -0.46185302734375, -0.4379730224609375, -0.414093017578125, -0.3902130126953125, -0.3663330078125, -0.3424530029296875, -0.318572998046875, -0.2946929931640625, -0.27081298828125, -0.2469329833984375, -0.223052978515625, -0.1991729736328125, -0.17529296875, -0.1514129638671875, -0.127532958984375, -0.1036529541015625, -0.07977294921875, -0.0558929443359375, -0.032012939453125, -0.0081329345703125, 0.0157470703125, 0.0396270751953125, 0.063507080078125, 0.0873870849609375, 0.11126708984375, 0.1351470947265625, 0.159027099609375, 0.1829071044921875, 0.206787109375, 0.2306671142578125, 0.254547119140625, 0.2784271240234375, 0.30230712890625, 0.3261871337890625, 0.350067138671875, 0.3739471435546875, 0.3978271484375, 0.4217071533203125, 0.445587158203125, 0.4694671630859375, 0.49334716796875, 0.5172271728515625, 0.541107177734375, 0.5649871826171875, 0.5888671875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 6.0, 22.0, 32.0, 43.0, 68.0, 118.0, 133.0, 126.0, 127.0, 116.0, 85.0, 45.0, 21.0, 23.0, 10.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2408447265625, -0.23472976684570312, -0.22861480712890625, -0.22249984741210938, -0.2163848876953125, -0.21026992797851562, -0.20415496826171875, -0.19804000854492188, -0.191925048828125, -0.18581008911132812, -0.17969512939453125, -0.17358016967773438, -0.1674652099609375, -0.16135025024414062, -0.15523529052734375, -0.14912033081054688, -0.14300537109375, -0.13689041137695312, -0.13077545166015625, -0.12466049194335938, -0.1185455322265625, -0.11243057250976562, -0.10631561279296875, -0.10020065307617188, -0.094085693359375, -0.08797073364257812, -0.08185577392578125, -0.07574081420898438, -0.0696258544921875, -0.06351089477539062, -0.05739593505859375, -0.051280975341796875, -0.045166015625, -0.039051055908203125, -0.03293609619140625, -0.026821136474609375, -0.0207061767578125, -0.014591217041015625, -0.00847625732421875, -0.002361297607421875, 0.003753662109375, 0.009868621826171875, 0.01598358154296875, 0.022098541259765625, 0.0282135009765625, 0.034328460693359375, 0.04044342041015625, 0.046558380126953125, 0.05267333984375, 0.058788299560546875, 0.06490325927734375, 0.07101821899414062, 0.0771331787109375, 0.08324813842773438, 0.08936309814453125, 0.09547805786132812, 0.101593017578125, 0.10770797729492188, 0.11382293701171875, 0.11993789672851562, 0.1260528564453125, 0.13216781616210938, 0.13828277587890625, 0.14439773559570312, 0.1505126953125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 6.0, 15.0, 13.0, 27.0, 71.0, 124.0, 287.0, 744.0, 2497.0, 12892.0, 226868.0, 3901271.0, 42611.0, 4935.0, 1187.0, 418.0, 161.0, 61.0, 45.0, 16.0, 12.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67138671875, -0.6467742919921875, -0.622161865234375, -0.5975494384765625, -0.57293701171875, -0.5483245849609375, -0.523712158203125, -0.4990997314453125, -0.4744873046875, -0.4498748779296875, -0.425262451171875, -0.4006500244140625, -0.37603759765625, -0.3514251708984375, -0.326812744140625, -0.3022003173828125, -0.277587890625, -0.2529754638671875, -0.228363037109375, -0.2037506103515625, -0.17913818359375, -0.1545257568359375, -0.129913330078125, -0.1053009033203125, -0.0806884765625, -0.0560760498046875, -0.031463623046875, -0.0068511962890625, 0.01776123046875, 0.0423736572265625, 0.066986083984375, 0.0915985107421875, 0.1162109375, 0.1408233642578125, 0.165435791015625, 0.1900482177734375, 0.21466064453125, 0.2392730712890625, 0.263885498046875, 0.2884979248046875, 0.3131103515625, 0.3377227783203125, 0.362335205078125, 0.3869476318359375, 0.41156005859375, 0.4361724853515625, 0.460784912109375, 0.4853973388671875, 0.510009765625, 0.5346221923828125, 0.559234619140625, 0.5838470458984375, 0.60845947265625, 0.6330718994140625, 0.657684326171875, 0.6822967529296875, 0.7069091796875, 0.7315216064453125, 0.756134033203125, 0.7807464599609375, 0.80535888671875, 0.8299713134765625, 0.854583740234375, 0.8791961669921875, 0.90380859375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 11.0, 10.0, 16.0, 19.0, 28.0, 39.0, 61.0, 127.0, 229.0, 693.0, 1766.0, 617.0, 224.0, 90.0, 49.0, 35.0, 18.0, 12.0, 8.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.265380859375, -0.2584800720214844, -0.25157928466796875, -0.24467849731445312, -0.2377777099609375, -0.23087692260742188, -0.22397613525390625, -0.21707534790039062, -0.210174560546875, -0.20327377319335938, -0.19637298583984375, -0.18947219848632812, -0.1825714111328125, -0.17567062377929688, -0.16876983642578125, -0.16186904907226562, -0.15496826171875, -0.14806747436523438, -0.14116668701171875, -0.13426589965820312, -0.1273651123046875, -0.12046432495117188, -0.11356353759765625, -0.10666275024414062, -0.099761962890625, -0.09286117553710938, -0.08596038818359375, -0.07905960083007812, -0.0721588134765625, -0.06525802612304688, -0.05835723876953125, -0.051456451416015625, -0.0445556640625, -0.037654876708984375, -0.03075408935546875, -0.023853302001953125, -0.0169525146484375, -0.010051727294921875, -0.00315093994140625, 0.003749847412109375, 0.010650634765625, 0.017551422119140625, 0.02445220947265625, 0.031352996826171875, 0.0382537841796875, 0.045154571533203125, 0.05205535888671875, 0.058956146240234375, 0.06585693359375, 0.07275772094726562, 0.07965850830078125, 0.08655929565429688, 0.0934600830078125, 0.10036087036132812, 0.10726165771484375, 0.11416244506835938, 0.121063232421875, 0.12796401977539062, 0.13486480712890625, 0.14176559448242188, 0.1486663818359375, 0.15556716918945312, 0.16246795654296875, 0.16936874389648438, 0.17626953125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 13.0, 44.0, 163.0, 405.0, 275.0, 75.0, 22.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.51230525970459, -2.433605909347534, -2.3549063205718994, -2.2762069702148438, -2.197507619857788, -2.1188080310821533, -2.0401086807250977, -1.9614092111587524, -1.8827097415924072, -1.804010272026062, -1.7253109216690063, -1.6466114521026611, -1.567911982536316, -1.4892125129699707, -1.410513162612915, -1.3318136930465698, -1.2531143426895142, -1.174414873123169, -1.0957155227661133, -1.017016053199768, -0.9383165836334229, -0.8596171736717224, -0.780917763710022, -0.7022182941436768, -0.6235188841819763, -0.5448194742202759, -0.46612000465393066, -0.3874205946922302, -0.3087211549282074, -0.23002171516418457, -0.15132230520248413, -0.07262283563613892, 0.0060765743255615234, 0.08477600663900375, 0.16347543895244598, 0.24217486381530762, 0.32087430357933044, 0.39957374334335327, 0.4782731533050537, 0.5569726228713989, 0.6356720328330994, 0.7143714427947998, 0.793070912361145, 0.8717703223228455, 0.9504697322845459, 1.0291692018508911, 1.1078686714172363, 1.186568021774292, 1.2652674913406372, 1.3439669609069824, 1.422666311264038, 1.5013657808303833, 1.5800652503967285, 1.6587646007537842, 1.7374640703201294, 1.8161635398864746, 1.8948628902435303, 1.9735623598098755, 2.0522618293762207, 2.1309611797332764, 2.209660530090332, 2.288360118865967, 2.3670594692230225, 2.445758819580078, 2.524458408355713]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 11.0, 9.0, 20.0, 20.0, 22.0, 29.0, 28.0, 42.0, 47.0, 56.0, 70.0, 62.0, 62.0, 63.0, 46.0, 54.0, 49.0, 51.0, 50.0, 35.0, 33.0, 31.0, 35.0, 18.0, 10.0, 12.0, 9.0, 8.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5914614200592041, -0.5689360499382019, -0.5464107394218445, -0.5238853693008423, -0.5013599991798401, -0.4788346588611603, -0.45630931854248047, -0.43378394842147827, -0.41125860810279846, -0.38873326778411865, -0.36620789766311646, -0.34368255734443665, -0.32115721702575684, -0.29863184690475464, -0.27610650658607483, -0.253581166267395, -0.23105579614639282, -0.20853044092655182, -0.18600508570671082, -0.163479745388031, -0.14095439016819, -0.118429034948349, -0.09590369462966919, -0.07337833940982819, -0.05085298418998718, -0.028327632695436478, -0.005802281200885773, 0.016723066568374634, 0.03924842178821564, 0.06177377700805664, 0.08429911732673645, 0.10682447254657745, 0.12934982776641846, 0.15187518298625946, 0.17440053820610046, 0.19692587852478027, 0.21945123374462128, 0.24197658896446228, 0.2645019292831421, 0.2870272994041443, 0.3095526397228241, 0.3320779800415039, 0.3546033501625061, 0.3771286904811859, 0.3996540307998657, 0.4221794009208679, 0.44470474123954773, 0.46723008155822754, 0.48975545167922974, 0.5122808218002319, 0.5348061323165894, 0.5573315024375916, 0.5798568725585938, 0.6023821830749512, 0.6249075531959534, 0.6474329233169556, 0.669958233833313, 0.6924836039543152, 0.7150089144706726, 0.7375342845916748, 0.760059654712677, 0.7825850248336792, 0.8051103353500366, 0.8276357054710388, 0.850161075592041]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 8.0, 12.0, 10.0, 15.0, 24.0, 38.0, 43.0, 40.0, 73.0, 106.0, 185.0, 302.0, 452.0, 839.0, 1713.0, 4104.0, 15073.0, 124643.0, 745718.0, 131474.0, 15563.0, 4175.0, 1656.0, 882.0, 518.0, 272.0, 180.0, 123.0, 80.0, 55.0, 46.0, 26.0, 31.0, 17.0, 15.0, 9.0, 11.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.79052734375, -0.766937255859375, -0.74334716796875, -0.719757080078125, -0.6961669921875, -0.672576904296875, -0.64898681640625, -0.625396728515625, -0.601806640625, -0.578216552734375, -0.55462646484375, -0.531036376953125, -0.5074462890625, -0.483856201171875, -0.46026611328125, -0.436676025390625, -0.4130859375, -0.389495849609375, -0.36590576171875, -0.342315673828125, -0.3187255859375, -0.295135498046875, -0.27154541015625, -0.247955322265625, -0.224365234375, -0.200775146484375, -0.17718505859375, -0.153594970703125, -0.1300048828125, -0.106414794921875, -0.08282470703125, -0.059234619140625, -0.03564453125, -0.012054443359375, 0.01153564453125, 0.035125732421875, 0.0587158203125, 0.082305908203125, 0.10589599609375, 0.129486083984375, 0.153076171875, 0.176666259765625, 0.20025634765625, 0.223846435546875, 0.2474365234375, 0.271026611328125, 0.29461669921875, 0.318206787109375, 0.341796875, 0.365386962890625, 0.38897705078125, 0.412567138671875, 0.4361572265625, 0.459747314453125, 0.48333740234375, 0.506927490234375, 0.530517578125, 0.554107666015625, 0.57769775390625, 0.601287841796875, 0.6248779296875, 0.648468017578125, 0.67205810546875, 0.695648193359375, 0.71923828125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 15.0, 26.0, 35.0, 67.0, 95.0, 125.0, 134.0, 113.0, 119.0, 94.0, 79.0, 29.0, 19.0, 14.0, 10.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2215576171875, -0.2157001495361328, -0.20984268188476562, -0.20398521423339844, -0.19812774658203125, -0.19227027893066406, -0.18641281127929688, -0.1805553436279297, -0.1746978759765625, -0.1688404083251953, -0.16298294067382812, -0.15712547302246094, -0.15126800537109375, -0.14541053771972656, -0.13955307006835938, -0.1336956024169922, -0.127838134765625, -0.12198066711425781, -0.11612319946289062, -0.11026573181152344, -0.10440826416015625, -0.09855079650878906, -0.09269332885742188, -0.08683586120605469, -0.0809783935546875, -0.07512092590332031, -0.06926345825195312, -0.06340599060058594, -0.05754852294921875, -0.05169105529785156, -0.045833587646484375, -0.03997611999511719, -0.03411865234375, -0.028261184692382812, -0.022403717041015625, -0.016546249389648438, -0.01068878173828125, -0.0048313140869140625, 0.001026153564453125, 0.0068836212158203125, 0.0127410888671875, 0.018598556518554688, 0.024456024169921875, 0.030313491821289062, 0.03617095947265625, 0.04202842712402344, 0.047885894775390625, 0.05374336242675781, 0.059600830078125, 0.06545829772949219, 0.07131576538085938, 0.07717323303222656, 0.08303070068359375, 0.08888816833496094, 0.09474563598632812, 0.10060310363769531, 0.1064605712890625, 0.11231803894042969, 0.11817550659179688, 0.12403297424316406, 0.12989044189453125, 0.13574790954589844, 0.14160537719726562, 0.1474628448486328, 0.1533203125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 6.0, 7.0, 14.0, 14.0, 22.0, 28.0, 34.0, 48.0, 67.0, 110.0, 219.0, 265.0, 507.0, 927.0, 1904.0, 4249.0, 11113.0, 34791.0, 127296.0, 450105.0, 302259.0, 77641.0, 22781.0, 7800.0, 3119.0, 1398.0, 745.0, 379.0, 241.0, 156.0, 92.0, 65.0, 37.0, 22.0, 25.0, 23.0, 12.0, 11.0, 6.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.442138671875, -0.4290618896484375, -0.415985107421875, -0.4029083251953125, -0.38983154296875, -0.3767547607421875, -0.363677978515625, -0.3506011962890625, -0.3375244140625, -0.3244476318359375, -0.311370849609375, -0.2982940673828125, -0.28521728515625, -0.2721405029296875, -0.259063720703125, -0.2459869384765625, -0.23291015625, -0.2198333740234375, -0.206756591796875, -0.1936798095703125, -0.18060302734375, -0.1675262451171875, -0.154449462890625, -0.1413726806640625, -0.1282958984375, -0.1152191162109375, -0.102142333984375, -0.0890655517578125, -0.07598876953125, -0.0629119873046875, -0.049835205078125, -0.0367584228515625, -0.023681640625, -0.0106048583984375, 0.002471923828125, 0.0155487060546875, 0.02862548828125, 0.0417022705078125, 0.054779052734375, 0.0678558349609375, 0.0809326171875, 0.0940093994140625, 0.107086181640625, 0.1201629638671875, 0.13323974609375, 0.1463165283203125, 0.159393310546875, 0.1724700927734375, 0.185546875, 0.1986236572265625, 0.211700439453125, 0.2247772216796875, 0.23785400390625, 0.2509307861328125, 0.264007568359375, 0.2770843505859375, 0.2901611328125, 0.3032379150390625, 0.316314697265625, 0.3293914794921875, 0.34246826171875, 0.3555450439453125, 0.368621826171875, 0.3816986083984375, 0.394775390625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 5.0, 4.0, 7.0, 7.0, 9.0, 15.0, 13.0, 17.0, 16.0, 17.0, 32.0, 27.0, 37.0, 33.0, 42.0, 50.0, 43.0, 45.0, 50.0, 36.0, 49.0, 48.0, 42.0, 38.0, 50.0, 34.0, 32.0, 33.0, 22.0, 24.0, 19.0, 23.0, 16.0, 22.0, 10.0, 8.0, 11.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.434814453125, -0.4220771789550781, -0.40933990478515625, -0.3966026306152344, -0.3838653564453125, -0.3711280822753906, -0.35839080810546875, -0.3456535339355469, -0.332916259765625, -0.3201789855957031, -0.30744171142578125, -0.2947044372558594, -0.2819671630859375, -0.2692298889160156, -0.25649261474609375, -0.24375534057617188, -0.23101806640625, -0.21828079223632812, -0.20554351806640625, -0.19280624389648438, -0.1800689697265625, -0.16733169555664062, -0.15459442138671875, -0.14185714721679688, -0.129119873046875, -0.11638259887695312, -0.10364532470703125, -0.09090805053710938, -0.0781707763671875, -0.06543350219726562, -0.05269622802734375, -0.039958953857421875, -0.0272216796875, -0.014484405517578125, -0.00174713134765625, 0.010990142822265625, 0.0237274169921875, 0.036464691162109375, 0.04920196533203125, 0.061939239501953125, 0.074676513671875, 0.08741378784179688, 0.10015106201171875, 0.11288833618164062, 0.1256256103515625, 0.13836288452148438, 0.15110015869140625, 0.16383743286132812, 0.17657470703125, 0.18931198120117188, 0.20204925537109375, 0.21478652954101562, 0.2275238037109375, 0.24026107788085938, 0.25299835205078125, 0.2657356262207031, 0.278472900390625, 0.2912101745605469, 0.30394744873046875, 0.3166847229003906, 0.3294219970703125, 0.3421592712402344, 0.35489654541015625, 0.3676338195800781, 0.38037109375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 4.0, 14.0, 15.0, 25.0, 47.0, 96.0, 194.0, 502.0, 1401.0, 4795.0, 26651.0, 859439.0, 141161.0, 10187.0, 2578.0, 824.0, 326.0, 137.0, 67.0, 25.0, 15.0, 11.0, 10.0, 5.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4990234375, -0.4822540283203125, -0.465484619140625, -0.4487152099609375, -0.43194580078125, -0.4151763916015625, -0.398406982421875, -0.3816375732421875, -0.3648681640625, -0.3480987548828125, -0.331329345703125, -0.3145599365234375, -0.29779052734375, -0.2810211181640625, -0.264251708984375, -0.2474822998046875, -0.230712890625, -0.2139434814453125, -0.197174072265625, -0.1804046630859375, -0.16363525390625, -0.1468658447265625, -0.130096435546875, -0.1133270263671875, -0.0965576171875, -0.0797882080078125, -0.063018798828125, -0.0462493896484375, -0.02947998046875, -0.0127105712890625, 0.004058837890625, 0.0208282470703125, 0.03759765625, 0.0543670654296875, 0.071136474609375, 0.0879058837890625, 0.10467529296875, 0.1214447021484375, 0.138214111328125, 0.1549835205078125, 0.1717529296875, 0.1885223388671875, 0.205291748046875, 0.2220611572265625, 0.23883056640625, 0.2555999755859375, 0.272369384765625, 0.2891387939453125, 0.305908203125, 0.3226776123046875, 0.339447021484375, 0.3562164306640625, 0.37298583984375, 0.3897552490234375, 0.406524658203125, 0.4232940673828125, 0.4400634765625, 0.4568328857421875, 0.473602294921875, 0.4903717041015625, 0.50714111328125, 0.5239105224609375, 0.540679931640625, 0.5574493408203125, 0.57421875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 7.0, 9.0, 9.0, 12.0, 13.0, 13.0, 19.0, 23.0, 31.0, 42.0, 58.0, 95.0, 113.0, 124.0, 100.0, 86.0, 52.0, 50.0, 26.0, 22.0, 19.0, 12.0, 11.0, 11.0, 10.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001061558723449707, -0.0001029549166560173, -9.97539609670639e-05, -9.65530052781105e-05, -9.33520495891571e-05, -9.01510939002037e-05, -8.69501382112503e-05, -8.37491825222969e-05, -8.05482268333435e-05, -7.73472711443901e-05, -7.41463154554367e-05, -7.094535976648331e-05, -6.774440407752991e-05, -6.454344838857651e-05, -6.134249269962311e-05, -5.814153701066971e-05, -5.494058132171631e-05, -5.173962563276291e-05, -4.853866994380951e-05, -4.533771425485611e-05, -4.213675856590271e-05, -3.893580287694931e-05, -3.573484718799591e-05, -3.253389149904251e-05, -2.933293581008911e-05, -2.613198012113571e-05, -2.2931024432182312e-05, -1.9730068743228912e-05, -1.6529113054275513e-05, -1.3328157365322113e-05, -1.0127201676368713e-05, -6.926245987415314e-06, -3.725290298461914e-06, -5.243346095085144e-07, 2.6766210794448853e-06, 5.877576768398285e-06, 9.078532457351685e-06, 1.2279488146305084e-05, 1.5480443835258484e-05, 1.8681399524211884e-05, 2.1882355213165283e-05, 2.5083310902118683e-05, 2.8284266591072083e-05, 3.148522228002548e-05, 3.468617796897888e-05, 3.788713365793228e-05, 4.108808934688568e-05, 4.428904503583908e-05, 4.749000072479248e-05, 5.069095641374588e-05, 5.389191210269928e-05, 5.709286779165268e-05, 6.029382348060608e-05, 6.349477916955948e-05, 6.669573485851288e-05, 6.989669054746628e-05, 7.309764623641968e-05, 7.629860192537308e-05, 7.949955761432648e-05, 8.270051330327988e-05, 8.590146899223328e-05, 8.910242468118668e-05, 9.230338037014008e-05, 9.550433605909348e-05, 9.870529174804688e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 6.0, 5.0, 2.0, 6.0, 9.0, 3.0, 10.0, 15.0, 28.0, 28.0, 50.0, 83.0, 148.0, 242.0, 478.0, 879.0, 1873.0, 4548.0, 15518.0, 108740.0, 794635.0, 98444.0, 14677.0, 4438.0, 1758.0, 903.0, 425.0, 245.0, 131.0, 71.0, 49.0, 36.0, 21.0, 14.0, 11.0, 7.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.34619140625, -0.3351936340332031, -0.32419586181640625, -0.3131980895996094, -0.3022003173828125, -0.2912025451660156, -0.28020477294921875, -0.2692070007324219, -0.258209228515625, -0.24721145629882812, -0.23621368408203125, -0.22521591186523438, -0.2142181396484375, -0.20322036743164062, -0.19222259521484375, -0.18122482299804688, -0.17022705078125, -0.15922927856445312, -0.14823150634765625, -0.13723373413085938, -0.1262359619140625, -0.11523818969726562, -0.10424041748046875, -0.09324264526367188, -0.082244873046875, -0.07124710083007812, -0.06024932861328125, -0.049251556396484375, -0.0382537841796875, -0.027256011962890625, -0.01625823974609375, -0.005260467529296875, 0.0057373046875, 0.016735076904296875, 0.02773284912109375, 0.038730621337890625, 0.0497283935546875, 0.060726165771484375, 0.07172393798828125, 0.08272171020507812, 0.093719482421875, 0.10471725463867188, 0.11571502685546875, 0.12671279907226562, 0.1377105712890625, 0.14870834350585938, 0.15970611572265625, 0.17070388793945312, 0.18170166015625, 0.19269943237304688, 0.20369720458984375, 0.21469497680664062, 0.2256927490234375, 0.23669052124023438, 0.24768829345703125, 0.2586860656738281, 0.269683837890625, 0.2806816101074219, 0.29167938232421875, 0.3026771545410156, 0.3136749267578125, 0.3246726989746094, 0.33567047119140625, 0.3466682434082031, 0.357666015625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 4.0, 9.0, 23.0, 41.0, 53.0, 82.0, 168.0, 208.0, 159.0, 89.0, 63.0, 33.0, 18.0, 10.0, 6.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.43798828125, -0.42317962646484375, -0.4083709716796875, -0.39356231689453125, -0.378753662109375, -0.36394500732421875, -0.3491363525390625, -0.33432769775390625, -0.31951904296875, -0.30471038818359375, -0.2899017333984375, -0.27509307861328125, -0.260284423828125, -0.24547576904296875, -0.2306671142578125, -0.21585845947265625, -0.2010498046875, -0.18624114990234375, -0.1714324951171875, -0.15662384033203125, -0.141815185546875, -0.12700653076171875, -0.1121978759765625, -0.09738922119140625, -0.08258056640625, -0.06777191162109375, -0.0529632568359375, -0.03815460205078125, -0.023345947265625, -0.00853729248046875, 0.0062713623046875, 0.02108001708984375, 0.035888671875, 0.05069732666015625, 0.0655059814453125, 0.08031463623046875, 0.095123291015625, 0.10993194580078125, 0.1247406005859375, 0.13954925537109375, 0.15435791015625, 0.16916656494140625, 0.1839752197265625, 0.19878387451171875, 0.213592529296875, 0.22840118408203125, 0.2432098388671875, 0.25801849365234375, 0.2728271484375, 0.28763580322265625, 0.3024444580078125, 0.31725311279296875, 0.332061767578125, 0.34687042236328125, 0.3616790771484375, 0.37648773193359375, 0.39129638671875, 0.40610504150390625, 0.4209136962890625, 0.43572235107421875, 0.450531005859375, 0.46533966064453125, 0.4801483154296875, 0.49495697021484375, 0.509765625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 14.0, 67.0, 273.0, 434.0, 147.0, 51.0, 15.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.775846481323242, -7.489560127258301, -7.203273773193359, -6.916987895965576, -6.630701541900635, -6.344415187835693, -6.05812931060791, -5.771842956542969, -5.485556602478027, -5.199270248413086, -4.9129838943481445, -4.626698017120361, -4.34041166305542, -4.0541253089904785, -3.767839193344116, -3.481553077697754, -3.1952667236328125, -2.908980369567871, -2.622694253921509, -2.3364081382751465, -2.050121784210205, -1.7638355493545532, -1.4775493144989014, -1.191263198852539, -0.9049768447875977, -0.6186906099319458, -0.33240437507629395, -0.04611814022064209, 0.24016809463500977, 0.5264543294906616, 0.8127405643463135, 1.0990266799926758, 1.3853130340576172, 1.671599268913269, 1.957885503768921, 2.244171619415283, 2.5304579734802246, 2.816744327545166, 3.1030304431915283, 3.3893165588378906, 3.675602912902832, 3.9618892669677734, 4.248175621032715, 4.534461498260498, 4.8207478523254395, 5.107034206390381, 5.393320083618164, 5.6796064376831055, 5.965892791748047, 6.252179145812988, 6.53846549987793, 6.824751377105713, 7.111037731170654, 7.397324085235596, 7.683609962463379, 7.96989631652832, 8.256182670593262, 8.542469024658203, 8.828755378723145, 9.115041732788086, 9.401327133178711, 9.687613487243652, 9.973899841308594, 10.260186195373535, 10.546472549438477]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 5.0, 7.0, 5.0, 4.0, 6.0, 8.0, 8.0, 11.0, 16.0, 14.0, 22.0, 19.0, 15.0, 28.0, 27.0, 25.0, 38.0, 24.0, 35.0, 27.0, 51.0, 40.0, 31.0, 43.0, 39.0, 46.0, 38.0, 35.0, 40.0, 38.0, 36.0, 34.0, 30.0, 24.0, 24.0, 18.0, 15.0, 10.0, 8.0, 14.0, 11.0, 9.0, 6.0, 4.0, 9.0, 4.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.003347873687744, -1.9367088079452515, -1.8700697422027588, -1.8034306764602661, -1.7367916107177734, -1.6701526641845703, -1.6035135984420776, -1.536874532699585, -1.4702354669570923, -1.4035964012145996, -1.336957335472107, -1.2703182697296143, -1.2036793231964111, -1.137040138244629, -1.0704011917114258, -1.003762125968933, -0.9371230602264404, -0.8704839944839478, -0.8038449287414551, -0.7372059226036072, -0.6705668568611145, -0.6039277911186218, -0.5372887849807739, -0.47064971923828125, -0.4040106534957886, -0.3373715877532959, -0.2707325518131256, -0.20409350097179413, -0.13745445013046265, -0.07081538438796997, -0.004176348447799683, 0.062462687492370605, 0.12910175323486328, 0.19574080407619476, 0.26237985491752625, 0.32901889085769653, 0.3956579566001892, 0.4622970223426819, 0.5289360284805298, 0.5955750942230225, 0.6622141599655151, 0.7288532257080078, 0.7954922914505005, 0.8621312975883484, 0.9287703633308411, 0.9954094290733337, 1.0620484352111816, 1.1286875009536743, 1.195326566696167, 1.2619656324386597, 1.3286046981811523, 1.395243763923645, 1.4618828296661377, 1.5285217761993408, 1.5951608419418335, 1.6617999076843262, 1.7284389734268188, 1.7950780391693115, 1.8617171049118042, 1.9283561706542969, 1.9949951171875, 2.0616343021392822, 2.1282732486724854, 2.1949124336242676, 2.2615513801574707]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 8.0, 11.0, 13.0, 14.0, 17.0, 30.0, 39.0, 65.0, 91.0, 134.0, 251.0, 418.0, 799.0, 1760.0, 5085.0, 23163.0, 2460466.0, 1671044.0, 23183.0, 4617.0, 1621.0, 684.0, 330.0, 173.0, 95.0, 66.0, 28.0, 28.0, 16.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.8408203125, -0.8207969665527344, -0.8007736206054688, -0.7807502746582031, -0.7607269287109375, -0.7407035827636719, -0.7206802368164062, -0.7006568908691406, -0.680633544921875, -0.6606101989746094, -0.6405868530273438, -0.6205635070800781, -0.6005401611328125, -0.5805168151855469, -0.5604934692382812, -0.5404701232910156, -0.52044677734375, -0.5004234313964844, -0.48040008544921875, -0.4603767395019531, -0.4403533935546875, -0.4203300476074219, -0.40030670166015625, -0.3802833557128906, -0.360260009765625, -0.3402366638183594, -0.32021331787109375, -0.3001899719238281, -0.2801666259765625, -0.2601432800292969, -0.24011993408203125, -0.22009658813476562, -0.2000732421875, -0.18004989624023438, -0.16002655029296875, -0.14000320434570312, -0.1199798583984375, -0.09995651245117188, -0.07993316650390625, -0.059909820556640625, -0.039886474609375, -0.019863128662109375, 0.00016021728515625, 0.020183563232421875, 0.0402069091796875, 0.060230255126953125, 0.08025360107421875, 0.10027694702148438, 0.12030029296875, 0.14032363891601562, 0.16034698486328125, 0.18037033081054688, 0.2003936767578125, 0.22041702270507812, 0.24044036865234375, 0.2604637145996094, 0.280487060546875, 0.3005104064941406, 0.32053375244140625, 0.3405570983886719, 0.3605804443359375, 0.3806037902832031, 0.40062713623046875, 0.4206504821777344, 0.440673828125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 7.0, 9.0, 8.0, 22.0, 31.0, 26.0, 74.0, 106.0, 113.0, 117.0, 119.0, 98.0, 98.0, 60.0, 56.0, 17.0, 17.0, 7.0, 4.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2047119140625, -0.19882583618164062, -0.19293975830078125, -0.18705368041992188, -0.1811676025390625, -0.17528152465820312, -0.16939544677734375, -0.16350936889648438, -0.157623291015625, -0.15173721313476562, -0.14585113525390625, -0.13996505737304688, -0.1340789794921875, -0.12819290161132812, -0.12230682373046875, -0.11642074584960938, -0.11053466796875, -0.10464859008789062, -0.09876251220703125, -0.09287643432617188, -0.0869903564453125, -0.08110427856445312, -0.07521820068359375, -0.06933212280273438, -0.063446044921875, -0.057559967041015625, -0.05167388916015625, -0.045787811279296875, -0.0399017333984375, -0.034015655517578125, -0.02812957763671875, -0.022243499755859375, -0.016357421875, -0.010471343994140625, -0.00458526611328125, 0.001300811767578125, 0.0071868896484375, 0.013072967529296875, 0.01895904541015625, 0.024845123291015625, 0.030731201171875, 0.036617279052734375, 0.04250335693359375, 0.048389434814453125, 0.0542755126953125, 0.060161590576171875, 0.06604766845703125, 0.07193374633789062, 0.07781982421875, 0.08370590209960938, 0.08959197998046875, 0.09547805786132812, 0.1013641357421875, 0.10725021362304688, 0.11313629150390625, 0.11902236938476562, 0.124908447265625, 0.13079452514648438, 0.13668060302734375, 0.14256668090820312, 0.1484527587890625, 0.15433883666992188, 0.16022491455078125, 0.16611099243164062, 0.1719970703125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 3.0, 8.0, 14.0, 15.0, 30.0, 49.0, 100.0, 256.0, 575.0, 1550.0, 5347.0, 32150.0, 2414678.0, 1702405.0, 29566.0, 5164.0, 1431.0, 523.0, 226.0, 92.0, 53.0, 16.0, 10.0, 7.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.703125, -0.685089111328125, -0.66705322265625, -0.649017333984375, -0.6309814453125, -0.612945556640625, -0.59490966796875, -0.576873779296875, -0.558837890625, -0.540802001953125, -0.52276611328125, -0.504730224609375, -0.4866943359375, -0.468658447265625, -0.45062255859375, -0.432586669921875, -0.41455078125, -0.396514892578125, -0.37847900390625, -0.360443115234375, -0.3424072265625, -0.324371337890625, -0.30633544921875, -0.288299560546875, -0.270263671875, -0.252227783203125, -0.23419189453125, -0.216156005859375, -0.1981201171875, -0.180084228515625, -0.16204833984375, -0.144012451171875, -0.1259765625, -0.107940673828125, -0.08990478515625, -0.071868896484375, -0.0538330078125, -0.035797119140625, -0.01776123046875, 0.000274658203125, 0.018310546875, 0.036346435546875, 0.05438232421875, 0.072418212890625, 0.0904541015625, 0.108489990234375, 0.12652587890625, 0.144561767578125, 0.16259765625, 0.180633544921875, 0.19866943359375, 0.216705322265625, 0.2347412109375, 0.252777099609375, 0.27081298828125, 0.288848876953125, 0.306884765625, 0.324920654296875, 0.34295654296875, 0.360992431640625, 0.3790283203125, 0.397064208984375, 0.41510009765625, 0.433135986328125, 0.451171875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 8.0, 10.0, 6.0, 14.0, 17.0, 32.0, 34.0, 44.0, 80.0, 185.0, 499.0, 1601.0, 951.0, 303.0, 124.0, 54.0, 26.0, 29.0, 12.0, 11.0, 12.0, 3.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1436767578125, -0.1390094757080078, -0.13434219360351562, -0.12967491149902344, -0.12500762939453125, -0.12034034729003906, -0.11567306518554688, -0.11100578308105469, -0.1063385009765625, -0.10167121887207031, -0.09700393676757812, -0.09233665466308594, -0.08766937255859375, -0.08300209045410156, -0.07833480834960938, -0.07366752624511719, -0.069000244140625, -0.06433296203613281, -0.059665679931640625, -0.05499839782714844, -0.05033111572265625, -0.04566383361816406, -0.040996551513671875, -0.03632926940917969, -0.0316619873046875, -0.026994705200195312, -0.022327423095703125, -0.017660140991210938, -0.01299285888671875, -0.008325576782226562, -0.003658294677734375, 0.0010089874267578125, 0.00567626953125, 0.010343551635742188, 0.015010833740234375, 0.019678115844726562, 0.02434539794921875, 0.029012680053710938, 0.033679962158203125, 0.03834724426269531, 0.0430145263671875, 0.04768180847167969, 0.052349090576171875, 0.05701637268066406, 0.06168365478515625, 0.06635093688964844, 0.07101821899414062, 0.07568550109863281, 0.080352783203125, 0.08502006530761719, 0.08968734741210938, 0.09435462951660156, 0.09902191162109375, 0.10368919372558594, 0.10835647583007812, 0.11302375793457031, 0.1176910400390625, 0.12235832214355469, 0.12702560424804688, 0.13169288635253906, 0.13636016845703125, 0.14102745056152344, 0.14569473266601562, 0.1503620147705078, 0.155029296875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 5.0, 16.0, 20.0, 53.0, 73.0, 119.0, 170.0, 184.0, 162.0, 81.0, 55.0, 26.0, 14.0, 6.0, 4.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.856290340423584, -0.8283697366714478, -0.8004491329193115, -0.7725285291671753, -0.7446079254150391, -0.7166873216629028, -0.6887667179107666, -0.6608460545539856, -0.6329254508018494, -0.6050048470497131, -0.5770842432975769, -0.5491636395454407, -0.5212430357933044, -0.4933224022388458, -0.4654017984867096, -0.437481164932251, -0.40956059098243713, -0.3816399872303009, -0.3537193834781647, -0.32579874992370605, -0.2978781461715698, -0.2699575424194336, -0.24203693866729736, -0.21411632001399994, -0.1861957162618637, -0.15827511250972748, -0.13035449385643005, -0.10243389010429382, -0.074513278901577, -0.04659266769886017, -0.018672063946723938, 0.009248554706573486, 0.03716915845870972, 0.06508976966142654, 0.09301038086414337, 0.1209309846162796, 0.14885160326957703, 0.17677220702171326, 0.2046928107738495, 0.2326134294271469, 0.26053404808044434, 0.28845465183258057, 0.3163752555847168, 0.344295859336853, 0.37221649289131165, 0.4001370966434479, 0.4280577003955841, 0.4559783339500427, 0.48389890789985657, 0.5118195414543152, 0.5397401452064514, 0.5676607489585876, 0.5955813527107239, 0.6235019564628601, 0.6514225602149963, 0.6793431639671326, 0.7072637677192688, 0.735184371471405, 0.7631049752235413, 0.7910255789756775, 0.8189461827278137, 0.8468668460845947, 0.874787449836731, 0.9027080535888672, 0.9306286573410034]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 6.0, 3.0, 9.0, 18.0, 28.0, 22.0, 39.0, 40.0, 45.0, 37.0, 52.0, 55.0, 53.0, 56.0, 67.0, 64.0, 74.0, 55.0, 41.0, 38.0, 41.0, 40.0, 20.0, 22.0, 18.0, 18.0, 14.0, 10.0, 6.0, 7.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5382129549980164, -0.5204073190689087, -0.502601683139801, -0.48479604721069336, -0.4669904112815857, -0.449184775352478, -0.43137913942337036, -0.4135735034942627, -0.39576786756515503, -0.37796223163604736, -0.3601565957069397, -0.34235095977783203, -0.32454532384872437, -0.3067396879196167, -0.28893405199050903, -0.27112841606140137, -0.2533227801322937, -0.23551714420318604, -0.21771150827407837, -0.1999058723449707, -0.18210023641586304, -0.16429460048675537, -0.1464889645576477, -0.12868332862854004, -0.11087769269943237, -0.09307205677032471, -0.07526642084121704, -0.057460784912109375, -0.03965514898300171, -0.021849513053894043, -0.004043877124786377, 0.013761758804321289, 0.03156733512878418, 0.049372971057891846, 0.06717860698699951, 0.08498424291610718, 0.10278987884521484, 0.12059551477432251, 0.13840115070343018, 0.15620678663253784, 0.1740124225616455, 0.19181805849075317, 0.20962369441986084, 0.2274293303489685, 0.24523496627807617, 0.26304060220718384, 0.2808462381362915, 0.29865187406539917, 0.31645750999450684, 0.3342631459236145, 0.35206878185272217, 0.36987441778182983, 0.3876800537109375, 0.40548568964004517, 0.42329132556915283, 0.4410969614982605, 0.45890259742736816, 0.47670823335647583, 0.4945138692855835, 0.5123195052146912, 0.5301251411437988, 0.5479307770729065, 0.5657364130020142, 0.5835420489311218, 0.6013476848602295]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 7.0, 10.0, 18.0, 16.0, 22.0, 43.0, 44.0, 97.0, 126.0, 261.0, 407.0, 837.0, 1887.0, 5746.0, 31308.0, 494774.0, 473879.0, 29713.0, 5504.0, 1917.0, 821.0, 451.0, 253.0, 138.0, 96.0, 55.0, 46.0, 29.0, 14.0, 9.0, 8.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89599609375, -0.8679885864257812, -0.8399810791015625, -0.8119735717773438, -0.783966064453125, -0.7559585571289062, -0.7279510498046875, -0.6999435424804688, -0.67193603515625, -0.6439285278320312, -0.6159210205078125, -0.5879135131835938, -0.559906005859375, -0.5318984985351562, -0.5038909912109375, -0.47588348388671875, -0.4478759765625, -0.41986846923828125, -0.3918609619140625, -0.36385345458984375, -0.335845947265625, -0.30783843994140625, -0.2798309326171875, -0.25182342529296875, -0.22381591796875, -0.19580841064453125, -0.1678009033203125, -0.13979339599609375, -0.111785888671875, -0.08377838134765625, -0.0557708740234375, -0.02776336669921875, 0.000244140625, 0.02825164794921875, 0.0562591552734375, 0.08426666259765625, 0.112274169921875, 0.14028167724609375, 0.1682891845703125, 0.19629669189453125, 0.22430419921875, 0.25231170654296875, 0.2803192138671875, 0.30832672119140625, 0.336334228515625, 0.36434173583984375, 0.3923492431640625, 0.42035675048828125, 0.4483642578125, 0.47637176513671875, 0.5043792724609375, 0.5323867797851562, 0.560394287109375, 0.5884017944335938, 0.6164093017578125, 0.6444168090820312, 0.67242431640625, 0.7004318237304688, 0.7284393310546875, 0.7564468383789062, 0.784454345703125, 0.8124618530273438, 0.8404693603515625, 0.8684768676757812, 0.896484375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 9.0, 7.0, 10.0, 24.0, 28.0, 43.0, 68.0, 114.0, 125.0, 112.0, 113.0, 98.0, 83.0, 62.0, 48.0, 19.0, 15.0, 8.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.200927734375, -0.1951160430908203, -0.18930435180664062, -0.18349266052246094, -0.17768096923828125, -0.17186927795410156, -0.16605758666992188, -0.1602458953857422, -0.1544342041015625, -0.1486225128173828, -0.14281082153320312, -0.13699913024902344, -0.13118743896484375, -0.12537574768066406, -0.11956405639648438, -0.11375236511230469, -0.107940673828125, -0.10212898254394531, -0.09631729125976562, -0.09050559997558594, -0.08469390869140625, -0.07888221740722656, -0.07307052612304688, -0.06725883483886719, -0.0614471435546875, -0.05563545227050781, -0.049823760986328125, -0.04401206970214844, -0.03820037841796875, -0.03238868713378906, -0.026576995849609375, -0.020765304565429688, -0.01495361328125, -0.009141921997070312, -0.003330230712890625, 0.0024814605712890625, 0.00829315185546875, 0.014104843139648438, 0.019916534423828125, 0.025728225708007812, 0.0315399169921875, 0.03735160827636719, 0.043163299560546875, 0.04897499084472656, 0.05478668212890625, 0.06059837341308594, 0.06641006469726562, 0.07222175598144531, 0.078033447265625, 0.08384513854980469, 0.08965682983398438, 0.09546852111816406, 0.10128021240234375, 0.10709190368652344, 0.11290359497070312, 0.11871528625488281, 0.1245269775390625, 0.1303386688232422, 0.13615036010742188, 0.14196205139160156, 0.14777374267578125, 0.15358543395996094, 0.15939712524414062, 0.1652088165283203, 0.1710205078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 4.0, 5.0, 8.0, 19.0, 16.0, 27.0, 36.0, 43.0, 57.0, 87.0, 124.0, 167.0, 258.0, 350.0, 558.0, 847.0, 1424.0, 2541.0, 4704.0, 9531.0, 20049.0, 44897.0, 107053.0, 244265.0, 320629.0, 163189.0, 69107.0, 29906.0, 13477.0, 6598.0, 3501.0, 1832.0, 1151.0, 713.0, 453.0, 297.0, 182.0, 109.0, 82.0, 66.0, 46.0, 51.0, 26.0, 22.0, 12.0, 13.0, 7.0, 6.0, 9.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.2734375, -0.2652130126953125, -0.256988525390625, -0.2487640380859375, -0.24053955078125, -0.2323150634765625, -0.224090576171875, -0.2158660888671875, -0.2076416015625, -0.1994171142578125, -0.191192626953125, -0.1829681396484375, -0.17474365234375, -0.1665191650390625, -0.158294677734375, -0.1500701904296875, -0.141845703125, -0.1336212158203125, -0.125396728515625, -0.1171722412109375, -0.10894775390625, -0.1007232666015625, -0.092498779296875, -0.0842742919921875, -0.0760498046875, -0.0678253173828125, -0.059600830078125, -0.0513763427734375, -0.04315185546875, -0.0349273681640625, -0.026702880859375, -0.0184783935546875, -0.01025390625, -0.0020294189453125, 0.006195068359375, 0.0144195556640625, 0.02264404296875, 0.0308685302734375, 0.039093017578125, 0.0473175048828125, 0.0555419921875, 0.0637664794921875, 0.071990966796875, 0.0802154541015625, 0.08843994140625, 0.0966644287109375, 0.104888916015625, 0.1131134033203125, 0.121337890625, 0.1295623779296875, 0.137786865234375, 0.1460113525390625, 0.15423583984375, 0.1624603271484375, 0.170684814453125, 0.1789093017578125, 0.1871337890625, 0.1953582763671875, 0.203582763671875, 0.2118072509765625, 0.22003173828125, 0.2282562255859375, 0.236480712890625, 0.2447052001953125, 0.2529296875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 2.0, 3.0, 4.0, 3.0, 9.0, 11.0, 12.0, 16.0, 16.0, 22.0, 21.0, 23.0, 18.0, 33.0, 27.0, 34.0, 40.0, 37.0, 46.0, 43.0, 34.0, 45.0, 37.0, 57.0, 35.0, 35.0, 36.0, 37.0, 41.0, 38.0, 24.0, 15.0, 19.0, 27.0, 19.0, 13.0, 19.0, 8.0, 9.0, 4.0, 9.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.387939453125, -0.3761177062988281, -0.36429595947265625, -0.3524742126464844, -0.3406524658203125, -0.3288307189941406, -0.31700897216796875, -0.3051872253417969, -0.293365478515625, -0.2815437316894531, -0.26972198486328125, -0.2579002380371094, -0.2460784912109375, -0.23425674438476562, -0.22243499755859375, -0.21061325073242188, -0.19879150390625, -0.18696975708007812, -0.17514801025390625, -0.16332626342773438, -0.1515045166015625, -0.13968276977539062, -0.12786102294921875, -0.11603927612304688, -0.104217529296875, -0.09239578247070312, -0.08057403564453125, -0.06875228881835938, -0.0569305419921875, -0.045108795166015625, -0.03328704833984375, -0.021465301513671875, -0.0096435546875, 0.002178192138671875, 0.01399993896484375, 0.025821685791015625, 0.0376434326171875, 0.049465179443359375, 0.06128692626953125, 0.07310867309570312, 0.084930419921875, 0.09675216674804688, 0.10857391357421875, 0.12039566040039062, 0.1322174072265625, 0.14403915405273438, 0.15586090087890625, 0.16768264770507812, 0.17950439453125, 0.19132614135742188, 0.20314788818359375, 0.21496963500976562, 0.2267913818359375, 0.23861312866210938, 0.25043487548828125, 0.2622566223144531, 0.274078369140625, 0.2859001159667969, 0.29772186279296875, 0.3095436096191406, 0.3213653564453125, 0.3331871032714844, 0.34500885009765625, 0.3568305969238281, 0.36865234375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 8.0, 9.0, 5.0, 16.0, 35.0, 44.0, 65.0, 131.0, 242.0, 488.0, 983.0, 2409.0, 7462.0, 40318.0, 619894.0, 340885.0, 26191.0, 5680.0, 1947.0, 779.0, 432.0, 209.0, 121.0, 70.0, 39.0, 30.0, 15.0, 14.0, 6.0, 5.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.333251953125, -0.3231201171875, -0.31298828125, -0.3028564453125, -0.292724609375, -0.2825927734375, -0.2724609375, -0.2623291015625, -0.252197265625, -0.2420654296875, -0.23193359375, -0.2218017578125, -0.211669921875, -0.2015380859375, -0.19140625, -0.1812744140625, -0.171142578125, -0.1610107421875, -0.15087890625, -0.1407470703125, -0.130615234375, -0.1204833984375, -0.1103515625, -0.1002197265625, -0.090087890625, -0.0799560546875, -0.06982421875, -0.0596923828125, -0.049560546875, -0.0394287109375, -0.029296875, -0.0191650390625, -0.009033203125, 0.0010986328125, 0.01123046875, 0.0213623046875, 0.031494140625, 0.0416259765625, 0.0517578125, 0.0618896484375, 0.072021484375, 0.0821533203125, 0.09228515625, 0.1024169921875, 0.112548828125, 0.1226806640625, 0.1328125, 0.1429443359375, 0.153076171875, 0.1632080078125, 0.17333984375, 0.1834716796875, 0.193603515625, 0.2037353515625, 0.2138671875, 0.2239990234375, 0.234130859375, 0.2442626953125, 0.25439453125, 0.2645263671875, 0.274658203125, 0.2847900390625, 0.294921875, 0.3050537109375, 0.315185546875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 0.0, 4.0, 7.0, 10.0, 14.0, 17.0, 17.0, 22.0, 28.0, 34.0, 41.0, 52.0, 65.0, 79.0, 114.0, 105.0, 76.0, 54.0, 60.0, 34.0, 28.0, 20.0, 26.0, 22.0, 20.0, 9.0, 11.0, 10.0, 9.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010508298873901367, -0.00010134372860193253, -9.760446846485138e-05, -9.386520832777023e-05, -9.012594819068909e-05, -8.638668805360794e-05, -8.26474279165268e-05, -7.890816777944565e-05, -7.51689076423645e-05, -7.142964750528336e-05, -6.769038736820221e-05, -6.395112723112106e-05, -6.021186709403992e-05, -5.647260695695877e-05, -5.2733346819877625e-05, -4.899408668279648e-05, -4.525482654571533e-05, -4.1515566408634186e-05, -3.777630627155304e-05, -3.403704613447189e-05, -3.0297785997390747e-05, -2.65585258603096e-05, -2.2819265723228455e-05, -1.908000558614731e-05, -1.5340745449066162e-05, -1.1601485311985016e-05, -7.86222517490387e-06, -4.122965037822723e-06, -3.8370490074157715e-07, 3.355555236339569e-06, 7.094815373420715e-06, 1.0834075510501862e-05, 1.4573335647583008e-05, 1.8312595784664154e-05, 2.20518559217453e-05, 2.5791116058826447e-05, 2.9530376195907593e-05, 3.326963633298874e-05, 3.7008896470069885e-05, 4.074815660715103e-05, 4.448741674423218e-05, 4.8226676881313324e-05, 5.196593701839447e-05, 5.5705197155475616e-05, 5.944445729255676e-05, 6.318371742963791e-05, 6.692297756671906e-05, 7.06622377038002e-05, 7.440149784088135e-05, 7.81407579779625e-05, 8.188001811504364e-05, 8.561927825212479e-05, 8.935853838920593e-05, 9.309779852628708e-05, 9.683705866336823e-05, 0.00010057631880044937, 0.00010431557893753052, 0.00010805483907461166, 0.00011179409921169281, 0.00011553335934877396, 0.0001192726194858551, 0.00012301187962293625, 0.0001267511397600174, 0.00013049039989709854, 0.0001342296600341797]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 5.0, 12.0, 24.0, 30.0, 47.0, 85.0, 132.0, 272.0, 646.0, 1640.0, 5252.0, 21809.0, 194329.0, 739852.0, 68070.0, 11178.0, 3122.0, 1104.0, 470.0, 210.0, 98.0, 68.0, 31.0, 24.0, 14.0, 6.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.331298828125, -0.3199882507324219, -0.30867767333984375, -0.2973670959472656, -0.2860565185546875, -0.2747459411621094, -0.26343536376953125, -0.2521247863769531, -0.240814208984375, -0.22950363159179688, -0.21819305419921875, -0.20688247680664062, -0.1955718994140625, -0.18426132202148438, -0.17295074462890625, -0.16164016723632812, -0.15032958984375, -0.13901901245117188, -0.12770843505859375, -0.11639785766601562, -0.1050872802734375, -0.09377670288085938, -0.08246612548828125, -0.07115554809570312, -0.059844970703125, -0.048534393310546875, -0.03722381591796875, -0.025913238525390625, -0.0146026611328125, -0.003292083740234375, 0.00801849365234375, 0.019329071044921875, 0.0306396484375, 0.041950225830078125, 0.05326080322265625, 0.06457138061523438, 0.0758819580078125, 0.08719253540039062, 0.09850311279296875, 0.10981369018554688, 0.121124267578125, 0.13243484497070312, 0.14374542236328125, 0.15505599975585938, 0.1663665771484375, 0.17767715454101562, 0.18898773193359375, 0.20029830932617188, 0.21160888671875, 0.22291946411132812, 0.23423004150390625, 0.24554061889648438, 0.2568511962890625, 0.2681617736816406, 0.27947235107421875, 0.2907829284667969, 0.302093505859375, 0.3134040832519531, 0.32471466064453125, 0.3360252380371094, 0.3473358154296875, 0.3586463928222656, 0.36995697021484375, 0.3812675476074219, 0.392578125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 6.0, 0.0, 5.0, 5.0, 10.0, 11.0, 14.0, 29.0, 27.0, 27.0, 52.0, 62.0, 73.0, 98.0, 119.0, 118.0, 74.0, 55.0, 53.0, 38.0, 22.0, 16.0, 16.0, 16.0, 8.0, 7.0, 5.0, 3.0, 5.0, 6.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2379150390625, -0.22928810119628906, -0.22066116333007812, -0.2120342254638672, -0.20340728759765625, -0.1947803497314453, -0.18615341186523438, -0.17752647399902344, -0.1688995361328125, -0.16027259826660156, -0.15164566040039062, -0.1430187225341797, -0.13439178466796875, -0.1257648468017578, -0.11713790893554688, -0.10851097106933594, -0.099884033203125, -0.09125709533691406, -0.08263015747070312, -0.07400321960449219, -0.06537628173828125, -0.05674934387207031, -0.048122406005859375, -0.03949546813964844, -0.0308685302734375, -0.022241592407226562, -0.013614654541015625, -0.0049877166748046875, 0.00363922119140625, 0.012266159057617188, 0.020893096923828125, 0.029520034790039062, 0.03814697265625, 0.04677391052246094, 0.055400848388671875, 0.06402778625488281, 0.07265472412109375, 0.08128166198730469, 0.08990859985351562, 0.09853553771972656, 0.1071624755859375, 0.11578941345214844, 0.12441635131835938, 0.1330432891845703, 0.14167022705078125, 0.1502971649169922, 0.15892410278320312, 0.16755104064941406, 0.176177978515625, 0.18480491638183594, 0.19343185424804688, 0.2020587921142578, 0.21068572998046875, 0.2193126678466797, 0.22793960571289062, 0.23656654357910156, 0.2451934814453125, 0.25382041931152344, 0.2624473571777344, 0.2710742950439453, 0.27970123291015625, 0.2883281707763672, 0.2969551086425781, 0.30558204650878906, 0.314208984375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 10.0, 30.0, 69.0, 168.0, 265.0, 203.0, 132.0, 69.0, 20.0, 15.0, 11.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.605701446533203, -6.420915126800537, -6.236128807067871, -6.051342487335205, -5.866556167602539, -5.681770324707031, -5.496984004974365, -5.312197685241699, -5.127411365509033, -4.942625045776367, -4.757838726043701, -4.573052406311035, -4.388266563415527, -4.203480243682861, -4.018693923950195, -3.8339076042175293, -3.6491212844848633, -3.4643349647521973, -3.2795486450195312, -3.0947625637054443, -2.9099762439727783, -2.7251899242401123, -2.5404038429260254, -2.3556175231933594, -2.1708312034606934, -1.9860448837280273, -1.8012586832046509, -1.6164724826812744, -1.4316861629486084, -1.2468998432159424, -1.062113642692566, -0.8773274421691895, -0.6925411224365234, -0.5077548623085022, -0.32296860218048096, -0.13818234205245972, 0.04660391807556152, 0.23139017820358276, 0.416176438331604, 0.6009626388549805, 0.7857489585876465, 0.9705352187156677, 1.155321478843689, 1.3401076793670654, 1.5248939990997314, 1.7096803188323975, 1.894466519355774, 2.0792527198791504, 2.2640390396118164, 2.4488253593444824, 2.6336116790771484, 2.8183977603912354, 3.0031840801239014, 3.1879703998565674, 3.3727564811706543, 3.5575428009033203, 3.7423291206359863, 3.9271154403686523, 4.111901760101318, 4.296688079833984, 4.481473922729492, 4.666260242462158, 4.851046562194824, 5.03583288192749, 5.220619201660156]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 5.0, 6.0, 2.0, 12.0, 14.0, 13.0, 18.0, 12.0, 16.0, 10.0, 30.0, 24.0, 31.0, 45.0, 34.0, 29.0, 25.0, 34.0, 35.0, 41.0, 43.0, 44.0, 52.0, 50.0, 45.0, 47.0, 42.0, 32.0, 24.0, 25.0, 14.0, 24.0, 17.0, 23.0, 17.0, 16.0, 8.0, 8.0, 8.0, 4.0, 4.0, 6.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.5272819995880127, -2.450314521789551, -2.373347043991089, -2.296379566192627, -2.219412326812744, -2.1424448490142822, -2.0654773712158203, -1.9885098934173584, -1.9115424156188965, -1.8345749378204346, -1.7576075792312622, -1.6806401014328003, -1.6036726236343384, -1.526705265045166, -1.449737787246704, -1.3727703094482422, -1.2958029508590698, -1.218835473060608, -1.1418681144714355, -1.0649006366729736, -0.9879331588745117, -0.9109657406806946, -0.8339983224868774, -0.7570308446884155, -0.6800634264945984, -0.6030960083007812, -0.5261285305023193, -0.4491611123085022, -0.37219366431236267, -0.29522621631622314, -0.218258798122406, -0.1412913203239441, -0.06432390213012695, 0.012643538415431976, 0.0896109789609909, 0.16657841205596924, 0.24354586005210876, 0.3205133080482483, 0.39748072624206543, 0.47444820404052734, 0.5514156222343445, 0.6283830404281616, 0.7053505182266235, 0.7823179364204407, 0.8592853546142578, 0.9362528324127197, 1.0132203102111816, 1.0901877880096436, 1.167155146598816, 1.2441226243972778, 1.3210899829864502, 1.398057460784912, 1.475024938583374, 1.551992416381836, 1.6289597749710083, 1.7059272527694702, 1.7828946113586426, 1.8598620891571045, 1.9368294477462769, 2.013796806335449, 2.090764284133911, 2.167731761932373, 2.244699239730835, 2.321666717529297, 2.398634195327759]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 6.0, 4.0, 6.0, 7.0, 7.0, 8.0, 13.0, 22.0, 24.0, 36.0, 50.0, 78.0, 90.0, 135.0, 215.0, 347.0, 586.0, 1099.0, 2250.0, 5237.0, 17048.0, 108258.0, 3815733.0, 207743.0, 23667.0, 6447.0, 2551.0, 1222.0, 598.0, 297.0, 174.0, 102.0, 75.0, 46.0, 32.0, 20.0, 14.0, 10.0, 7.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47802734375, -0.4642143249511719, -0.45040130615234375, -0.4365882873535156, -0.4227752685546875, -0.4089622497558594, -0.39514923095703125, -0.3813362121582031, -0.367523193359375, -0.3537101745605469, -0.33989715576171875, -0.3260841369628906, -0.3122711181640625, -0.2984580993652344, -0.28464508056640625, -0.2708320617675781, -0.25701904296875, -0.24320602416992188, -0.22939300537109375, -0.21557998657226562, -0.2017669677734375, -0.18795394897460938, -0.17414093017578125, -0.16032791137695312, -0.146514892578125, -0.13270187377929688, -0.11888885498046875, -0.10507583618164062, -0.0912628173828125, -0.07744979858398438, -0.06363677978515625, -0.049823760986328125, -0.0360107421875, -0.022197723388671875, -0.00838470458984375, 0.005428314208984375, 0.0192413330078125, 0.033054351806640625, 0.04686737060546875, 0.060680389404296875, 0.074493408203125, 0.08830642700195312, 0.10211944580078125, 0.11593246459960938, 0.1297454833984375, 0.14355850219726562, 0.15737152099609375, 0.17118453979492188, 0.18499755859375, 0.19881057739257812, 0.21262359619140625, 0.22643661499023438, 0.2402496337890625, 0.2540626525878906, 0.26787567138671875, 0.2816886901855469, 0.295501708984375, 0.3093147277832031, 0.32312774658203125, 0.3369407653808594, 0.3507537841796875, 0.3645668029785156, 0.37837982177734375, 0.3921928405761719, 0.406005859375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 6.0, 14.0, 14.0, 18.0, 26.0, 31.0, 62.0, 105.0, 99.0, 105.0, 116.0, 104.0, 67.0, 78.0, 52.0, 29.0, 28.0, 24.0, 6.0, 3.0, 7.0, 0.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.199462890625, -0.19361114501953125, -0.1877593994140625, -0.18190765380859375, -0.176055908203125, -0.17020416259765625, -0.1643524169921875, -0.15850067138671875, -0.15264892578125, -0.14679718017578125, -0.1409454345703125, -0.13509368896484375, -0.129241943359375, -0.12339019775390625, -0.1175384521484375, -0.11168670654296875, -0.1058349609375, -0.09998321533203125, -0.0941314697265625, -0.08827972412109375, -0.082427978515625, -0.07657623291015625, -0.0707244873046875, -0.06487274169921875, -0.05902099609375, -0.05316925048828125, -0.0473175048828125, -0.04146575927734375, -0.035614013671875, -0.02976226806640625, -0.0239105224609375, -0.01805877685546875, -0.01220703125, -0.00635528564453125, -0.0005035400390625, 0.00534820556640625, 0.011199951171875, 0.01705169677734375, 0.0229034423828125, 0.02875518798828125, 0.03460693359375, 0.04045867919921875, 0.0463104248046875, 0.05216217041015625, 0.058013916015625, 0.06386566162109375, 0.0697174072265625, 0.07556915283203125, 0.0814208984375, 0.08727264404296875, 0.0931243896484375, 0.09897613525390625, 0.104827880859375, 0.11067962646484375, 0.1165313720703125, 0.12238311767578125, 0.12823486328125, 0.13408660888671875, 0.1399383544921875, 0.14579010009765625, 0.151641845703125, 0.15749359130859375, 0.1633453369140625, 0.16919708251953125, 0.175048828125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 13.0, 18.0, 44.0, 76.0, 142.0, 287.0, 607.0, 1702.0, 5340.0, 23075.0, 258867.0, 3787604.0, 96602.0, 13999.0, 3648.0, 1289.0, 524.0, 218.0, 103.0, 55.0, 31.0, 16.0, 13.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57080078125, -0.5541801452636719, -0.5375595092773438, -0.5209388732910156, -0.5043182373046875, -0.4876976013183594, -0.47107696533203125, -0.4544563293457031, -0.437835693359375, -0.4212150573730469, -0.40459442138671875, -0.3879737854003906, -0.3713531494140625, -0.3547325134277344, -0.33811187744140625, -0.3214912414550781, -0.30487060546875, -0.2882499694824219, -0.27162933349609375, -0.2550086975097656, -0.2383880615234375, -0.22176742553710938, -0.20514678955078125, -0.18852615356445312, -0.171905517578125, -0.15528488159179688, -0.13866424560546875, -0.12204360961914062, -0.1054229736328125, -0.08880233764648438, -0.07218170166015625, -0.055561065673828125, -0.0389404296875, -0.022319793701171875, -0.00569915771484375, 0.010921478271484375, 0.0275421142578125, 0.044162750244140625, 0.06078338623046875, 0.07740402221679688, 0.094024658203125, 0.11064529418945312, 0.12726593017578125, 0.14388656616210938, 0.1605072021484375, 0.17712783813476562, 0.19374847412109375, 0.21036911010742188, 0.22698974609375, 0.24361038208007812, 0.26023101806640625, 0.2768516540527344, 0.2934722900390625, 0.3100929260253906, 0.32671356201171875, 0.3433341979980469, 0.359954833984375, 0.3765754699707031, 0.39319610595703125, 0.4098167419433594, 0.4264373779296875, 0.4430580139160156, 0.45967864990234375, 0.4762992858886719, 0.492919921875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 10.0, 21.0, 23.0, 30.0, 54.0, 99.0, 235.0, 919.0, 1868.0, 461.0, 145.0, 72.0, 40.0, 24.0, 14.0, 17.0, 11.0, 8.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.253173828125, -0.24578475952148438, -0.23839569091796875, -0.23100662231445312, -0.2236175537109375, -0.21622848510742188, -0.20883941650390625, -0.20145034790039062, -0.194061279296875, -0.18667221069335938, -0.17928314208984375, -0.17189407348632812, -0.1645050048828125, -0.15711593627929688, -0.14972686767578125, -0.14233779907226562, -0.13494873046875, -0.12755966186523438, -0.12017059326171875, -0.11278152465820312, -0.1053924560546875, -0.09800338745117188, -0.09061431884765625, -0.08322525024414062, -0.075836181640625, -0.06844711303710938, -0.06105804443359375, -0.053668975830078125, -0.0462799072265625, -0.038890838623046875, -0.03150177001953125, -0.024112701416015625, -0.0167236328125, -0.009334564208984375, -0.00194549560546875, 0.005443572998046875, 0.0128326416015625, 0.020221710205078125, 0.02761077880859375, 0.034999847412109375, 0.042388916015625, 0.049777984619140625, 0.05716705322265625, 0.06455612182617188, 0.0719451904296875, 0.07933425903320312, 0.08672332763671875, 0.09411239624023438, 0.10150146484375, 0.10889053344726562, 0.11627960205078125, 0.12366867065429688, 0.1310577392578125, 0.13844680786132812, 0.14583587646484375, 0.15322494506835938, 0.160614013671875, 0.16800308227539062, 0.17539215087890625, 0.18278121948242188, 0.1901702880859375, 0.19755935668945312, 0.20494842529296875, 0.21233749389648438, 0.2197265625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 2.0, 5.0, 14.0, 46.0, 100.0, 169.0, 213.0, 208.0, 132.0, 67.0, 27.0, 7.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8922836780548096, -0.8475372195243835, -0.8027907013893127, -0.7580442428588867, -0.7132977247238159, -0.6685512661933899, -0.6238048076629639, -0.5790582895278931, -0.534311830997467, -0.48956534266471863, -0.4448188543319702, -0.4000723958015442, -0.3553259074687958, -0.31057941913604736, -0.26583296060562134, -0.22108647227287292, -0.1763399839401245, -0.1315934956073761, -0.08684702217578888, -0.04210054874420166, 0.002645939588546753, 0.047392427921295166, 0.09213888645172119, 0.1368853747844696, 0.18163186311721802, 0.22637835144996643, 0.27112483978271484, 0.31587129831314087, 0.3606177866458893, 0.4053642749786377, 0.4501107335090637, 0.49485722184181213, 0.5396037101745605, 0.5843501687049866, 0.6290966868400574, 0.6738431453704834, 0.7185896635055542, 0.7633361220359802, 0.8080825805664062, 0.852829098701477, 0.8975755572319031, 0.9423220157623291, 0.9870685338973999, 1.0318150520324707, 1.076561450958252, 1.1213079690933228, 1.1660544872283936, 1.2108008861541748, 1.2555474042892456, 1.3002939224243164, 1.3450403213500977, 1.3897868394851685, 1.4345333576202393, 1.4792797565460205, 1.5240262746810913, 1.568772792816162, 1.6135191917419434, 1.6582657098770142, 1.7030121088027954, 1.7477586269378662, 1.792505145072937, 1.8372516632080078, 1.881998062133789, 1.9267445802688599, 1.9714910984039307]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 9.0, 14.0, 14.0, 10.0, 26.0, 17.0, 29.0, 35.0, 31.0, 39.0, 36.0, 33.0, 42.0, 52.0, 43.0, 43.0, 49.0, 50.0, 48.0, 50.0, 57.0, 49.0, 37.0, 33.0, 15.0, 19.0, 28.0, 20.0, 11.0, 10.0, 10.0, 5.0, 11.0, 3.0, 9.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5624531507492065, -0.5436984896659851, -0.5249438285827637, -0.5061891674995422, -0.4874345064163208, -0.46867984533309937, -0.44992515444755554, -0.4311704933643341, -0.41241583228111267, -0.39366117119789124, -0.3749065101146698, -0.35615184903144836, -0.33739715814590454, -0.3186424970626831, -0.29988783597946167, -0.28113317489624023, -0.2623785138130188, -0.24362385272979736, -0.22486919164657593, -0.2061145156621933, -0.18735985457897186, -0.16860519349575043, -0.1498505175113678, -0.13109585642814636, -0.11234119534492493, -0.09358653426170349, -0.07483186572790146, -0.056077200919389725, -0.03732253611087799, -0.018567875027656555, 0.0001867935061454773, 0.01894146203994751, 0.037696123123168945, 0.05645078793168068, 0.07520545274019241, 0.09396012127399445, 0.11271478235721588, 0.13146944344043732, 0.15022411942481995, 0.16897878050804138, 0.18773344159126282, 0.20648810267448425, 0.2252427637577057, 0.24399743974208832, 0.26275211572647095, 0.2815067768096924, 0.3002614378929138, 0.31901609897613525, 0.3377707600593567, 0.3565254211425781, 0.37528008222579956, 0.394034743309021, 0.41278940439224243, 0.43154406547546387, 0.4502987563610077, 0.4690534174442291, 0.48780807852745056, 0.5065627694129944, 0.5253174304962158, 0.5440720915794373, 0.5628267526626587, 0.5815814137458801, 0.6003360748291016, 0.619090735912323, 0.6378453969955444]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 14.0, 7.0, 16.0, 15.0, 21.0, 39.0, 35.0, 46.0, 71.0, 94.0, 155.0, 230.0, 390.0, 762.0, 1566.0, 3695.0, 13368.0, 75603.0, 748983.0, 170434.0, 22911.0, 5631.0, 2165.0, 960.0, 491.0, 276.0, 185.0, 125.0, 83.0, 59.0, 38.0, 20.0, 21.0, 12.0, 11.0, 0.0, 1.0, 9.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.537109375, -0.5161895751953125, -0.495269775390625, -0.4743499755859375, -0.45343017578125, -0.4325103759765625, -0.411590576171875, -0.3906707763671875, -0.3697509765625, -0.3488311767578125, -0.327911376953125, -0.3069915771484375, -0.28607177734375, -0.2651519775390625, -0.244232177734375, -0.2233123779296875, -0.202392578125, -0.1814727783203125, -0.160552978515625, -0.1396331787109375, -0.11871337890625, -0.0977935791015625, -0.076873779296875, -0.0559539794921875, -0.0350341796875, -0.0141143798828125, 0.006805419921875, 0.0277252197265625, 0.04864501953125, 0.0695648193359375, 0.090484619140625, 0.1114044189453125, 0.13232421875, 0.1532440185546875, 0.174163818359375, 0.1950836181640625, 0.21600341796875, 0.2369232177734375, 0.257843017578125, 0.2787628173828125, 0.2996826171875, 0.3206024169921875, 0.341522216796875, 0.3624420166015625, 0.38336181640625, 0.4042816162109375, 0.425201416015625, 0.4461212158203125, 0.467041015625, 0.4879608154296875, 0.508880615234375, 0.5298004150390625, 0.55072021484375, 0.5716400146484375, 0.592559814453125, 0.6134796142578125, 0.6343994140625, 0.6553192138671875, 0.676239013671875, 0.6971588134765625, 0.71807861328125, 0.7389984130859375, 0.759918212890625, 0.7808380126953125, 0.8017578125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 9.0, 11.0, 18.0, 14.0, 34.0, 39.0, 75.0, 97.0, 111.0, 97.0, 120.0, 95.0, 76.0, 68.0, 42.0, 30.0, 22.0, 18.0, 9.0, 2.0, 6.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1949462890625, -0.189178466796875, -0.18341064453125, -0.177642822265625, -0.171875, -0.166107177734375, -0.16033935546875, -0.154571533203125, -0.1488037109375, -0.143035888671875, -0.13726806640625, -0.131500244140625, -0.125732421875, -0.119964599609375, -0.11419677734375, -0.108428955078125, -0.1026611328125, -0.096893310546875, -0.09112548828125, -0.085357666015625, -0.07958984375, -0.073822021484375, -0.06805419921875, -0.062286376953125, -0.0565185546875, -0.050750732421875, -0.04498291015625, -0.039215087890625, -0.033447265625, -0.027679443359375, -0.02191162109375, -0.016143798828125, -0.0103759765625, -0.004608154296875, 0.00115966796875, 0.006927490234375, 0.0126953125, 0.018463134765625, 0.02423095703125, 0.029998779296875, 0.0357666015625, 0.041534423828125, 0.04730224609375, 0.053070068359375, 0.058837890625, 0.064605712890625, 0.07037353515625, 0.076141357421875, 0.0819091796875, 0.087677001953125, 0.09344482421875, 0.099212646484375, 0.10498046875, 0.110748291015625, 0.11651611328125, 0.122283935546875, 0.1280517578125, 0.133819580078125, 0.13958740234375, 0.145355224609375, 0.151123046875, 0.156890869140625, 0.16265869140625, 0.168426513671875, 0.1741943359375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 2.0, 9.0, 14.0, 5.0, 14.0, 16.0, 29.0, 37.0, 62.0, 107.0, 183.0, 330.0, 682.0, 1718.0, 4863.0, 16035.0, 73973.0, 676244.0, 227313.0, 33204.0, 8682.0, 2823.0, 1130.0, 461.0, 225.0, 132.0, 88.0, 52.0, 37.0, 27.0, 15.0, 13.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56982421875, -0.5506744384765625, -0.531524658203125, -0.5123748779296875, -0.49322509765625, -0.4740753173828125, -0.454925537109375, -0.4357757568359375, -0.4166259765625, -0.3974761962890625, -0.378326416015625, -0.3591766357421875, -0.34002685546875, -0.3208770751953125, -0.301727294921875, -0.2825775146484375, -0.263427734375, -0.2442779541015625, -0.225128173828125, -0.2059783935546875, -0.18682861328125, -0.1676788330078125, -0.148529052734375, -0.1293792724609375, -0.1102294921875, -0.0910797119140625, -0.071929931640625, -0.0527801513671875, -0.03363037109375, -0.0144805908203125, 0.004669189453125, 0.0238189697265625, 0.04296875, 0.0621185302734375, 0.081268310546875, 0.1004180908203125, 0.11956787109375, 0.1387176513671875, 0.157867431640625, 0.1770172119140625, 0.1961669921875, 0.2153167724609375, 0.234466552734375, 0.2536163330078125, 0.27276611328125, 0.2919158935546875, 0.311065673828125, 0.3302154541015625, 0.349365234375, 0.3685150146484375, 0.387664794921875, 0.4068145751953125, 0.42596435546875, 0.4451141357421875, 0.464263916015625, 0.4834136962890625, 0.5025634765625, 0.5217132568359375, 0.540863037109375, 0.5600128173828125, 0.57916259765625, 0.5983123779296875, 0.617462158203125, 0.6366119384765625, 0.65576171875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 4.0, 4.0, 0.0, 7.0, 9.0, 8.0, 11.0, 13.0, 12.0, 8.0, 21.0, 19.0, 20.0, 33.0, 18.0, 27.0, 27.0, 33.0, 33.0, 45.0, 44.0, 46.0, 44.0, 46.0, 42.0, 39.0, 41.0, 46.0, 30.0, 30.0, 38.0, 22.0, 26.0, 31.0, 23.0, 13.0, 23.0, 10.0, 10.0, 11.0, 9.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.362060546875, -0.34989166259765625, -0.3377227783203125, -0.32555389404296875, -0.313385009765625, -0.30121612548828125, -0.2890472412109375, -0.27687835693359375, -0.26470947265625, -0.25254058837890625, -0.2403717041015625, -0.22820281982421875, -0.216033935546875, -0.20386505126953125, -0.1916961669921875, -0.17952728271484375, -0.1673583984375, -0.15518951416015625, -0.1430206298828125, -0.13085174560546875, -0.118682861328125, -0.10651397705078125, -0.0943450927734375, -0.08217620849609375, -0.07000732421875, -0.05783843994140625, -0.0456695556640625, -0.03350067138671875, -0.021331787109375, -0.00916290283203125, 0.0030059814453125, 0.01517486572265625, 0.02734375, 0.03951263427734375, 0.0516815185546875, 0.06385040283203125, 0.076019287109375, 0.08818817138671875, 0.1003570556640625, 0.11252593994140625, 0.12469482421875, 0.13686370849609375, 0.1490325927734375, 0.16120147705078125, 0.173370361328125, 0.18553924560546875, 0.1977081298828125, 0.20987701416015625, 0.2220458984375, 0.23421478271484375, 0.2463836669921875, 0.25855255126953125, 0.270721435546875, 0.28289031982421875, 0.2950592041015625, 0.30722808837890625, 0.31939697265625, 0.33156585693359375, 0.3437347412109375, 0.35590362548828125, 0.368072509765625, 0.38024139404296875, 0.3924102783203125, 0.40457916259765625, 0.416748046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 3.0, 8.0, 11.0, 8.0, 21.0, 24.0, 54.0, 56.0, 120.0, 250.0, 601.0, 2414.0, 17587.0, 527373.0, 479672.0, 16921.0, 2300.0, 564.0, 276.0, 105.0, 75.0, 39.0, 25.0, 12.0, 9.0, 7.0, 8.0, 3.0, 2.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34619140625, -0.33464813232421875, -0.3231048583984375, -0.31156158447265625, -0.300018310546875, -0.28847503662109375, -0.2769317626953125, -0.26538848876953125, -0.25384521484375, -0.24230194091796875, -0.2307586669921875, -0.21921539306640625, -0.207672119140625, -0.19612884521484375, -0.1845855712890625, -0.17304229736328125, -0.1614990234375, -0.14995574951171875, -0.1384124755859375, -0.12686920166015625, -0.115325927734375, -0.10378265380859375, -0.0922393798828125, -0.08069610595703125, -0.06915283203125, -0.05760955810546875, -0.0460662841796875, -0.03452301025390625, -0.022979736328125, -0.01143646240234375, 0.0001068115234375, 0.01165008544921875, 0.023193359375, 0.03473663330078125, 0.0462799072265625, 0.05782318115234375, 0.069366455078125, 0.08090972900390625, 0.0924530029296875, 0.10399627685546875, 0.11553955078125, 0.12708282470703125, 0.1386260986328125, 0.15016937255859375, 0.161712646484375, 0.17325592041015625, 0.1847991943359375, 0.19634246826171875, 0.2078857421875, 0.21942901611328125, 0.2309722900390625, 0.24251556396484375, 0.254058837890625, 0.26560211181640625, 0.2771453857421875, 0.28868865966796875, 0.30023193359375, 0.31177520751953125, 0.3233184814453125, 0.33486175537109375, 0.346405029296875, 0.35794830322265625, 0.3694915771484375, 0.38103485107421875, 0.392578125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 14.0, 35.0, 76.0, 156.0, 296.0, 207.0, 90.0, 52.0, 33.0, 10.0, 9.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00030112266540527344, -0.0002894066274166107, -0.000277690589427948, -0.0002659745514392853, -0.00025425851345062256, -0.00024254247546195984, -0.00023082643747329712, -0.0002191103994846344, -0.00020739436149597168, -0.00019567832350730896, -0.00018396228551864624, -0.00017224624752998352, -0.0001605302095413208, -0.00014881417155265808, -0.00013709813356399536, -0.00012538209557533264, -0.00011366605758666992, -0.0001019500195980072, -9.023398160934448e-05, -7.851794362068176e-05, -6.680190563201904e-05, -5.508586764335632e-05, -4.3369829654693604e-05, -3.1653791666030884e-05, -1.9937753677368164e-05, -8.221715688705444e-06, 3.4943222999572754e-06, 1.5210360288619995e-05, 2.6926398277282715e-05, 3.8642436265945435e-05, 5.0358474254608154e-05, 6.207451224327087e-05, 7.37905502319336e-05, 8.550658822059631e-05, 9.722262620925903e-05, 0.00010893866419792175, 0.00012065470218658447, 0.0001323707401752472, 0.0001440867781639099, 0.00015580281615257263, 0.00016751885414123535, 0.00017923489212989807, 0.0001909509301185608, 0.0002026669681072235, 0.00021438300609588623, 0.00022609904408454895, 0.00023781508207321167, 0.0002495311200618744, 0.0002612471580505371, 0.00027296319603919983, 0.00028467923402786255, 0.00029639527201652527, 0.000308111310005188, 0.0003198273479938507, 0.00033154338598251343, 0.00034325942397117615, 0.00035497546195983887, 0.0003666914999485016, 0.0003784075379371643, 0.000390123575925827, 0.00040183961391448975, 0.00041355565190315247, 0.0004252716898918152, 0.0004369877278804779, 0.0004487037658691406]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 4.0, 5.0, 15.0, 14.0, 13.0, 25.0, 41.0, 69.0, 106.0, 157.0, 329.0, 1005.0, 4916.0, 68406.0, 921447.0, 46524.0, 3839.0, 871.0, 334.0, 149.0, 99.0, 57.0, 48.0, 22.0, 20.0, 9.0, 9.0, 6.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.51318359375, -0.49828338623046875, -0.4833831787109375, -0.46848297119140625, -0.453582763671875, -0.43868255615234375, -0.4237823486328125, -0.40888214111328125, -0.39398193359375, -0.37908172607421875, -0.3641815185546875, -0.34928131103515625, -0.334381103515625, -0.31948089599609375, -0.3045806884765625, -0.28968048095703125, -0.2747802734375, -0.25988006591796875, -0.2449798583984375, -0.23007965087890625, -0.215179443359375, -0.20027923583984375, -0.1853790283203125, -0.17047882080078125, -0.15557861328125, -0.14067840576171875, -0.1257781982421875, -0.11087799072265625, -0.095977783203125, -0.08107757568359375, -0.0661773681640625, -0.05127716064453125, -0.036376953125, -0.02147674560546875, -0.0065765380859375, 0.00832366943359375, 0.023223876953125, 0.03812408447265625, 0.0530242919921875, 0.06792449951171875, 0.08282470703125, 0.09772491455078125, 0.1126251220703125, 0.12752532958984375, 0.142425537109375, 0.15732574462890625, 0.1722259521484375, 0.18712615966796875, 0.2020263671875, 0.21692657470703125, 0.2318267822265625, 0.24672698974609375, 0.261627197265625, 0.27652740478515625, 0.2914276123046875, 0.30632781982421875, 0.32122802734375, 0.33612823486328125, 0.3510284423828125, 0.36592864990234375, 0.380828857421875, 0.39572906494140625, 0.4106292724609375, 0.42552947998046875, 0.4404296875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 2.0, 4.0, 3.0, 13.0, 10.0, 16.0, 25.0, 36.0, 43.0, 54.0, 57.0, 120.0, 118.0, 122.0, 99.0, 66.0, 43.0, 32.0, 22.0, 15.0, 19.0, 13.0, 13.0, 8.0, 6.0, 4.0, 4.0, 5.0, 5.0, 3.0, 0.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.185546875, -0.17972183227539062, -0.17389678955078125, -0.16807174682617188, -0.1622467041015625, -0.15642166137695312, -0.15059661865234375, -0.14477157592773438, -0.138946533203125, -0.13312149047851562, -0.12729644775390625, -0.12147140502929688, -0.1156463623046875, -0.10982131958007812, -0.10399627685546875, -0.09817123413085938, -0.09234619140625, -0.08652114868164062, -0.08069610595703125, -0.07487106323242188, -0.0690460205078125, -0.06322097778320312, -0.05739593505859375, -0.051570892333984375, -0.045745849609375, -0.039920806884765625, -0.03409576416015625, -0.028270721435546875, -0.0224456787109375, -0.016620635986328125, -0.01079559326171875, -0.004970550537109375, 0.0008544921875, 0.006679534912109375, 0.01250457763671875, 0.018329620361328125, 0.0241546630859375, 0.029979705810546875, 0.03580474853515625, 0.041629791259765625, 0.047454833984375, 0.053279876708984375, 0.05910491943359375, 0.06492996215820312, 0.0707550048828125, 0.07658004760742188, 0.08240509033203125, 0.08823013305664062, 0.09405517578125, 0.09988021850585938, 0.10570526123046875, 0.11153030395507812, 0.1173553466796875, 0.12318038940429688, 0.12900543212890625, 0.13483047485351562, 0.140655517578125, 0.14648056030273438, 0.15230560302734375, 0.15813064575195312, 0.1639556884765625, 0.16978073120117188, 0.17560577392578125, 0.18143081665039062, 0.187255859375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 9.0, 15.0, 39.0, 75.0, 172.0, 232.0, 211.0, 102.0, 78.0, 30.0, 20.0, 8.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16450572013855, -2.0163140296936035, -1.8681225776672363, -1.71993088722229, -1.5717393159866333, -1.4235477447509766, -1.2753560543060303, -1.1271644830703735, -0.9789729118347168, -0.8307813405990601, -0.6825897097587585, -0.534398078918457, -0.3862065076828003, -0.23801493644714355, -0.08982330560684204, 0.05836832523345947, 0.2065598964691162, 0.35475149750709534, 0.5029430985450745, 0.651134729385376, 0.7993263006210327, 0.9475178718566895, 1.0957095623016357, 1.2439011335372925, 1.3920927047729492, 1.540284276008606, 1.6884758472442627, 1.836667537689209, 1.9848591089248657, 2.1330506801605225, 2.2812423706054688, 2.429433822631836, 2.5776257514953613, 2.7258174419403076, 2.874008893966675, 3.022200584411621, 3.1703920364379883, 3.3185837268829346, 3.466775417327881, 3.614966869354248, 3.7631585597991943, 3.9113502502441406, 4.059541702270508, 4.207733154296875, 4.3559250831604, 4.504116535186768, 4.652307987213135, 4.80049991607666, 4.948691368103027, 5.0968828201293945, 5.24507474899292, 5.393266201019287, 5.541457653045654, 5.68964958190918, 5.837841033935547, 5.986032485961914, 6.134223937988281, 6.282415390014648, 6.430607318878174, 6.578798770904541, 6.726990222930908, 6.875182151794434, 7.023373603820801, 7.171565055847168, 7.319756984710693]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 11.0, 8.0, 7.0, 18.0, 13.0, 16.0, 26.0, 24.0, 21.0, 32.0, 29.0, 28.0, 37.0, 39.0, 43.0, 46.0, 58.0, 53.0, 37.0, 51.0, 33.0, 55.0, 37.0, 36.0, 40.0, 40.0, 33.0, 17.0, 22.0, 23.0, 13.0, 14.0, 11.0, 6.0, 6.0, 8.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4904160499572754, -2.4153387546539307, -2.340261459350586, -2.2651844024658203, -2.1901071071624756, -2.115029811859131, -2.0399527549743652, -1.9648754596710205, -1.8897981643676758, -1.814720869064331, -1.7396436929702759, -1.6645665168762207, -1.589489221572876, -1.5144119262695312, -1.439334750175476, -1.364257574081421, -1.2891802787780762, -1.2141029834747314, -1.1390258073806763, -1.063948631286621, -0.9888713359832764, -0.9137941002845764, -0.8387168645858765, -0.7636396288871765, -0.6885623931884766, -0.6134851574897766, -0.5384079217910767, -0.4633306860923767, -0.38825345039367676, -0.3131762146949768, -0.23809897899627686, -0.1630217432975769, -0.08794450759887695, -0.012867271900177002, 0.06220996379852295, 0.1372871994972229, 0.21236443519592285, 0.2874416708946228, 0.36251890659332275, 0.4375961422920227, 0.5126733779907227, 0.5877506136894226, 0.6628278493881226, 0.7379050850868225, 0.8129823207855225, 0.8880595564842224, 0.9631367921829224, 1.0382139682769775, 1.1132912635803223, 1.188368558883667, 1.2634457349777222, 1.3385229110717773, 1.413600206375122, 1.4886775016784668, 1.563754677772522, 1.6388318538665771, 1.7139091491699219, 1.7889864444732666, 1.8640636205673218, 1.939140796661377, 2.0142180919647217, 2.0892953872680664, 2.164372444152832, 2.2394497394561768, 2.3145270347595215]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 1.0, 8.0, 6.0, 10.0, 8.0, 17.0, 18.0, 31.0, 49.0, 66.0, 108.0, 178.0, 404.0, 973.0, 2672.0, 11006.0, 145461.0, 3989187.0, 35628.0, 5721.0, 1621.0, 573.0, 215.0, 139.0, 76.0, 31.0, 30.0, 20.0, 13.0, 3.0, 7.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8212890625, -0.7966156005859375, -0.771942138671875, -0.7472686767578125, -0.72259521484375, -0.6979217529296875, -0.673248291015625, -0.6485748291015625, -0.6239013671875, -0.5992279052734375, -0.574554443359375, -0.5498809814453125, -0.52520751953125, -0.5005340576171875, -0.475860595703125, -0.4511871337890625, -0.426513671875, -0.4018402099609375, -0.377166748046875, -0.3524932861328125, -0.32781982421875, -0.3031463623046875, -0.278472900390625, -0.2537994384765625, -0.2291259765625, -0.2044525146484375, -0.179779052734375, -0.1551055908203125, -0.13043212890625, -0.1057586669921875, -0.081085205078125, -0.0564117431640625, -0.03173828125, -0.0070648193359375, 0.017608642578125, 0.0422821044921875, 0.06695556640625, 0.0916290283203125, 0.116302490234375, 0.1409759521484375, 0.1656494140625, 0.1903228759765625, 0.214996337890625, 0.2396697998046875, 0.26434326171875, 0.2890167236328125, 0.313690185546875, 0.3383636474609375, 0.363037109375, 0.3877105712890625, 0.412384033203125, 0.4370574951171875, 0.46173095703125, 0.4864044189453125, 0.511077880859375, 0.5357513427734375, 0.5604248046875, 0.5850982666015625, 0.609771728515625, 0.6344451904296875, 0.65911865234375, 0.6837921142578125, 0.708465576171875, 0.7331390380859375, 0.7578125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 10.0, 12.0, 13.0, 23.0, 24.0, 38.0, 61.0, 74.0, 113.0, 114.0, 118.0, 93.0, 77.0, 64.0, 52.0, 33.0, 28.0, 21.0, 16.0, 4.0, 4.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2017822265625, -0.19587135314941406, -0.18996047973632812, -0.1840496063232422, -0.17813873291015625, -0.1722278594970703, -0.16631698608398438, -0.16040611267089844, -0.1544952392578125, -0.14858436584472656, -0.14267349243164062, -0.1367626190185547, -0.13085174560546875, -0.12494087219238281, -0.11902999877929688, -0.11311912536621094, -0.107208251953125, -0.10129737854003906, -0.09538650512695312, -0.08947563171386719, -0.08356475830078125, -0.07765388488769531, -0.07174301147460938, -0.06583213806152344, -0.0599212646484375, -0.05401039123535156, -0.048099517822265625, -0.04218864440917969, -0.03627777099609375, -0.030366897583007812, -0.024456024169921875, -0.018545150756835938, -0.01263427734375, -0.0067234039306640625, -0.000812530517578125, 0.0050983428955078125, 0.01100921630859375, 0.016920089721679688, 0.022830963134765625, 0.028741836547851562, 0.0346527099609375, 0.04056358337402344, 0.046474456787109375, 0.05238533020019531, 0.05829620361328125, 0.06420707702636719, 0.07011795043945312, 0.07602882385253906, 0.081939697265625, 0.08785057067871094, 0.09376144409179688, 0.09967231750488281, 0.10558319091796875, 0.11149406433105469, 0.11740493774414062, 0.12331581115722656, 0.1292266845703125, 0.13513755798339844, 0.14104843139648438, 0.1469593048095703, 0.15287017822265625, 0.1587810516357422, 0.16469192504882812, 0.17060279846191406, 0.176513671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 9.0, 14.0, 17.0, 42.0, 68.0, 129.0, 290.0, 688.0, 1921.0, 7144.0, 40909.0, 3666554.0, 447909.0, 21551.0, 4660.0, 1422.0, 512.0, 227.0, 89.0, 57.0, 27.0, 17.0, 14.0, 7.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84375, -0.8220291137695312, -0.8003082275390625, -0.7785873413085938, -0.756866455078125, -0.7351455688476562, -0.7134246826171875, -0.6917037963867188, -0.66998291015625, -0.6482620239257812, -0.6265411376953125, -0.6048202514648438, -0.583099365234375, -0.5613784790039062, -0.5396575927734375, -0.5179367065429688, -0.4962158203125, -0.47449493408203125, -0.4527740478515625, -0.43105316162109375, -0.409332275390625, -0.38761138916015625, -0.3658905029296875, -0.34416961669921875, -0.32244873046875, -0.30072784423828125, -0.2790069580078125, -0.25728607177734375, -0.235565185546875, -0.21384429931640625, -0.1921234130859375, -0.17040252685546875, -0.148681640625, -0.12696075439453125, -0.1052398681640625, -0.08351898193359375, -0.061798095703125, -0.04007720947265625, -0.0183563232421875, 0.00336456298828125, 0.02508544921875, 0.04680633544921875, 0.0685272216796875, 0.09024810791015625, 0.111968994140625, 0.13368988037109375, 0.1554107666015625, 0.17713165283203125, 0.1988525390625, 0.22057342529296875, 0.2422943115234375, 0.26401519775390625, 0.285736083984375, 0.30745697021484375, 0.3291778564453125, 0.35089874267578125, 0.37261962890625, 0.39434051513671875, 0.4160614013671875, 0.43778228759765625, 0.459503173828125, 0.48122406005859375, 0.5029449462890625, 0.5246658325195312, 0.54638671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 10.0, 10.0, 19.0, 26.0, 54.0, 108.0, 338.0, 2523.0, 687.0, 147.0, 63.0, 35.0, 18.0, 10.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.4140625, -0.40499305725097656, -0.3959236145019531, -0.3868541717529297, -0.37778472900390625, -0.3687152862548828, -0.3596458435058594, -0.35057640075683594, -0.3415069580078125, -0.33243751525878906, -0.3233680725097656, -0.3142986297607422, -0.30522918701171875, -0.2961597442626953, -0.2870903015136719, -0.27802085876464844, -0.268951416015625, -0.25988197326660156, -0.2508125305175781, -0.2417430877685547, -0.23267364501953125, -0.2236042022705078, -0.21453475952148438, -0.20546531677246094, -0.1963958740234375, -0.18732643127441406, -0.17825698852539062, -0.1691875457763672, -0.16011810302734375, -0.1510486602783203, -0.14197921752929688, -0.13290977478027344, -0.12384033203125, -0.11477088928222656, -0.10570144653320312, -0.09663200378417969, -0.08756256103515625, -0.07849311828613281, -0.06942367553710938, -0.06035423278808594, -0.0512847900390625, -0.04221534729003906, -0.033145904541015625, -0.024076461791992188, -0.01500701904296875, -0.0059375762939453125, 0.003131866455078125, 0.012201309204101562, 0.021270751953125, 0.030340194702148438, 0.039409637451171875, 0.04847908020019531, 0.05754852294921875, 0.06661796569824219, 0.07568740844726562, 0.08475685119628906, 0.0938262939453125, 0.10289573669433594, 0.11196517944335938, 0.12103462219238281, 0.13010406494140625, 0.1391735076904297, 0.14824295043945312, 0.15731239318847656, 0.1663818359375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 4.0, 7.0, 9.0, 8.0, 20.0, 45.0, 69.0, 90.0, 100.0, 149.0, 137.0, 109.0, 107.0, 54.0, 30.0, 21.0, 13.0, 9.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6373927593231201, -0.6108295321464539, -0.5842663645744324, -0.5577031373977661, -0.5311399698257446, -0.5045767426490784, -0.4780135154724121, -0.45145031809806824, -0.42488712072372437, -0.3983239233493805, -0.3717607259750366, -0.34519749879837036, -0.3186343014240265, -0.2920711040496826, -0.26550787687301636, -0.23894467949867249, -0.2123814821243286, -0.18581828474998474, -0.15925507247447968, -0.1326918601989746, -0.10612866282463074, -0.07956546545028687, -0.0530022531747818, -0.026439040899276733, 0.00012415647506713867, 0.026687361299991608, 0.05325056612491608, 0.07981377094984055, 0.10637697577476501, 0.1329401731491089, 0.15950338542461395, 0.18606659770011902, 0.2126297950744629, 0.23919299244880676, 0.26575618982315063, 0.2923194169998169, 0.31888261437416077, 0.34544581174850464, 0.3720090389251709, 0.39857223629951477, 0.42513543367385864, 0.4516986310482025, 0.4782618284225464, 0.5048250555992126, 0.5313882827758789, 0.5579514503479004, 0.5845146775245667, 0.6110779047012329, 0.6376410722732544, 0.6642042994499207, 0.6907674670219421, 0.7173306941986084, 0.7438938617706299, 0.7704570889472961, 0.7970203161239624, 0.8235834836959839, 0.8501467108726501, 0.8767099380493164, 0.9032731056213379, 0.9298363327980042, 0.9563995599746704, 0.9829627275466919, 1.0095258951187134, 1.0360891819000244, 1.062652349472046]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 10.0, 6.0, 15.0, 25.0, 27.0, 42.0, 37.0, 61.0, 56.0, 63.0, 59.0, 65.0, 79.0, 72.0, 69.0, 66.0, 55.0, 47.0, 42.0, 33.0, 22.0, 22.0, 14.0, 12.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5507141351699829, -0.524960994720459, -0.49920785427093506, -0.4734547436237335, -0.4477016031742096, -0.42194846272468567, -0.39619535207748413, -0.3704422116279602, -0.3446890711784363, -0.31893593072891235, -0.2931827902793884, -0.2674296796321869, -0.24167653918266296, -0.21592339873313904, -0.1901702731847763, -0.16441714763641357, -0.13866400718688965, -0.11291087418794632, -0.08715774118900299, -0.06140460819005966, -0.03565147519111633, -0.009898334741592407, 0.015854790806770325, 0.04160791635513306, 0.06736105680465698, 0.09311418980360031, 0.11886732280254364, 0.14462044835090637, 0.1703735888004303, 0.19612672924995422, 0.22187985479831696, 0.2476329803466797, 0.2733861207962036, 0.29913926124572754, 0.32489240169525146, 0.350645512342453, 0.37639865279197693, 0.40215179324150085, 0.4279049038887024, 0.4536580443382263, 0.47941118478775024, 0.5051643252372742, 0.5309174656867981, 0.556670606136322, 0.5824236869812012, 0.6081768274307251, 0.633929967880249, 0.659683108329773, 0.6854362487792969, 0.7111893892288208, 0.7369425296783447, 0.7626956701278687, 0.7884488105773926, 0.8142019510269165, 0.8399550318717957, 0.8657081723213196, 0.8914613127708435, 0.9172144532203674, 0.9429675936698914, 0.9687207341194153, 0.9944738149642944, 1.0202269554138184, 1.0459800958633423, 1.0717332363128662, 1.0974863767623901]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 5.0, 6.0, 7.0, 11.0, 8.0, 9.0, 18.0, 24.0, 32.0, 37.0, 52.0, 80.0, 111.0, 198.0, 267.0, 463.0, 774.0, 1424.0, 2947.0, 7766.0, 27805.0, 137210.0, 642753.0, 176569.0, 33839.0, 8966.0, 3337.0, 1517.0, 821.0, 518.0, 302.0, 209.0, 143.0, 93.0, 64.0, 53.0, 24.0, 29.0, 26.0, 12.0, 4.0, 4.0, 4.0, 7.0, 4.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.464599609375, -0.4488868713378906, -0.43317413330078125, -0.4174613952636719, -0.4017486572265625, -0.3860359191894531, -0.37032318115234375, -0.3546104431152344, -0.338897705078125, -0.3231849670410156, -0.30747222900390625, -0.2917594909667969, -0.2760467529296875, -0.2603340148925781, -0.24462127685546875, -0.22890853881835938, -0.21319580078125, -0.19748306274414062, -0.18177032470703125, -0.16605758666992188, -0.1503448486328125, -0.13463211059570312, -0.11891937255859375, -0.10320663452148438, -0.087493896484375, -0.07178115844726562, -0.05606842041015625, -0.040355682373046875, -0.0246429443359375, -0.008930206298828125, 0.00678253173828125, 0.022495269775390625, 0.0382080078125, 0.053920745849609375, 0.06963348388671875, 0.08534622192382812, 0.1010589599609375, 0.11677169799804688, 0.13248443603515625, 0.14819717407226562, 0.163909912109375, 0.17962265014648438, 0.19533538818359375, 0.21104812622070312, 0.2267608642578125, 0.24247360229492188, 0.25818634033203125, 0.2738990783691406, 0.28961181640625, 0.3053245544433594, 0.32103729248046875, 0.3367500305175781, 0.3524627685546875, 0.3681755065917969, 0.38388824462890625, 0.3996009826660156, 0.415313720703125, 0.4310264587402344, 0.44673919677734375, 0.4624519348144531, 0.4781646728515625, 0.4938774108886719, 0.5095901489257812, 0.5253028869628906, 0.541015625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 11.0, 15.0, 18.0, 26.0, 29.0, 59.0, 71.0, 81.0, 117.0, 101.0, 112.0, 101.0, 67.0, 54.0, 33.0, 32.0, 25.0, 15.0, 8.0, 10.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19677734375, -0.19091224670410156, -0.18504714965820312, -0.1791820526123047, -0.17331695556640625, -0.1674518585205078, -0.16158676147460938, -0.15572166442871094, -0.1498565673828125, -0.14399147033691406, -0.13812637329101562, -0.1322612762451172, -0.12639617919921875, -0.12053108215332031, -0.11466598510742188, -0.10880088806152344, -0.102935791015625, -0.09707069396972656, -0.09120559692382812, -0.08534049987792969, -0.07947540283203125, -0.07361030578613281, -0.06774520874023438, -0.06188011169433594, -0.0560150146484375, -0.05014991760253906, -0.044284820556640625, -0.03841972351074219, -0.03255462646484375, -0.026689529418945312, -0.020824432373046875, -0.014959335327148438, -0.00909423828125, -0.0032291412353515625, 0.002635955810546875, 0.008501052856445312, 0.01436614990234375, 0.020231246948242188, 0.026096343994140625, 0.03196144104003906, 0.0378265380859375, 0.04369163513183594, 0.049556732177734375, 0.05542182922363281, 0.06128692626953125, 0.06715202331542969, 0.07301712036132812, 0.07888221740722656, 0.084747314453125, 0.09061241149902344, 0.09647750854492188, 0.10234260559082031, 0.10820770263671875, 0.11407279968261719, 0.11993789672851562, 0.12580299377441406, 0.1316680908203125, 0.13753318786621094, 0.14339828491210938, 0.1492633819580078, 0.15512847900390625, 0.1609935760498047, 0.16685867309570312, 0.17272377014160156, 0.1785888671875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 4.0, 8.0, 21.0, 21.0, 28.0, 41.0, 55.0, 103.0, 169.0, 298.0, 529.0, 1104.0, 2767.0, 7286.0, 23083.0, 92014.0, 554815.0, 288529.0, 53864.0, 14962.0, 5016.0, 1946.0, 832.0, 409.0, 221.0, 143.0, 99.0, 67.0, 36.0, 26.0, 21.0, 4.0, 9.0, 11.0, 6.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.470947265625, -0.456146240234375, -0.44134521484375, -0.426544189453125, -0.4117431640625, -0.396942138671875, -0.38214111328125, -0.367340087890625, -0.3525390625, -0.337738037109375, -0.32293701171875, -0.308135986328125, -0.2933349609375, -0.278533935546875, -0.26373291015625, -0.248931884765625, -0.234130859375, -0.219329833984375, -0.20452880859375, -0.189727783203125, -0.1749267578125, -0.160125732421875, -0.14532470703125, -0.130523681640625, -0.11572265625, -0.100921630859375, -0.08612060546875, -0.071319580078125, -0.0565185546875, -0.041717529296875, -0.02691650390625, -0.012115478515625, 0.002685546875, 0.017486572265625, 0.03228759765625, 0.047088623046875, 0.0618896484375, 0.076690673828125, 0.09149169921875, 0.106292724609375, 0.12109375, 0.135894775390625, 0.15069580078125, 0.165496826171875, 0.1802978515625, 0.195098876953125, 0.20989990234375, 0.224700927734375, 0.239501953125, 0.254302978515625, 0.26910400390625, 0.283905029296875, 0.2987060546875, 0.313507080078125, 0.32830810546875, 0.343109130859375, 0.35791015625, 0.372711181640625, 0.38751220703125, 0.402313232421875, 0.4171142578125, 0.431915283203125, 0.44671630859375, 0.461517333984375, 0.476318359375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 6.0, 7.0, 17.0, 9.0, 16.0, 20.0, 25.0, 30.0, 25.0, 34.0, 34.0, 35.0, 45.0, 47.0, 41.0, 43.0, 51.0, 36.0, 49.0, 48.0, 33.0, 45.0, 53.0, 36.0, 32.0, 32.0, 33.0, 17.0, 10.0, 18.0, 17.0, 10.0, 7.0, 3.0, 7.0, 5.0, 3.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.447998046875, -0.4348602294921875, -0.421722412109375, -0.4085845947265625, -0.39544677734375, -0.3823089599609375, -0.369171142578125, -0.3560333251953125, -0.3428955078125, -0.3297576904296875, -0.316619873046875, -0.3034820556640625, -0.29034423828125, -0.2772064208984375, -0.264068603515625, -0.2509307861328125, -0.23779296875, -0.2246551513671875, -0.211517333984375, -0.1983795166015625, -0.18524169921875, -0.1721038818359375, -0.158966064453125, -0.1458282470703125, -0.1326904296875, -0.1195526123046875, -0.106414794921875, -0.0932769775390625, -0.08013916015625, -0.0670013427734375, -0.053863525390625, -0.0407257080078125, -0.027587890625, -0.0144500732421875, -0.001312255859375, 0.0118255615234375, 0.02496337890625, 0.0381011962890625, 0.051239013671875, 0.0643768310546875, 0.0775146484375, 0.0906524658203125, 0.103790283203125, 0.1169281005859375, 0.13006591796875, 0.1432037353515625, 0.156341552734375, 0.1694793701171875, 0.1826171875, 0.1957550048828125, 0.208892822265625, 0.2220306396484375, 0.23516845703125, 0.2483062744140625, 0.261444091796875, 0.2745819091796875, 0.2877197265625, 0.3008575439453125, 0.313995361328125, 0.3271331787109375, 0.34027099609375, 0.3534088134765625, 0.366546630859375, 0.3796844482421875, 0.392822265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 9.0, 11.0, 31.0, 64.0, 133.0, 407.0, 1990.0, 53512.0, 968821.0, 21660.0, 1377.0, 354.0, 103.0, 45.0, 23.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.492919921875, -0.4772224426269531, -0.46152496337890625, -0.4458274841308594, -0.4301300048828125, -0.4144325256347656, -0.39873504638671875, -0.3830375671386719, -0.367340087890625, -0.3516426086425781, -0.33594512939453125, -0.3202476501464844, -0.3045501708984375, -0.2888526916503906, -0.27315521240234375, -0.2574577331542969, -0.24176025390625, -0.22606277465820312, -0.21036529541015625, -0.19466781616210938, -0.1789703369140625, -0.16327285766601562, -0.14757537841796875, -0.13187789916992188, -0.116180419921875, -0.10048294067382812, -0.08478546142578125, -0.06908798217773438, -0.0533905029296875, -0.037693023681640625, -0.02199554443359375, -0.006298065185546875, 0.0093994140625, 0.025096893310546875, 0.04079437255859375, 0.056491851806640625, 0.0721893310546875, 0.08788681030273438, 0.10358428955078125, 0.11928176879882812, 0.134979248046875, 0.15067672729492188, 0.16637420654296875, 0.18207168579101562, 0.1977691650390625, 0.21346664428710938, 0.22916412353515625, 0.24486160278320312, 0.26055908203125, 0.2762565612792969, 0.29195404052734375, 0.3076515197753906, 0.3233489990234375, 0.3390464782714844, 0.35474395751953125, 0.3704414367675781, 0.386138916015625, 0.4018363952636719, 0.41753387451171875, 0.4332313537597656, 0.4489288330078125, 0.4646263122558594, 0.48032379150390625, 0.4960212707519531, 0.51171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 7.0, 19.0, 26.0, 54.0, 68.0, 93.0, 179.0, 196.0, 148.0, 82.0, 54.0, 28.0, 19.0, 17.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003497600555419922, -0.0003398619592189789, -0.0003299638628959656, -0.00032006576657295227, -0.00031016767024993896, -0.00030026957392692566, -0.00029037147760391235, -0.00028047338128089905, -0.00027057528495788574, -0.00026067718863487244, -0.00025077909231185913, -0.00024088099598884583, -0.00023098289966583252, -0.00022108480334281921, -0.0002111867070198059, -0.0002012886106967926, -0.0001913905143737793, -0.000181492418050766, -0.00017159432172775269, -0.00016169622540473938, -0.00015179812908172607, -0.00014190003275871277, -0.00013200193643569946, -0.00012210384011268616, -0.00011220574378967285, -0.00010230764746665955, -9.240955114364624e-05, -8.251145482063293e-05, -7.261335849761963e-05, -6.271526217460632e-05, -5.281716585159302e-05, -4.291906952857971e-05, -3.3020973205566406e-05, -2.31228768825531e-05, -1.3224780559539795e-05, -3.3266842365264893e-06, 6.571412086486816e-06, 1.6469508409500122e-05, 2.6367604732513428e-05, 3.6265701055526733e-05, 4.616379737854004e-05, 5.6061893701553345e-05, 6.595999002456665e-05, 7.585808634757996e-05, 8.575618267059326e-05, 9.565427899360657e-05, 0.00010555237531661987, 0.00011545047163963318, 0.00012534856796264648, 0.0001352466642856598, 0.0001451447606086731, 0.0001550428569316864, 0.0001649409532546997, 0.000174839049577713, 0.00018473714590072632, 0.00019463524222373962, 0.00020453333854675293, 0.00021443143486976624, 0.00022432953119277954, 0.00023422762751579285, 0.00024412572383880615, 0.00025402382016181946, 0.00026392191648483276, 0.00027382001280784607, 0.0002837181091308594]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 4.0, 8.0, 5.0, 14.0, 31.0, 53.0, 95.0, 175.0, 393.0, 1259.0, 4324.0, 33017.0, 738515.0, 251076.0, 15433.0, 2665.0, 821.0, 338.0, 142.0, 88.0, 48.0, 20.0, 13.0, 11.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.279541015625, -0.270172119140625, -0.26080322265625, -0.251434326171875, -0.2420654296875, -0.232696533203125, -0.22332763671875, -0.213958740234375, -0.20458984375, -0.195220947265625, -0.18585205078125, -0.176483154296875, -0.1671142578125, -0.157745361328125, -0.14837646484375, -0.139007568359375, -0.129638671875, -0.120269775390625, -0.11090087890625, -0.101531982421875, -0.0921630859375, -0.082794189453125, -0.07342529296875, -0.064056396484375, -0.0546875, -0.045318603515625, -0.03594970703125, -0.026580810546875, -0.0172119140625, -0.007843017578125, 0.00152587890625, 0.010894775390625, 0.020263671875, 0.029632568359375, 0.03900146484375, 0.048370361328125, 0.0577392578125, 0.067108154296875, 0.07647705078125, 0.085845947265625, 0.09521484375, 0.104583740234375, 0.11395263671875, 0.123321533203125, 0.1326904296875, 0.142059326171875, 0.15142822265625, 0.160797119140625, 0.170166015625, 0.179534912109375, 0.18890380859375, 0.198272705078125, 0.2076416015625, 0.217010498046875, 0.22637939453125, 0.235748291015625, 0.2451171875, 0.254486083984375, 0.26385498046875, 0.273223876953125, 0.2825927734375, 0.291961669921875, 0.30133056640625, 0.310699462890625, 0.320068359375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 8.0, 9.0, 9.0, 17.0, 24.0, 23.0, 61.0, 81.0, 131.0, 176.0, 167.0, 105.0, 68.0, 30.0, 34.0, 24.0, 9.0, 8.0, 8.0, 7.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2391357421875, -0.23110389709472656, -0.22307205200195312, -0.2150402069091797, -0.20700836181640625, -0.1989765167236328, -0.19094467163085938, -0.18291282653808594, -0.1748809814453125, -0.16684913635253906, -0.15881729125976562, -0.1507854461669922, -0.14275360107421875, -0.1347217559814453, -0.12668991088867188, -0.11865806579589844, -0.110626220703125, -0.10259437561035156, -0.09456253051757812, -0.08653068542480469, -0.07849884033203125, -0.07046699523925781, -0.062435150146484375, -0.05440330505371094, -0.0463714599609375, -0.03833961486816406, -0.030307769775390625, -0.022275924682617188, -0.01424407958984375, -0.0062122344970703125, 0.001819610595703125, 0.009851455688476562, 0.01788330078125, 0.025915145874023438, 0.033946990966796875, 0.04197883605957031, 0.05001068115234375, 0.05804252624511719, 0.06607437133789062, 0.07410621643066406, 0.0821380615234375, 0.09016990661621094, 0.09820175170898438, 0.10623359680175781, 0.11426544189453125, 0.12229728698730469, 0.13032913208007812, 0.13836097717285156, 0.146392822265625, 0.15442466735839844, 0.16245651245117188, 0.1704883575439453, 0.17852020263671875, 0.1865520477294922, 0.19458389282226562, 0.20261573791503906, 0.2106475830078125, 0.21867942810058594, 0.22671127319335938, 0.2347431182861328, 0.24277496337890625, 0.2508068084716797, 0.2588386535644531, 0.26687049865722656, 0.27490234375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 16.0, 82.0, 635.0, 252.0, 25.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.62903594970703, -18.192445755004883, -17.7558536529541, -17.319263458251953, -16.882673263549805, -16.446081161499023, -16.009490966796875, -15.572900772094727, -15.136309623718262, -14.699718475341797, -14.263128280639648, -13.826537132263184, -13.389945983886719, -12.95335578918457, -12.516764640808105, -12.08017349243164, -11.643583297729492, -11.206992149353027, -10.770401954650879, -10.333810806274414, -9.89721965789795, -9.4606294631958, -9.024038314819336, -8.587448120117188, -8.150856018066406, -7.7142653465271, -7.277674198150635, -6.841083526611328, -6.4044928550720215, -5.967902183532715, -5.53131103515625, -5.094720363616943, -4.658129692077637, -4.22153902053833, -3.7849481105804443, -3.3483572006225586, -2.911766529083252, -2.475175619125366, -2.0385847091674805, -1.6019940376281738, -1.165403127670288, -0.7288123369216919, -0.2922214865684509, 0.14436936378479004, 0.5809601545333862, 1.0175509452819824, 1.4541418552398682, 1.8907325267791748, 2.3273234367370605, 2.7639143466949463, 3.200505018234253, 3.6370959281921387, 4.073686599731445, 4.51027774810791, 4.946868419647217, 5.383459091186523, 5.820050239562988, 6.256640911102295, 6.69323205947876, 7.129822731018066, 7.566413402557373, 8.00300407409668, 8.439595222473145, 8.87618637084961, 9.312776565551758]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 2.0, 6.0, 8.0, 10.0, 13.0, 16.0, 18.0, 13.0, 18.0, 27.0, 18.0, 29.0, 23.0, 39.0, 33.0, 44.0, 36.0, 50.0, 47.0, 49.0, 42.0, 49.0, 35.0, 34.0, 45.0, 42.0, 38.0, 37.0, 26.0, 22.0, 25.0, 28.0, 16.0, 16.0, 13.0, 6.0, 8.0, 5.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7476615905761719, -1.6891059875488281, -1.6305503845214844, -1.5719947814941406, -1.5134391784667969, -1.4548835754394531, -1.3963279724121094, -1.337772250175476, -1.2792166471481323, -1.2206610441207886, -1.1621054410934448, -1.103549838066101, -1.0449942350387573, -0.9864385724067688, -0.927882969379425, -0.8693273067474365, -0.8107717633247375, -0.7522161602973938, -0.69366055727005, -0.6351048946380615, -0.5765492916107178, -0.517993688583374, -0.4594380855560303, -0.40088245272636414, -0.3423268496990204, -0.28377124667167664, -0.2252156138420105, -0.16666001081466675, -0.1081043928861618, -0.04954877495765686, 0.00900682806968689, 0.06756246089935303, 0.12611806392669678, 0.18467368185520172, 0.24322929978370667, 0.3017849028110504, 0.36034053564071655, 0.4188961386680603, 0.47745174169540405, 0.5360074043273926, 0.5945630073547363, 0.6531186103820801, 0.7116742134094238, 0.7702298164367676, 0.8287854790687561, 0.8873410820960999, 0.9458966851234436, 1.0044523477554321, 1.0630078315734863, 1.12156343460083, 1.1801190376281738, 1.2386746406555176, 1.2972302436828613, 1.355785846710205, 1.4143414497375488, 1.4728971719741821, 1.5314527750015259, 1.5900083780288696, 1.6485639810562134, 1.7071195840835571, 1.7656751871109009, 1.8242309093475342, 1.882786512374878, 1.9413421154022217, 1.9998977184295654]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 5.0, 9.0, 7.0, 12.0, 6.0, 23.0, 18.0, 26.0, 36.0, 50.0, 58.0, 96.0, 162.0, 231.0, 340.0, 613.0, 1171.0, 2613.0, 6687.0, 23795.0, 345878.0, 3749003.0, 46584.0, 9962.0, 3515.0, 1534.0, 744.0, 393.0, 237.0, 131.0, 86.0, 77.0, 52.0, 22.0, 19.0, 18.0, 15.0, 10.0, 5.0, 3.0, 5.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.91552734375, -0.8879318237304688, -0.8603363037109375, -0.8327407836914062, -0.805145263671875, -0.7775497436523438, -0.7499542236328125, -0.7223587036132812, -0.69476318359375, -0.6671676635742188, -0.6395721435546875, -0.6119766235351562, -0.584381103515625, -0.5567855834960938, -0.5291900634765625, -0.5015945434570312, -0.4739990234375, -0.44640350341796875, -0.4188079833984375, -0.39121246337890625, -0.363616943359375, -0.33602142333984375, -0.3084259033203125, -0.28083038330078125, -0.25323486328125, -0.22563934326171875, -0.1980438232421875, -0.17044830322265625, -0.142852783203125, -0.11525726318359375, -0.0876617431640625, -0.06006622314453125, -0.032470703125, -0.00487518310546875, 0.0227203369140625, 0.05031585693359375, 0.077911376953125, 0.10550689697265625, 0.1331024169921875, 0.16069793701171875, 0.18829345703125, 0.21588897705078125, 0.2434844970703125, 0.27108001708984375, 0.298675537109375, 0.32627105712890625, 0.3538665771484375, 0.38146209716796875, 0.4090576171875, 0.43665313720703125, 0.4642486572265625, 0.49184417724609375, 0.519439697265625, 0.5470352172851562, 0.5746307373046875, 0.6022262573242188, 0.62982177734375, 0.6574172973632812, 0.6850128173828125, 0.7126083374023438, 0.740203857421875, 0.7677993774414062, 0.7953948974609375, 0.8229904174804688, 0.8505859375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 9.0, 10.0, 14.0, 21.0, 24.0, 30.0, 53.0, 70.0, 92.0, 108.0, 114.0, 112.0, 83.0, 71.0, 49.0, 40.0, 27.0, 32.0, 11.0, 7.0, 11.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1995849609375, -0.193634033203125, -0.18768310546875, -0.181732177734375, -0.17578125, -0.169830322265625, -0.16387939453125, -0.157928466796875, -0.1519775390625, -0.146026611328125, -0.14007568359375, -0.134124755859375, -0.128173828125, -0.122222900390625, -0.11627197265625, -0.110321044921875, -0.1043701171875, -0.098419189453125, -0.09246826171875, -0.086517333984375, -0.08056640625, -0.074615478515625, -0.06866455078125, -0.062713623046875, -0.0567626953125, -0.050811767578125, -0.04486083984375, -0.038909912109375, -0.032958984375, -0.027008056640625, -0.02105712890625, -0.015106201171875, -0.0091552734375, -0.003204345703125, 0.00274658203125, 0.008697509765625, 0.0146484375, 0.020599365234375, 0.02655029296875, 0.032501220703125, 0.0384521484375, 0.044403076171875, 0.05035400390625, 0.056304931640625, 0.062255859375, 0.068206787109375, 0.07415771484375, 0.080108642578125, 0.0860595703125, 0.092010498046875, 0.09796142578125, 0.103912353515625, 0.10986328125, 0.115814208984375, 0.12176513671875, 0.127716064453125, 0.1336669921875, 0.139617919921875, 0.14556884765625, 0.151519775390625, 0.157470703125, 0.163421630859375, 0.16937255859375, 0.175323486328125, 0.1812744140625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 5.0, 9.0, 9.0, 18.0, 27.0, 39.0, 51.0, 112.0, 153.0, 265.0, 495.0, 1037.0, 2149.0, 5449.0, 15375.0, 69342.0, 3384822.0, 651371.0, 44000.0, 11492.0, 4286.0, 1892.0, 826.0, 469.0, 235.0, 130.0, 87.0, 63.0, 31.0, 17.0, 10.0, 6.0, 9.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7802734375, -0.7602005004882812, -0.7401275634765625, -0.7200546264648438, -0.699981689453125, -0.6799087524414062, -0.6598358154296875, -0.6397628784179688, -0.61968994140625, -0.5996170043945312, -0.5795440673828125, -0.5594711303710938, -0.539398193359375, -0.5193252563476562, -0.4992523193359375, -0.47917938232421875, -0.4591064453125, -0.43903350830078125, -0.4189605712890625, -0.39888763427734375, -0.378814697265625, -0.35874176025390625, -0.3386688232421875, -0.31859588623046875, -0.29852294921875, -0.27845001220703125, -0.2583770751953125, -0.23830413818359375, -0.218231201171875, -0.19815826416015625, -0.1780853271484375, -0.15801239013671875, -0.137939453125, -0.11786651611328125, -0.0977935791015625, -0.07772064208984375, -0.057647705078125, -0.03757476806640625, -0.0175018310546875, 0.00257110595703125, 0.02264404296875, 0.04271697998046875, 0.0627899169921875, 0.08286285400390625, 0.102935791015625, 0.12300872802734375, 0.1430816650390625, 0.16315460205078125, 0.1832275390625, 0.20330047607421875, 0.2233734130859375, 0.24344635009765625, 0.263519287109375, 0.28359222412109375, 0.3036651611328125, 0.32373809814453125, 0.34381103515625, 0.36388397216796875, 0.3839569091796875, 0.40402984619140625, 0.424102783203125, 0.44417572021484375, 0.4642486572265625, 0.48432159423828125, 0.50439453125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 11.0, 6.0, 5.0, 12.0, 13.0, 18.0, 50.0, 54.0, 117.0, 360.0, 2359.0, 673.0, 166.0, 86.0, 42.0, 19.0, 22.0, 17.0, 7.0, 6.0, 6.0, 7.0, 2.0, 3.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35302734375, -0.3445549011230469, -0.33608245849609375, -0.3276100158691406, -0.3191375732421875, -0.3106651306152344, -0.30219268798828125, -0.2937202453613281, -0.285247802734375, -0.2767753601074219, -0.26830291748046875, -0.2598304748535156, -0.2513580322265625, -0.24288558959960938, -0.23441314697265625, -0.22594070434570312, -0.21746826171875, -0.20899581909179688, -0.20052337646484375, -0.19205093383789062, -0.1835784912109375, -0.17510604858398438, -0.16663360595703125, -0.15816116333007812, -0.149688720703125, -0.14121627807617188, -0.13274383544921875, -0.12427139282226562, -0.1157989501953125, -0.10732650756835938, -0.09885406494140625, -0.09038162231445312, -0.0819091796875, -0.07343673706054688, -0.06496429443359375, -0.056491851806640625, -0.0480194091796875, -0.039546966552734375, -0.03107452392578125, -0.022602081298828125, -0.014129638671875, -0.005657196044921875, 0.00281524658203125, 0.011287689208984375, 0.0197601318359375, 0.028232574462890625, 0.03670501708984375, 0.045177459716796875, 0.05364990234375, 0.062122344970703125, 0.07059478759765625, 0.07906723022460938, 0.0875396728515625, 0.09601211547851562, 0.10448455810546875, 0.11295700073242188, 0.121429443359375, 0.12990188598632812, 0.13837432861328125, 0.14684677124023438, 0.1553192138671875, 0.16379165649414062, 0.17226409912109375, 0.18073654174804688, 0.189208984375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 17.0, 98.0, 306.0, 358.0, 168.0, 33.0, 11.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9152201414108276, -0.8144505620002747, -0.7136809825897217, -0.6129114031791687, -0.5121418237686157, -0.41137224435806274, -0.31060266494750977, -0.2098330855369568, -0.10906350612640381, -0.00829392671585083, 0.09247565269470215, 0.19324523210525513, 0.2940148115158081, 0.3947843909263611, 0.49555397033691406, 0.596323549747467, 0.69709312915802, 0.797862708568573, 0.898632287979126, 0.999401867389679, 1.100171446800232, 1.2009410858154297, 1.301710605621338, 1.402480125427246, 1.5032497644424438, 1.6040194034576416, 1.7047889232635498, 1.805558443069458, 1.9063280820846558, 2.0070977210998535, 2.1078672409057617, 2.20863676071167, 2.309406280517578, 2.4101758003234863, 2.5109453201293945, 2.611715078353882, 2.71248459815979, 2.8132541179656982, 2.9140238761901855, 3.0147933959960938, 3.115562915802002, 3.21633243560791, 3.3171019554138184, 3.4178717136383057, 3.518641233444214, 3.619410753250122, 3.7201805114746094, 3.8209500312805176, 3.921719551086426, 4.022489070892334, 4.123258590698242, 4.22402811050415, 4.324797630310059, 4.425567626953125, 4.526337146759033, 4.627106666564941, 4.72787618637085, 4.828645706176758, 4.929415225982666, 5.030184745788574, 5.130954742431641, 5.231724262237549, 5.332493782043457, 5.433263301849365, 5.534032821655273]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 11.0, 13.0, 19.0, 14.0, 25.0, 30.0, 36.0, 32.0, 37.0, 60.0, 55.0, 45.0, 60.0, 70.0, 55.0, 41.0, 42.0, 57.0, 48.0, 44.0, 35.0, 30.0, 31.0, 23.0, 16.0, 18.0, 19.0, 10.0, 8.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7623158693313599, -0.7360689640045166, -0.7098220586776733, -0.6835751533508301, -0.6573282480239868, -0.6310813426971436, -0.6048344373703003, -0.5785874724388123, -0.552340567111969, -0.5260936617851257, -0.49984675645828247, -0.4735998511314392, -0.44735291600227356, -0.4211060106754303, -0.39485910534858704, -0.3686121702194214, -0.3423652946949005, -0.31611838936805725, -0.289871484041214, -0.26362454891204834, -0.23737764358520508, -0.21113073825836182, -0.18488383293151855, -0.1586369127035141, -0.13239000737667084, -0.10614309459924698, -0.07989618182182312, -0.05364927649497986, -0.027402363717556, -0.0011554509401321411, 0.02509145438671112, 0.051338374614715576, 0.07758527994155884, 0.1038321927189827, 0.13007910549640656, 0.15632601082324982, 0.18257293105125427, 0.20881983637809753, 0.2350667417049408, 0.26131367683410645, 0.2875605821609497, 0.31380748748779297, 0.34005439281463623, 0.3663012981414795, 0.39254823327064514, 0.4187951385974884, 0.44504204392433167, 0.4712889790534973, 0.4975358545780182, 0.5237827897071838, 0.5500296950340271, 0.5762766003608704, 0.6025235056877136, 0.6287704110145569, 0.6550173163414001, 0.6812642216682434, 0.7075111269950867, 0.7337580323219299, 0.7600049376487732, 0.7862518429756165, 0.8124987483024597, 0.8387457132339478, 0.864992618560791, 0.8912395238876343, 0.9174864292144775]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 5.0, 9.0, 14.0, 19.0, 28.0, 33.0, 37.0, 60.0, 107.0, 130.0, 172.0, 317.0, 547.0, 996.0, 2115.0, 5057.0, 16600.0, 86867.0, 601249.0, 279293.0, 38637.0, 9451.0, 3328.0, 1569.0, 731.0, 417.0, 224.0, 163.0, 112.0, 60.0, 47.0, 33.0, 31.0, 24.0, 20.0, 7.0, 9.0, 7.0, 5.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.068359375, -1.0384979248046875, -1.008636474609375, -0.9787750244140625, -0.94891357421875, -0.9190521240234375, -0.889190673828125, -0.8593292236328125, -0.8294677734375, -0.7996063232421875, -0.769744873046875, -0.7398834228515625, -0.71002197265625, -0.6801605224609375, -0.650299072265625, -0.6204376220703125, -0.590576171875, -0.5607147216796875, -0.530853271484375, -0.5009918212890625, -0.47113037109375, -0.4412689208984375, -0.411407470703125, -0.3815460205078125, -0.3516845703125, -0.3218231201171875, -0.291961669921875, -0.2621002197265625, -0.23223876953125, -0.2023773193359375, -0.172515869140625, -0.1426544189453125, -0.11279296875, -0.0829315185546875, -0.053070068359375, -0.0232086181640625, 0.00665283203125, 0.0365142822265625, 0.066375732421875, 0.0962371826171875, 0.1260986328125, 0.1559600830078125, 0.185821533203125, 0.2156829833984375, 0.24554443359375, 0.2754058837890625, 0.305267333984375, 0.3351287841796875, 0.364990234375, 0.3948516845703125, 0.424713134765625, 0.4545745849609375, 0.48443603515625, 0.5142974853515625, 0.544158935546875, 0.5740203857421875, 0.6038818359375, 0.6337432861328125, 0.663604736328125, 0.6934661865234375, 0.72332763671875, 0.7531890869140625, 0.783050537109375, 0.8129119873046875, 0.8427734375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 6.0, 13.0, 16.0, 25.0, 30.0, 36.0, 63.0, 73.0, 120.0, 99.0, 115.0, 95.0, 86.0, 56.0, 43.0, 37.0, 28.0, 24.0, 11.0, 4.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1993408203125, -0.19330787658691406, -0.18727493286132812, -0.1812419891357422, -0.17520904541015625, -0.1691761016845703, -0.16314315795898438, -0.15711021423339844, -0.1510772705078125, -0.14504432678222656, -0.13901138305664062, -0.1329784393310547, -0.12694549560546875, -0.12091255187988281, -0.11487960815429688, -0.10884666442871094, -0.102813720703125, -0.09678077697753906, -0.09074783325195312, -0.08471488952636719, -0.07868194580078125, -0.07264900207519531, -0.06661605834960938, -0.06058311462402344, -0.0545501708984375, -0.04851722717285156, -0.042484283447265625, -0.03645133972167969, -0.03041839599609375, -0.024385452270507812, -0.018352508544921875, -0.012319564819335938, -0.00628662109375, -0.0002536773681640625, 0.005779266357421875, 0.011812210083007812, 0.01784515380859375, 0.023878097534179688, 0.029911041259765625, 0.03594398498535156, 0.0419769287109375, 0.04800987243652344, 0.054042816162109375, 0.06007575988769531, 0.06610870361328125, 0.07214164733886719, 0.07817459106445312, 0.08420753479003906, 0.090240478515625, 0.09627342224121094, 0.10230636596679688, 0.10833930969238281, 0.11437225341796875, 0.12040519714355469, 0.12643814086914062, 0.13247108459472656, 0.1385040283203125, 0.14453697204589844, 0.15056991577148438, 0.1566028594970703, 0.16263580322265625, 0.1686687469482422, 0.17470169067382812, 0.18073463439941406, 0.186767578125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 9.0, 1.0, 5.0, 6.0, 8.0, 14.0, 26.0, 34.0, 41.0, 77.0, 127.0, 215.0, 371.0, 640.0, 1247.0, 2815.0, 7517.0, 26193.0, 156663.0, 679098.0, 137075.0, 23723.0, 7143.0, 2801.0, 1175.0, 611.0, 343.0, 201.0, 140.0, 58.0, 65.0, 34.0, 25.0, 13.0, 12.0, 11.0, 6.0, 8.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78125, -0.7547378540039062, -0.7282257080078125, -0.7017135620117188, -0.675201416015625, -0.6486892700195312, -0.6221771240234375, -0.5956649780273438, -0.56915283203125, -0.5426406860351562, -0.5161285400390625, -0.48961639404296875, -0.463104248046875, -0.43659210205078125, -0.4100799560546875, -0.38356781005859375, -0.3570556640625, -0.33054351806640625, -0.3040313720703125, -0.27751922607421875, -0.251007080078125, -0.22449493408203125, -0.1979827880859375, -0.17147064208984375, -0.14495849609375, -0.11844635009765625, -0.0919342041015625, -0.06542205810546875, -0.038909912109375, -0.01239776611328125, 0.0141143798828125, 0.04062652587890625, 0.067138671875, 0.09365081787109375, 0.1201629638671875, 0.14667510986328125, 0.173187255859375, 0.19969940185546875, 0.2262115478515625, 0.25272369384765625, 0.27923583984375, 0.30574798583984375, 0.3322601318359375, 0.35877227783203125, 0.385284423828125, 0.41179656982421875, 0.4383087158203125, 0.46482086181640625, 0.4913330078125, 0.5178451538085938, 0.5443572998046875, 0.5708694458007812, 0.597381591796875, 0.6238937377929688, 0.6504058837890625, 0.6769180297851562, 0.70343017578125, 0.7299423217773438, 0.7564544677734375, 0.7829666137695312, 0.809478759765625, 0.8359909057617188, 0.8625030517578125, 0.8890151977539062, 0.91552734375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 3.0, 7.0, 6.0, 10.0, 14.0, 14.0, 11.0, 35.0, 28.0, 41.0, 52.0, 60.0, 59.0, 66.0, 85.0, 75.0, 78.0, 59.0, 51.0, 38.0, 49.0, 34.0, 26.0, 22.0, 19.0, 14.0, 13.0, 11.0, 7.0, 4.0, 3.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5595703125, -0.5363311767578125, -0.513092041015625, -0.4898529052734375, -0.46661376953125, -0.4433746337890625, -0.420135498046875, -0.3968963623046875, -0.3736572265625, -0.3504180908203125, -0.327178955078125, -0.3039398193359375, -0.28070068359375, -0.2574615478515625, -0.234222412109375, -0.2109832763671875, -0.187744140625, -0.1645050048828125, -0.141265869140625, -0.1180267333984375, -0.09478759765625, -0.0715484619140625, -0.048309326171875, -0.0250701904296875, -0.0018310546875, 0.0214080810546875, 0.044647216796875, 0.0678863525390625, 0.09112548828125, 0.1143646240234375, 0.137603759765625, 0.1608428955078125, 0.18408203125, 0.2073211669921875, 0.230560302734375, 0.2537994384765625, 0.27703857421875, 0.3002777099609375, 0.323516845703125, 0.3467559814453125, 0.3699951171875, 0.3932342529296875, 0.416473388671875, 0.4397125244140625, 0.46295166015625, 0.4861907958984375, 0.509429931640625, 0.5326690673828125, 0.555908203125, 0.5791473388671875, 0.602386474609375, 0.6256256103515625, 0.64886474609375, 0.6721038818359375, 0.695343017578125, 0.7185821533203125, 0.7418212890625, 0.7650604248046875, 0.788299560546875, 0.8115386962890625, 0.83477783203125, 0.8580169677734375, 0.881256103515625, 0.9044952392578125, 0.927734375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 10.0, 12.0, 16.0, 50.0, 99.0, 225.0, 564.0, 2404.0, 21323.0, 1003062.0, 17679.0, 2160.0, 539.0, 217.0, 92.0, 38.0, 23.0, 13.0, 4.0, 1.0, 7.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.337890625, -2.252777099609375, -2.16766357421875, -2.082550048828125, -1.9974365234375, -1.912322998046875, -1.82720947265625, -1.742095947265625, -1.656982421875, -1.571868896484375, -1.48675537109375, -1.401641845703125, -1.3165283203125, -1.231414794921875, -1.14630126953125, -1.061187744140625, -0.97607421875, -0.890960693359375, -0.80584716796875, -0.720733642578125, -0.6356201171875, -0.550506591796875, -0.46539306640625, -0.380279541015625, -0.295166015625, -0.210052490234375, -0.12493896484375, -0.039825439453125, 0.0452880859375, 0.130401611328125, 0.21551513671875, 0.300628662109375, 0.3857421875, 0.470855712890625, 0.55596923828125, 0.641082763671875, 0.7261962890625, 0.811309814453125, 0.89642333984375, 0.981536865234375, 1.066650390625, 1.151763916015625, 1.23687744140625, 1.321990966796875, 1.4071044921875, 1.492218017578125, 1.57733154296875, 1.662445068359375, 1.74755859375, 1.832672119140625, 1.91778564453125, 2.002899169921875, 2.0880126953125, 2.173126220703125, 2.25823974609375, 2.343353271484375, 2.428466796875, 2.513580322265625, 2.59869384765625, 2.683807373046875, 2.7689208984375, 2.854034423828125, 2.93914794921875, 3.024261474609375, 3.109375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 7.0, 12.0, 20.0, 26.0, 32.0, 59.0, 61.0, 89.0, 185.0, 145.0, 90.0, 76.0, 63.0, 36.0, 27.0, 23.0, 20.0, 11.0, 4.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0], "bins": [-0.0003962516784667969, -0.0003879815340042114, -0.000379711389541626, -0.00037144124507904053, -0.0003631711006164551, -0.00035490095615386963, -0.0003466308116912842, -0.00033836066722869873, -0.0003300905227661133, -0.00032182037830352783, -0.0003135502338409424, -0.00030528008937835693, -0.0002970099449157715, -0.00028873980045318604, -0.0002804696559906006, -0.00027219951152801514, -0.0002639293670654297, -0.00025565922260284424, -0.0002473890781402588, -0.00023911893367767334, -0.0002308487892150879, -0.00022257864475250244, -0.000214308500289917, -0.00020603835582733154, -0.0001977682113647461, -0.00018949806690216064, -0.0001812279224395752, -0.00017295777797698975, -0.0001646876335144043, -0.00015641748905181885, -0.0001481473445892334, -0.00013987720012664795, -0.0001316070556640625, -0.00012333691120147705, -0.0001150667667388916, -0.00010679662227630615, -9.85264778137207e-05, -9.025633335113525e-05, -8.19861888885498e-05, -7.371604442596436e-05, -6.54458999633789e-05, -5.717575550079346e-05, -4.890561103820801e-05, -4.063546657562256e-05, -3.236532211303711e-05, -2.409517765045166e-05, -1.582503318786621e-05, -7.554888725280762e-06, 7.152557373046875e-07, 8.985400199890137e-06, 1.7255544662475586e-05, 2.5525689125061035e-05, 3.3795833587646484e-05, 4.2065978050231934e-05, 5.033612251281738e-05, 5.860626697540283e-05, 6.687641143798828e-05, 7.514655590057373e-05, 8.341670036315918e-05, 9.168684482574463e-05, 9.995698928833008e-05, 0.00010822713375091553, 0.00011649727821350098, 0.00012476742267608643, 0.00013303756713867188]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 3.0, 2.0, 10.0, 17.0, 44.0, 92.0, 195.0, 408.0, 1117.0, 4942.0, 128589.0, 900524.0, 10029.0, 1581.0, 554.0, 238.0, 108.0, 39.0, 25.0, 15.0, 5.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.107421875, -2.0536041259765625, -1.999786376953125, -1.9459686279296875, -1.89215087890625, -1.8383331298828125, -1.784515380859375, -1.7306976318359375, -1.6768798828125, -1.6230621337890625, -1.569244384765625, -1.5154266357421875, -1.46160888671875, -1.4077911376953125, -1.353973388671875, -1.3001556396484375, -1.246337890625, -1.1925201416015625, -1.138702392578125, -1.0848846435546875, -1.03106689453125, -0.9772491455078125, -0.923431396484375, -0.8696136474609375, -0.8157958984375, -0.7619781494140625, -0.708160400390625, -0.6543426513671875, -0.60052490234375, -0.5467071533203125, -0.492889404296875, -0.4390716552734375, -0.38525390625, -0.3314361572265625, -0.277618408203125, -0.2238006591796875, -0.16998291015625, -0.1161651611328125, -0.062347412109375, -0.0085296630859375, 0.0452880859375, 0.0991058349609375, 0.152923583984375, 0.2067413330078125, 0.26055908203125, 0.3143768310546875, 0.368194580078125, 0.4220123291015625, 0.475830078125, 0.5296478271484375, 0.583465576171875, 0.6372833251953125, 0.69110107421875, 0.7449188232421875, 0.798736572265625, 0.8525543212890625, 0.9063720703125, 0.9601898193359375, 1.014007568359375, 1.0678253173828125, 1.12164306640625, 1.1754608154296875, 1.229278564453125, 1.2830963134765625, 1.3369140625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 4.0, 3.0, 5.0, 8.0, 11.0, 23.0, 29.0, 82.0, 165.0, 381.0, 151.0, 60.0, 20.0, 13.0, 11.0, 5.0, 5.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.611328125, -1.5733261108398438, -1.5353240966796875, -1.4973220825195312, -1.459320068359375, -1.4213180541992188, -1.3833160400390625, -1.3453140258789062, -1.30731201171875, -1.2693099975585938, -1.2313079833984375, -1.1933059692382812, -1.155303955078125, -1.1173019409179688, -1.0792999267578125, -1.0412979125976562, -1.0032958984375, -0.9652938842773438, -0.9272918701171875, -0.8892898559570312, -0.851287841796875, -0.8132858276367188, -0.7752838134765625, -0.7372817993164062, -0.69927978515625, -0.6612777709960938, -0.6232757568359375, -0.5852737426757812, -0.547271728515625, -0.5092697143554688, -0.4712677001953125, -0.43326568603515625, -0.395263671875, -0.35726165771484375, -0.3192596435546875, -0.28125762939453125, -0.243255615234375, -0.20525360107421875, -0.1672515869140625, -0.12924957275390625, -0.09124755859375, -0.05324554443359375, -0.0152435302734375, 0.02275848388671875, 0.060760498046875, 0.09876251220703125, 0.1367645263671875, 0.17476654052734375, 0.2127685546875, 0.25077056884765625, 0.2887725830078125, 0.32677459716796875, 0.364776611328125, 0.40277862548828125, 0.4407806396484375, 0.47878265380859375, 0.51678466796875, 0.5547866821289062, 0.5927886962890625, 0.6307907104492188, 0.668792724609375, 0.7067947387695312, 0.7447967529296875, 0.7827987670898438, 0.82080078125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 7.0, 18.0, 41.0, 88.0, 178.0, 263.0, 200.0, 110.0, 48.0, 30.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.211750030517578, -15.74354362487793, -15.275337219238281, -14.807130813598633, -14.338924407958984, -13.870718002319336, -13.402511596679688, -12.934305191040039, -12.46609878540039, -11.997892379760742, -11.529685974121094, -11.061479568481445, -10.593273162841797, -10.125066757202148, -9.6568603515625, -9.188653945922852, -8.720446586608887, -8.252240180969238, -7.78403377532959, -7.315827369689941, -6.847620964050293, -6.3794145584106445, -5.911207675933838, -5.4430012702941895, -4.974794864654541, -4.506588459014893, -4.038382053375244, -3.5701754093170166, -3.101969003677368, -2.6337625980377197, -2.165555953979492, -1.6973495483398438, -1.2291440963745117, -0.7609376311302185, -0.2927311658859253, 0.1754753589630127, 0.6436817646026611, 1.1118881702423096, 1.580094814300537, 2.0483012199401855, 2.516507625579834, 2.9847140312194824, 3.452920436859131, 3.9211270809173584, 4.389333724975586, 4.857540130615234, 5.325746536254883, 5.793952941894531, 6.26215934753418, 6.730365753173828, 7.198572158813477, 7.666778564453125, 8.134984970092773, 8.603191375732422, 9.07139778137207, 9.539604187011719, 10.007810592651367, 10.476016998291016, 10.944223403930664, 11.412429809570312, 11.880636215209961, 12.34884262084961, 12.817049026489258, 13.285255432128906, 13.753462791442871]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 6.0, 7.0, 11.0, 12.0, 16.0, 26.0, 19.0, 26.0, 35.0, 34.0, 35.0, 45.0, 48.0, 42.0, 58.0, 64.0, 67.0, 50.0, 65.0, 51.0, 51.0, 47.0, 46.0, 26.0, 26.0, 24.0, 13.0, 13.0, 12.0, 13.0, 6.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.072422504425049, -5.903326034545898, -5.73422908782959, -5.5651326179504395, -5.396036148071289, -5.2269392013549805, -5.05784273147583, -4.88874626159668, -4.719649314880371, -4.550552845001221, -4.381455898284912, -4.212359428405762, -4.043262958526611, -3.8741660118103027, -3.7050695419311523, -3.535972833633423, -3.3668763637542725, -3.197779655456543, -3.0286831855773926, -2.859586477279663, -2.6904897689819336, -2.521393299102783, -2.3522965908050537, -2.183199882507324, -2.014103412628174, -1.8450068235397339, -1.6759101152420044, -1.5068135261535645, -1.337716817855835, -1.168620228767395, -0.9995236396789551, -0.8304269313812256, -0.6613302230834961, -0.4922335743904114, -0.32313695549964905, -0.15404033660888672, 0.015056312084197998, 0.18415296077728271, 0.35324954986572266, 0.5223462581634521, 0.6914428472518921, 0.8605394959449768, 1.0296361446380615, 1.1987327337265015, 1.3678293228149414, 1.536926031112671, 1.7060226202011108, 1.8751193284988403, 2.0442159175872803, 2.2133126258850098, 2.38240909576416, 2.5515058040618896, 2.720602512359619, 2.8896989822387695, 3.058795690536499, 3.2278923988342285, 3.396988868713379, 3.5660855770111084, 3.735182046890259, 3.9042787551879883, 4.073375225067139, 4.242472171783447, 4.411568641662598, 4.580665588378906, 4.749762058258057]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 5.0, 9.0, 6.0, 7.0, 13.0, 20.0, 26.0, 24.0, 40.0, 76.0, 108.0, 135.0, 257.0, 411.0, 683.0, 1219.0, 2363.0, 4969.0, 12908.0, 45721.0, 491541.0, 3501123.0, 98106.0, 20818.0, 7063.0, 3094.0, 1498.0, 777.0, 501.0, 291.0, 173.0, 86.0, 84.0, 37.0, 29.0, 14.0, 16.0, 6.0, 6.0, 0.0, 3.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.77197265625, -0.7472381591796875, -0.722503662109375, -0.6977691650390625, -0.67303466796875, -0.6483001708984375, -0.623565673828125, -0.5988311767578125, -0.5740966796875, -0.5493621826171875, -0.524627685546875, -0.4998931884765625, -0.47515869140625, -0.4504241943359375, -0.425689697265625, -0.4009552001953125, -0.376220703125, -0.3514862060546875, -0.326751708984375, -0.3020172119140625, -0.27728271484375, -0.2525482177734375, -0.227813720703125, -0.2030792236328125, -0.1783447265625, -0.1536102294921875, -0.128875732421875, -0.1041412353515625, -0.07940673828125, -0.0546722412109375, -0.029937744140625, -0.0052032470703125, 0.01953125, 0.0442657470703125, 0.069000244140625, 0.0937347412109375, 0.11846923828125, 0.1432037353515625, 0.167938232421875, 0.1926727294921875, 0.2174072265625, 0.2421417236328125, 0.266876220703125, 0.2916107177734375, 0.31634521484375, 0.3410797119140625, 0.365814208984375, 0.3905487060546875, 0.415283203125, 0.4400177001953125, 0.464752197265625, 0.4894866943359375, 0.51422119140625, 0.5389556884765625, 0.563690185546875, 0.5884246826171875, 0.6131591796875, 0.6378936767578125, 0.662628173828125, 0.6873626708984375, 0.71209716796875, 0.7368316650390625, 0.761566162109375, 0.7863006591796875, 0.81103515625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 13.0, 8.0, 14.0, 26.0, 22.0, 30.0, 40.0, 43.0, 65.0, 71.0, 82.0, 94.0, 78.0, 83.0, 76.0, 58.0, 51.0, 37.0, 32.0, 23.0, 14.0, 11.0, 7.0, 3.0, 4.0, 2.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2034912109375, -0.19744491577148438, -0.19139862060546875, -0.18535232543945312, -0.1793060302734375, -0.17325973510742188, -0.16721343994140625, -0.16116714477539062, -0.155120849609375, -0.14907455444335938, -0.14302825927734375, -0.13698196411132812, -0.1309356689453125, -0.12488937377929688, -0.11884307861328125, -0.11279678344726562, -0.10675048828125, -0.10070419311523438, -0.09465789794921875, -0.08861160278320312, -0.0825653076171875, -0.07651901245117188, -0.07047271728515625, -0.06442642211914062, -0.058380126953125, -0.052333831787109375, -0.04628753662109375, -0.040241241455078125, -0.0341949462890625, -0.028148651123046875, -0.02210235595703125, -0.016056060791015625, -0.010009765625, -0.003963470458984375, 0.00208282470703125, 0.008129119873046875, 0.0141754150390625, 0.020221710205078125, 0.02626800537109375, 0.032314300537109375, 0.038360595703125, 0.044406890869140625, 0.05045318603515625, 0.056499481201171875, 0.0625457763671875, 0.06859207153320312, 0.07463836669921875, 0.08068466186523438, 0.08673095703125, 0.09277725219726562, 0.09882354736328125, 0.10486984252929688, 0.1109161376953125, 0.11696243286132812, 0.12300872802734375, 0.12905502319335938, 0.135101318359375, 0.14114761352539062, 0.14719390869140625, 0.15324020385742188, 0.1592864990234375, 0.16533279418945312, 0.17137908935546875, 0.17742538452148438, 0.1834716796875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 9.0, 11.0, 12.0, 14.0, 19.0, 39.0, 40.0, 74.0, 84.0, 96.0, 153.0, 217.0, 339.0, 486.0, 766.0, 1296.0, 2682.0, 6343.0, 18375.0, 91674.0, 3406612.0, 597014.0, 46198.0, 12085.0, 4525.0, 2018.0, 1086.0, 636.0, 416.0, 280.0, 201.0, 140.0, 95.0, 72.0, 44.0, 45.0, 19.0, 19.0, 11.0, 13.0, 8.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.84619140625, -0.8187332153320312, -0.7912750244140625, -0.7638168334960938, -0.736358642578125, -0.7089004516601562, -0.6814422607421875, -0.6539840698242188, -0.62652587890625, -0.5990676879882812, -0.5716094970703125, -0.5441513061523438, -0.516693115234375, -0.48923492431640625, -0.4617767333984375, -0.43431854248046875, -0.4068603515625, -0.37940216064453125, -0.3519439697265625, -0.32448577880859375, -0.297027587890625, -0.26956939697265625, -0.2421112060546875, -0.21465301513671875, -0.18719482421875, -0.15973663330078125, -0.1322784423828125, -0.10482025146484375, -0.077362060546875, -0.04990386962890625, -0.0224456787109375, 0.00501251220703125, 0.032470703125, 0.05992889404296875, 0.0873870849609375, 0.11484527587890625, 0.142303466796875, 0.16976165771484375, 0.1972198486328125, 0.22467803955078125, 0.25213623046875, 0.27959442138671875, 0.3070526123046875, 0.33451080322265625, 0.361968994140625, 0.38942718505859375, 0.4168853759765625, 0.44434356689453125, 0.4718017578125, 0.49925994873046875, 0.5267181396484375, 0.5541763305664062, 0.581634521484375, 0.6090927124023438, 0.6365509033203125, 0.6640090942382812, 0.69146728515625, 0.7189254760742188, 0.7463836669921875, 0.7738418579101562, 0.801300048828125, 0.8287582397460938, 0.8562164306640625, 0.8836746215820312, 0.9111328125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 12.0, 8.0, 11.0, 26.0, 40.0, 96.0, 232.0, 1739.0, 1460.0, 239.0, 87.0, 40.0, 22.0, 14.0, 9.0, 8.0, 4.0, 9.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57080078125, -0.5503997802734375, -0.529998779296875, -0.5095977783203125, -0.48919677734375, -0.4687957763671875, -0.448394775390625, -0.4279937744140625, -0.4075927734375, -0.3871917724609375, -0.366790771484375, -0.3463897705078125, -0.32598876953125, -0.3055877685546875, -0.285186767578125, -0.2647857666015625, -0.244384765625, -0.2239837646484375, -0.203582763671875, -0.1831817626953125, -0.16278076171875, -0.1423797607421875, -0.121978759765625, -0.1015777587890625, -0.0811767578125, -0.0607757568359375, -0.040374755859375, -0.0199737548828125, 0.00042724609375, 0.0208282470703125, 0.041229248046875, 0.0616302490234375, 0.08203125, 0.1024322509765625, 0.122833251953125, 0.1432342529296875, 0.16363525390625, 0.1840362548828125, 0.204437255859375, 0.2248382568359375, 0.2452392578125, 0.2656402587890625, 0.286041259765625, 0.3064422607421875, 0.32684326171875, 0.3472442626953125, 0.367645263671875, 0.3880462646484375, 0.408447265625, 0.4288482666015625, 0.449249267578125, 0.4696502685546875, 0.49005126953125, 0.5104522705078125, 0.530853271484375, 0.5512542724609375, 0.5716552734375, 0.5920562744140625, 0.612457275390625, 0.6328582763671875, 0.65325927734375, 0.6736602783203125, 0.694061279296875, 0.7144622802734375, 0.73486328125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 11.0, 21.0, 45.0, 72.0, 115.0, 159.0, 194.0, 152.0, 82.0, 64.0, 35.0, 20.0, 9.0, 13.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.5355024337768555, -4.439301490783691, -4.343100547790527, -4.246899604797363, -4.150698661804199, -4.054497718811035, -3.958296775817871, -3.862095832824707, -3.765894889831543, -3.669693946838379, -3.573493003845215, -3.477292060852051, -3.3810911178588867, -3.2848901748657227, -3.1886892318725586, -3.0924882888793945, -2.9962873458862305, -2.9000864028930664, -2.8038854598999023, -2.7076845169067383, -2.611483573913574, -2.51528263092041, -2.419081687927246, -2.322880744934082, -2.226679801940918, -2.130478858947754, -2.03427791595459, -1.9380769729614258, -1.8418760299682617, -1.7456750869750977, -1.6494741439819336, -1.5532732009887695, -1.4570720195770264, -1.3608710765838623, -1.2646701335906982, -1.1684691905975342, -1.0722682476043701, -0.976067304611206, -0.879866361618042, -0.7836654186248779, -0.6874644756317139, -0.5912635326385498, -0.49506258964538574, -0.3988616466522217, -0.3026607036590576, -0.20645976066589355, -0.11025881767272949, -0.01405787467956543, 0.08214306831359863, 0.1783440113067627, 0.27454495429992676, 0.3707458972930908, 0.4669468402862549, 0.563147783279419, 0.659348726272583, 0.7555496692657471, 0.8517506122589111, 0.9479515552520752, 1.0441524982452393, 1.1403534412384033, 1.2365543842315674, 1.3327553272247314, 1.4289562702178955, 1.5251572132110596, 1.6213581562042236]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 0.0, 2.0, 6.0, 5.0, 7.0, 10.0, 17.0, 15.0, 19.0, 29.0, 28.0, 29.0, 24.0, 32.0, 36.0, 35.0, 41.0, 41.0, 35.0, 45.0, 45.0, 62.0, 56.0, 50.0, 48.0, 45.0, 43.0, 30.0, 33.0, 29.0, 16.0, 9.0, 18.0, 13.0, 17.0, 8.0, 5.0, 5.0, 5.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.5683906078338623, -1.5192416906356812, -1.4700926542282104, -1.4209437370300293, -1.3717948198318481, -1.3226457834243774, -1.2734968662261963, -1.2243478298187256, -1.1751989126205444, -1.1260499954223633, -1.0769009590148926, -1.0277520418167114, -0.9786030650138855, -0.9294540882110596, -0.8803051710128784, -0.8311561942100525, -0.7820072770118713, -0.7328583002090454, -0.6837093830108643, -0.6345604062080383, -0.5854114294052124, -0.5362625122070312, -0.4871135354042053, -0.4379645586013794, -0.38881561160087585, -0.3396666646003723, -0.2905176877975464, -0.24136874079704285, -0.1922197788953781, -0.14307081699371338, -0.09392186999320984, -0.04477289319038391, 0.004376053810119629, 0.053525011986494064, 0.1026739701628685, 0.15182292461395264, 0.20097188651561737, 0.2501208484172821, 0.29926979541778564, 0.3484187722206116, 0.3975677192211151, 0.44671666622161865, 0.4958656430244446, 0.5450146198272705, 0.5941635370254517, 0.6433125138282776, 0.6924614906311035, 0.7416104078292847, 0.7907593846321106, 0.8399083614349365, 0.8890572786331177, 0.9382062554359436, 0.9873552322387695, 1.0365041494369507, 1.0856530666351318, 1.1348021030426025, 1.1839510202407837, 1.2330999374389648, 1.2822489738464355, 1.3313978910446167, 1.3805468082427979, 1.4296958446502686, 1.4788447618484497, 1.5279936790466309, 1.5771427154541016]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 7.0, 11.0, 13.0, 24.0, 29.0, 42.0, 74.0, 129.0, 166.0, 298.0, 473.0, 895.0, 1823.0, 4058.0, 10510.0, 31580.0, 121796.0, 451201.0, 316282.0, 74322.0, 21097.0, 7441.0, 3064.0, 1441.0, 752.0, 378.0, 253.0, 120.0, 85.0, 57.0, 35.0, 33.0, 16.0, 15.0, 13.0, 6.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74755859375, -0.7206954956054688, -0.6938323974609375, -0.6669692993164062, -0.640106201171875, -0.6132431030273438, -0.5863800048828125, -0.5595169067382812, -0.53265380859375, -0.5057907104492188, -0.4789276123046875, -0.45206451416015625, -0.425201416015625, -0.39833831787109375, -0.3714752197265625, -0.34461212158203125, -0.3177490234375, -0.29088592529296875, -0.2640228271484375, -0.23715972900390625, -0.210296630859375, -0.18343353271484375, -0.1565704345703125, -0.12970733642578125, -0.10284423828125, -0.07598114013671875, -0.0491180419921875, -0.02225494384765625, 0.004608154296875, 0.03147125244140625, 0.0583343505859375, 0.08519744873046875, 0.112060546875, 0.13892364501953125, 0.1657867431640625, 0.19264984130859375, 0.219512939453125, 0.24637603759765625, 0.2732391357421875, 0.30010223388671875, 0.32696533203125, 0.35382843017578125, 0.3806915283203125, 0.40755462646484375, 0.434417724609375, 0.46128082275390625, 0.4881439208984375, 0.5150070190429688, 0.5418701171875, 0.5687332153320312, 0.5955963134765625, 0.6224594116210938, 0.649322509765625, 0.6761856079101562, 0.7030487060546875, 0.7299118041992188, 0.75677490234375, 0.7836380004882812, 0.8105010986328125, 0.8373641967773438, 0.864227294921875, 0.8910903930664062, 0.9179534912109375, 0.9448165893554688, 0.9716796875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 6.0, 9.0, 8.0, 20.0, 25.0, 37.0, 35.0, 40.0, 64.0, 79.0, 68.0, 77.0, 80.0, 76.0, 74.0, 52.0, 70.0, 55.0, 29.0, 34.0, 22.0, 6.0, 7.0, 5.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.209228515625, -0.20291709899902344, -0.19660568237304688, -0.1902942657470703, -0.18398284912109375, -0.1776714324951172, -0.17136001586914062, -0.16504859924316406, -0.1587371826171875, -0.15242576599121094, -0.14611434936523438, -0.1398029327392578, -0.13349151611328125, -0.1271800994873047, -0.12086868286132812, -0.11455726623535156, -0.108245849609375, -0.10193443298339844, -0.09562301635742188, -0.08931159973144531, -0.08300018310546875, -0.07668876647949219, -0.07037734985351562, -0.06406593322753906, -0.0577545166015625, -0.05144309997558594, -0.045131683349609375, -0.03882026672363281, -0.03250885009765625, -0.026197433471679688, -0.019886016845703125, -0.013574600219726562, -0.00726318359375, -0.0009517669677734375, 0.005359649658203125, 0.011671066284179688, 0.01798248291015625, 0.024293899536132812, 0.030605316162109375, 0.03691673278808594, 0.0432281494140625, 0.04953956604003906, 0.055850982666015625, 0.06216239929199219, 0.06847381591796875, 0.07478523254394531, 0.08109664916992188, 0.08740806579589844, 0.093719482421875, 0.10003089904785156, 0.10634231567382812, 0.11265373229980469, 0.11896514892578125, 0.1252765655517578, 0.13158798217773438, 0.13789939880371094, 0.1442108154296875, 0.15052223205566406, 0.15683364868164062, 0.1631450653076172, 0.16945648193359375, 0.1757678985595703, 0.18207931518554688, 0.18839073181152344, 0.1947021484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 16.0, 7.0, 17.0, 21.0, 32.0, 51.0, 85.0, 105.0, 189.0, 326.0, 518.0, 917.0, 1919.0, 3869.0, 9382.0, 25890.0, 89283.0, 373691.0, 399859.0, 96816.0, 27295.0, 9890.0, 4076.0, 1912.0, 1015.0, 526.0, 321.0, 191.0, 114.0, 76.0, 41.0, 29.0, 24.0, 14.0, 10.0, 5.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8359375, -0.8098373413085938, -0.7837371826171875, -0.7576370239257812, -0.731536865234375, -0.7054367065429688, -0.6793365478515625, -0.6532363891601562, -0.62713623046875, -0.6010360717773438, -0.5749359130859375, -0.5488357543945312, -0.522735595703125, -0.49663543701171875, -0.4705352783203125, -0.44443511962890625, -0.4183349609375, -0.39223480224609375, -0.3661346435546875, -0.34003448486328125, -0.313934326171875, -0.28783416748046875, -0.2617340087890625, -0.23563385009765625, -0.20953369140625, -0.18343353271484375, -0.1573333740234375, -0.13123321533203125, -0.105133056640625, -0.07903289794921875, -0.0529327392578125, -0.02683258056640625, -0.000732421875, 0.02536773681640625, 0.0514678955078125, 0.07756805419921875, 0.103668212890625, 0.12976837158203125, 0.1558685302734375, 0.18196868896484375, 0.20806884765625, 0.23416900634765625, 0.2602691650390625, 0.28636932373046875, 0.312469482421875, 0.33856964111328125, 0.3646697998046875, 0.39076995849609375, 0.4168701171875, 0.44297027587890625, 0.4690704345703125, 0.49517059326171875, 0.521270751953125, 0.5473709106445312, 0.5734710693359375, 0.5995712280273438, 0.62567138671875, 0.6517715454101562, 0.6778717041015625, 0.7039718627929688, 0.730072021484375, 0.7561721801757812, 0.7822723388671875, 0.8083724975585938, 0.83447265625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 7.0, 3.0, 5.0, 6.0, 13.0, 11.0, 18.0, 25.0, 21.0, 30.0, 36.0, 52.0, 53.0, 59.0, 58.0, 52.0, 74.0, 57.0, 49.0, 53.0, 54.0, 52.0, 39.0, 36.0, 28.0, 21.0, 21.0, 13.0, 16.0, 15.0, 5.0, 6.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1806640625, -1.1495437622070312, -1.1184234619140625, -1.0873031616210938, -1.056182861328125, -1.0250625610351562, -0.9939422607421875, -0.9628219604492188, -0.93170166015625, -0.9005813598632812, -0.8694610595703125, -0.8383407592773438, -0.807220458984375, -0.7761001586914062, -0.7449798583984375, -0.7138595581054688, -0.6827392578125, -0.6516189575195312, -0.6204986572265625, -0.5893783569335938, -0.558258056640625, -0.5271377563476562, -0.4960174560546875, -0.46489715576171875, -0.43377685546875, -0.40265655517578125, -0.3715362548828125, -0.34041595458984375, -0.309295654296875, -0.27817535400390625, -0.2470550537109375, -0.21593475341796875, -0.184814453125, -0.15369415283203125, -0.1225738525390625, -0.09145355224609375, -0.060333251953125, -0.02921295166015625, 0.0019073486328125, 0.03302764892578125, 0.06414794921875, 0.09526824951171875, 0.1263885498046875, 0.15750885009765625, 0.188629150390625, 0.21974945068359375, 0.2508697509765625, 0.28199005126953125, 0.3131103515625, 0.34423065185546875, 0.3753509521484375, 0.40647125244140625, 0.437591552734375, 0.46871185302734375, 0.4998321533203125, 0.5309524536132812, 0.56207275390625, 0.5931930541992188, 0.6243133544921875, 0.6554336547851562, 0.686553955078125, 0.7176742553710938, 0.7487945556640625, 0.7799148559570312, 0.81103515625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 12.0, 19.0, 21.0, 31.0, 75.0, 133.0, 288.0, 773.0, 3429.0, 46658.0, 954680.0, 37961.0, 3158.0, 779.0, 266.0, 121.0, 61.0, 32.0, 19.0, 11.0, 7.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4638671875, -1.3987274169921875, -1.333587646484375, -1.2684478759765625, -1.20330810546875, -1.1381683349609375, -1.073028564453125, -1.0078887939453125, -0.9427490234375, -0.8776092529296875, -0.812469482421875, -0.7473297119140625, -0.68218994140625, -0.6170501708984375, -0.551910400390625, -0.4867706298828125, -0.421630859375, -0.3564910888671875, -0.291351318359375, -0.2262115478515625, -0.16107177734375, -0.0959320068359375, -0.030792236328125, 0.0343475341796875, 0.0994873046875, 0.1646270751953125, 0.229766845703125, 0.2949066162109375, 0.36004638671875, 0.4251861572265625, 0.490325927734375, 0.5554656982421875, 0.62060546875, 0.6857452392578125, 0.750885009765625, 0.8160247802734375, 0.88116455078125, 0.9463043212890625, 1.011444091796875, 1.0765838623046875, 1.1417236328125, 1.2068634033203125, 1.272003173828125, 1.3371429443359375, 1.40228271484375, 1.4674224853515625, 1.532562255859375, 1.5977020263671875, 1.662841796875, 1.7279815673828125, 1.793121337890625, 1.8582611083984375, 1.92340087890625, 1.9885406494140625, 2.053680419921875, 2.1188201904296875, 2.1839599609375, 2.2490997314453125, 2.314239501953125, 2.3793792724609375, 2.44451904296875, 2.5096588134765625, 2.574798583984375, 2.6399383544921875, 2.705078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 5.0, 9.0, 11.0, 13.0, 15.0, 31.0, 39.0, 54.0, 61.0, 65.0, 105.0, 90.0, 91.0, 84.0, 78.0, 56.0, 52.0, 30.0, 28.0, 24.0, 19.0, 8.0, 9.0, 10.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00022912025451660156, -0.00022213906049728394, -0.0002151578664779663, -0.00020817667245864868, -0.00020119547843933105, -0.00019421428442001343, -0.0001872330904006958, -0.00018025189638137817, -0.00017327070236206055, -0.00016628950834274292, -0.0001593083143234253, -0.00015232712030410767, -0.00014534592628479004, -0.0001383647322654724, -0.00013138353824615479, -0.00012440234422683716, -0.00011742115020751953, -0.0001104399561882019, -0.00010345876216888428, -9.647756814956665e-05, -8.949637413024902e-05, -8.25151801109314e-05, -7.553398609161377e-05, -6.855279207229614e-05, -6.157159805297852e-05, -5.459040403366089e-05, -4.760921001434326e-05, -4.0628015995025635e-05, -3.364682197570801e-05, -2.666562795639038e-05, -1.9684433937072754e-05, -1.2703239917755127e-05, -5.7220458984375e-06, 1.259148120880127e-06, 8.240342140197754e-06, 1.5221536159515381e-05, 2.2202730178833008e-05, 2.9183924198150635e-05, 3.616511821746826e-05, 4.314631223678589e-05, 5.0127506256103516e-05, 5.710870027542114e-05, 6.408989429473877e-05, 7.10710883140564e-05, 7.805228233337402e-05, 8.503347635269165e-05, 9.201467037200928e-05, 9.89958643913269e-05, 0.00010597705841064453, 0.00011295825242996216, 0.00011993944644927979, 0.0001269206404685974, 0.00013390183448791504, 0.00014088302850723267, 0.0001478642225265503, 0.00015484541654586792, 0.00016182661056518555, 0.00016880780458450317, 0.0001757889986038208, 0.00018277019262313843, 0.00018975138664245605, 0.00019673258066177368, 0.0002037137746810913, 0.00021069496870040894, 0.00021767616271972656]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 7.0, 6.0, 12.0, 6.0, 8.0, 12.0, 31.0, 30.0, 50.0, 66.0, 114.0, 163.0, 280.0, 443.0, 847.0, 1677.0, 3831.0, 11054.0, 42956.0, 290257.0, 591866.0, 78081.0, 16864.0, 5235.0, 2148.0, 1022.0, 541.0, 325.0, 192.0, 131.0, 78.0, 64.0, 49.0, 31.0, 24.0, 16.0, 12.0, 7.0, 7.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6748046875, -0.6538314819335938, -0.6328582763671875, -0.6118850708007812, -0.590911865234375, -0.5699386596679688, -0.5489654541015625, -0.5279922485351562, -0.50701904296875, -0.48604583740234375, -0.4650726318359375, -0.44409942626953125, -0.423126220703125, -0.40215301513671875, -0.3811798095703125, -0.36020660400390625, -0.3392333984375, -0.31826019287109375, -0.2972869873046875, -0.27631378173828125, -0.255340576171875, -0.23436737060546875, -0.2133941650390625, -0.19242095947265625, -0.17144775390625, -0.15047454833984375, -0.1295013427734375, -0.10852813720703125, -0.087554931640625, -0.06658172607421875, -0.0456085205078125, -0.02463531494140625, -0.003662109375, 0.01731109619140625, 0.0382843017578125, 0.05925750732421875, 0.080230712890625, 0.10120391845703125, 0.1221771240234375, 0.14315032958984375, 0.16412353515625, 0.18509674072265625, 0.2060699462890625, 0.22704315185546875, 0.248016357421875, 0.26898956298828125, 0.2899627685546875, 0.31093597412109375, 0.3319091796875, 0.35288238525390625, 0.3738555908203125, 0.39482879638671875, 0.415802001953125, 0.43677520751953125, 0.4577484130859375, 0.47872161865234375, 0.49969482421875, 0.5206680297851562, 0.5416412353515625, 0.5626144409179688, 0.583587646484375, 0.6045608520507812, 0.6255340576171875, 0.6465072631835938, 0.66748046875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 3.0, 4.0, 5.0, 10.0, 3.0, 12.0, 6.0, 18.0, 13.0, 21.0, 21.0, 29.0, 55.0, 63.0, 104.0, 144.0, 111.0, 82.0, 77.0, 40.0, 22.0, 27.0, 20.0, 16.0, 16.0, 13.0, 12.0, 8.0, 5.0, 3.0, 5.0, 5.0, 3.0, 3.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.74951171875, -0.7266616821289062, -0.7038116455078125, -0.6809616088867188, -0.658111572265625, -0.6352615356445312, -0.6124114990234375, -0.5895614624023438, -0.56671142578125, -0.5438613891601562, -0.5210113525390625, -0.49816131591796875, -0.475311279296875, -0.45246124267578125, -0.4296112060546875, -0.40676116943359375, -0.3839111328125, -0.36106109619140625, -0.3382110595703125, -0.31536102294921875, -0.292510986328125, -0.26966094970703125, -0.2468109130859375, -0.22396087646484375, -0.20111083984375, -0.17826080322265625, -0.1554107666015625, -0.13256072998046875, -0.109710693359375, -0.08686065673828125, -0.0640106201171875, -0.04116058349609375, -0.018310546875, 0.00453948974609375, 0.0273895263671875, 0.05023956298828125, 0.073089599609375, 0.09593963623046875, 0.1187896728515625, 0.14163970947265625, 0.16448974609375, 0.18733978271484375, 0.2101898193359375, 0.23303985595703125, 0.255889892578125, 0.27873992919921875, 0.3015899658203125, 0.32444000244140625, 0.3472900390625, 0.37014007568359375, 0.3929901123046875, 0.41584014892578125, 0.438690185546875, 0.46154022216796875, 0.4843902587890625, 0.5072402954101562, 0.53009033203125, 0.5529403686523438, 0.5757904052734375, 0.5986404418945312, 0.621490478515625, 0.6443405151367188, 0.6671905517578125, 0.6900405883789062, 0.712890625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 5.0, 11.0, 38.0, 78.0, 154.0, 201.0, 219.0, 154.0, 75.0, 30.0, 14.0, 12.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.661388397216797, -17.22071075439453, -16.780033111572266, -16.33935546875, -15.898676872253418, -15.457999229431152, -15.01732063293457, -14.576642990112305, -14.135965347290039, -13.695287704467773, -13.254610061645508, -12.813931465148926, -12.37325382232666, -11.932576179504395, -11.491897583007812, -11.051219940185547, -10.610542297363281, -10.169864654541016, -9.72918701171875, -9.288508415222168, -8.847830772399902, -8.407153129577637, -7.966475009918213, -7.525796890258789, -7.085119247436523, -6.644441604614258, -6.203763484954834, -5.76308536529541, -5.3224077224731445, -4.881730079650879, -4.441051959991455, -4.000373840332031, -3.559697151184082, -3.1190192699432373, -2.6783413887023926, -2.237663507461548, -1.7969856262207031, -1.3563077449798584, -0.9156298637390137, -0.47495198249816895, -0.03427410125732422, 0.4064037799835205, 0.8470816612243652, 1.28775954246521, 1.7284374237060547, 2.1691153049468994, 2.609793186187744, 3.050471067428589, 3.4911489486694336, 3.9318268299102783, 4.372504711151123, 4.813182830810547, 5.2538604736328125, 5.694538116455078, 6.135216236114502, 6.575894355773926, 7.016571998596191, 7.457249641418457, 7.897927761077881, 8.338605880737305, 8.77928352355957, 9.219961166381836, 9.660638809204102, 10.101317405700684, 10.54199504852295]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 9.0, 7.0, 8.0, 7.0, 8.0, 13.0, 17.0, 22.0, 18.0, 26.0, 26.0, 26.0, 46.0, 29.0, 31.0, 43.0, 42.0, 39.0, 52.0, 48.0, 47.0, 45.0, 48.0, 45.0, 37.0, 30.0, 28.0, 35.0, 28.0, 21.0, 12.0, 15.0, 13.0, 14.0, 13.0, 12.0, 13.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-5.533259391784668, -5.363619327545166, -5.193979263305664, -5.024339199066162, -4.85469913482666, -4.68505859375, -4.515418529510498, -4.345778465270996, -4.176138401031494, -4.006498336791992, -3.8368582725524902, -3.667217969894409, -3.4975779056549072, -3.3279378414154053, -3.158297538757324, -2.9886574745178223, -2.8190174102783203, -2.6493773460388184, -2.4797372817993164, -2.3100969791412354, -2.1404569149017334, -1.9708168506622314, -1.80117666721344, -1.6315364837646484, -1.4618964195251465, -1.2922563552856445, -1.122616171836853, -0.9529760479927063, -0.7833359241485596, -0.6136958003044128, -0.4440556764602661, -0.2744154930114746, -0.10477495193481445, 0.06486517190933228, 0.234505295753479, 0.40414541959762573, 0.5737855434417725, 0.7434256672859192, 0.9130657911300659, 1.0827059745788574, 1.2523460388183594, 1.4219861030578613, 1.5916262865066528, 1.7612664699554443, 1.9309065341949463, 2.1005465984344482, 2.2701869010925293, 2.4398269653320312, 2.609467029571533, 2.779107093811035, 2.948747158050537, 3.118387460708618, 3.28802752494812, 3.457667589187622, 3.627307891845703, 3.796947956085205, 3.966588020324707, 4.136228084564209, 4.305868148803711, 4.475508213043213, 4.645148277282715, 4.814788818359375, 4.984428882598877, 5.154068946838379, 5.323709011077881]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 3.0, 9.0, 17.0, 21.0, 34.0, 41.0, 59.0, 99.0, 112.0, 226.0, 370.0, 572.0, 1023.0, 1867.0, 3831.0, 8784.0, 24810.0, 111151.0, 3804409.0, 183680.0, 32801.0, 10750.0, 4537.0, 2207.0, 1135.0, 651.0, 393.0, 237.0, 149.0, 78.0, 70.0, 48.0, 30.0, 16.0, 11.0, 8.0, 8.0, 7.0, 2.0, 5.0, 6.0, 4.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83935546875, -0.81280517578125, -0.7862548828125, -0.75970458984375, -0.733154296875, -0.70660400390625, -0.6800537109375, -0.65350341796875, -0.626953125, -0.60040283203125, -0.5738525390625, -0.54730224609375, -0.520751953125, -0.49420166015625, -0.4676513671875, -0.44110107421875, -0.41455078125, -0.38800048828125, -0.3614501953125, -0.33489990234375, -0.308349609375, -0.28179931640625, -0.2552490234375, -0.22869873046875, -0.2021484375, -0.17559814453125, -0.1490478515625, -0.12249755859375, -0.095947265625, -0.06939697265625, -0.0428466796875, -0.01629638671875, 0.01025390625, 0.03680419921875, 0.0633544921875, 0.08990478515625, 0.116455078125, 0.14300537109375, 0.1695556640625, 0.19610595703125, 0.22265625, 0.24920654296875, 0.2757568359375, 0.30230712890625, 0.328857421875, 0.35540771484375, 0.3819580078125, 0.40850830078125, 0.43505859375, 0.46160888671875, 0.4881591796875, 0.51470947265625, 0.541259765625, 0.56781005859375, 0.5943603515625, 0.62091064453125, 0.6474609375, 0.67401123046875, 0.7005615234375, 0.72711181640625, 0.753662109375, 0.78021240234375, 0.8067626953125, 0.83331298828125, 0.85986328125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 4.0, 2.0, 3.0, 10.0, 8.0, 14.0, 16.0, 15.0, 21.0, 21.0, 42.0, 33.0, 54.0, 49.0, 67.0, 65.0, 75.0, 85.0, 47.0, 83.0, 44.0, 39.0, 42.0, 34.0, 37.0, 26.0, 15.0, 12.0, 6.0, 14.0, 8.0, 3.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23681640625, -0.23004531860351562, -0.22327423095703125, -0.21650314331054688, -0.2097320556640625, -0.20296096801757812, -0.19618988037109375, -0.18941879272460938, -0.182647705078125, -0.17587661743164062, -0.16910552978515625, -0.16233444213867188, -0.1555633544921875, -0.14879226684570312, -0.14202117919921875, -0.13525009155273438, -0.12847900390625, -0.12170791625976562, -0.11493682861328125, -0.10816574096679688, -0.1013946533203125, -0.09462356567382812, -0.08785247802734375, -0.08108139038085938, -0.074310302734375, -0.06753921508789062, -0.06076812744140625, -0.053997039794921875, -0.0472259521484375, -0.040454864501953125, -0.03368377685546875, -0.026912689208984375, -0.0201416015625, -0.013370513916015625, -0.00659942626953125, 0.000171661376953125, 0.0069427490234375, 0.013713836669921875, 0.02048492431640625, 0.027256011962890625, 0.034027099609375, 0.040798187255859375, 0.04756927490234375, 0.054340362548828125, 0.0611114501953125, 0.06788253784179688, 0.07465362548828125, 0.08142471313476562, 0.08819580078125, 0.09496688842773438, 0.10173797607421875, 0.10850906372070312, 0.1152801513671875, 0.12205123901367188, 0.12882232666015625, 0.13559341430664062, 0.142364501953125, 0.14913558959960938, 0.15590667724609375, 0.16267776489257812, 0.1694488525390625, 0.17621994018554688, 0.18299102783203125, 0.18976211547851562, 0.196533203125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 10.0, 10.0, 11.0, 23.0, 18.0, 29.0, 44.0, 68.0, 89.0, 147.0, 224.0, 334.0, 582.0, 968.0, 1761.0, 3852.0, 10062.0, 44058.0, 3535619.0, 546778.0, 33736.0, 8392.0, 3351.0, 1703.0, 920.0, 543.0, 345.0, 196.0, 130.0, 96.0, 63.0, 39.0, 34.0, 9.0, 9.0, 11.0, 8.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.3349609375, -1.2967376708984375, -1.258514404296875, -1.2202911376953125, -1.18206787109375, -1.1438446044921875, -1.105621337890625, -1.0673980712890625, -1.0291748046875, -0.9909515380859375, -0.952728271484375, -0.9145050048828125, -0.87628173828125, -0.8380584716796875, -0.799835205078125, -0.7616119384765625, -0.723388671875, -0.6851654052734375, -0.646942138671875, -0.6087188720703125, -0.57049560546875, -0.5322723388671875, -0.494049072265625, -0.4558258056640625, -0.4176025390625, -0.3793792724609375, -0.341156005859375, -0.3029327392578125, -0.26470947265625, -0.2264862060546875, -0.188262939453125, -0.1500396728515625, -0.11181640625, -0.0735931396484375, -0.035369873046875, 0.0028533935546875, 0.04107666015625, 0.0792999267578125, 0.117523193359375, 0.1557464599609375, 0.1939697265625, 0.2321929931640625, 0.270416259765625, 0.3086395263671875, 0.34686279296875, 0.3850860595703125, 0.423309326171875, 0.4615325927734375, 0.499755859375, 0.5379791259765625, 0.576202392578125, 0.6144256591796875, 0.65264892578125, 0.6908721923828125, 0.729095458984375, 0.7673187255859375, 0.8055419921875, 0.8437652587890625, 0.881988525390625, 0.9202117919921875, 0.95843505859375, 0.9966583251953125, 1.034881591796875, 1.0731048583984375, 1.111328125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 12.0, 6.0, 23.0, 44.0, 93.0, 328.0, 3125.0, 253.0, 66.0, 40.0, 26.0, 18.0, 8.0, 8.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3525390625, -0.3422966003417969, -0.33205413818359375, -0.3218116760253906, -0.3115692138671875, -0.3013267517089844, -0.29108428955078125, -0.2808418273925781, -0.270599365234375, -0.2603569030761719, -0.25011444091796875, -0.23987197875976562, -0.2296295166015625, -0.21938705444335938, -0.20914459228515625, -0.19890213012695312, -0.18865966796875, -0.17841720581054688, -0.16817474365234375, -0.15793228149414062, -0.1476898193359375, -0.13744735717773438, -0.12720489501953125, -0.11696243286132812, -0.106719970703125, -0.09647750854492188, -0.08623504638671875, -0.07599258422851562, -0.0657501220703125, -0.055507659912109375, -0.04526519775390625, -0.035022735595703125, -0.0247802734375, -0.014537811279296875, -0.00429534912109375, 0.005947113037109375, 0.0161895751953125, 0.026432037353515625, 0.03667449951171875, 0.046916961669921875, 0.057159423828125, 0.06740188598632812, 0.07764434814453125, 0.08788681030273438, 0.0981292724609375, 0.10837173461914062, 0.11861419677734375, 0.12885665893554688, 0.13909912109375, 0.14934158325195312, 0.15958404541015625, 0.16982650756835938, 0.1800689697265625, 0.19031143188476562, 0.20055389404296875, 0.21079635620117188, 0.221038818359375, 0.23128128051757812, 0.24152374267578125, 0.2517662048339844, 0.2620086669921875, 0.2722511291503906, 0.28249359130859375, 0.2927360534667969, 0.302978515625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 13.0, 17.0, 28.0, 37.0, 72.0, 94.0, 130.0, 131.0, 128.0, 127.0, 74.0, 52.0, 32.0, 25.0, 13.0, 6.0, 4.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.006881833076477, -0.9752042293548584, -0.9435266256332397, -0.9118490219116211, -0.8801714181900024, -0.8484938144683838, -0.8168161511421204, -0.7851385474205017, -0.7534609436988831, -0.7217833399772644, -0.6901057362556458, -0.6584281325340271, -0.6267504692077637, -0.595072865486145, -0.5633952617645264, -0.5317176580429077, -0.5000400543212891, -0.4683624505996704, -0.43668484687805176, -0.4050072133541107, -0.37332960963249207, -0.3416520059108734, -0.3099743723869324, -0.2782967686653137, -0.24661916494369507, -0.21494156122207642, -0.18326394259929657, -0.15158632397651672, -0.11990872025489807, -0.08823111653327942, -0.05655349791049957, -0.024875879287719727, 0.006801724433898926, 0.038479335606098175, 0.07015694677829742, 0.10183455795049667, 0.13351216912269592, 0.16518977284431458, 0.19686739146709442, 0.22854501008987427, 0.2602226138114929, 0.2919002175331116, 0.3235778212547302, 0.35525545477867126, 0.3869330585002899, 0.41861066222190857, 0.4502882957458496, 0.48196589946746826, 0.5136435031890869, 0.5453211069107056, 0.5769987106323242, 0.6086763143539429, 0.6403539180755615, 0.6720315217971802, 0.7037091851234436, 0.7353867888450623, 0.7670643925666809, 0.7987419962882996, 0.8304196000099182, 0.8620972037315369, 0.8937748670578003, 0.925452470779419, 0.9571300745010376, 0.9888076782226562, 1.020485281944275]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 7.0, 6.0, 3.0, 8.0, 10.0, 7.0, 14.0, 18.0, 25.0, 17.0, 16.0, 23.0, 40.0, 30.0, 30.0, 35.0, 39.0, 37.0, 44.0, 56.0, 27.0, 53.0, 48.0, 41.0, 41.0, 38.0, 37.0, 29.0, 29.0, 30.0, 24.0, 18.0, 14.0, 16.0, 22.0, 13.0, 9.0, 11.0, 6.0, 8.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5253311991691589, -0.5084941387176514, -0.4916570782661438, -0.4748200476169586, -0.45798298716545105, -0.4411459267139435, -0.4243088960647583, -0.40747183561325073, -0.39063477516174316, -0.3737977147102356, -0.356960654258728, -0.34012362360954285, -0.3232865631580353, -0.3064495027065277, -0.28961247205734253, -0.27277541160583496, -0.2559383511543274, -0.23910129070281982, -0.22226424515247345, -0.20542719960212708, -0.1885901391506195, -0.17175307869911194, -0.15491603314876556, -0.1380789875984192, -0.12124192714691162, -0.10440487414598465, -0.08756782114505768, -0.0707307681441307, -0.053893715143203735, -0.037056662142276764, -0.020219609141349792, -0.003382556140422821, 0.013454437255859375, 0.030291490256786346, 0.04712854325771332, 0.06396559625864029, 0.08080264925956726, 0.09763970226049423, 0.1144767552614212, 0.13131380081176758, 0.14815086126327515, 0.16498792171478271, 0.1818249672651291, 0.19866201281547546, 0.21549907326698303, 0.2323361337184906, 0.24917317926883698, 0.26601022481918335, 0.2828472852706909, 0.2996843457221985, 0.31652140617370605, 0.33335843682289124, 0.3501954972743988, 0.36703255772590637, 0.38386958837509155, 0.4007066488265991, 0.4175437092781067, 0.43438076972961426, 0.4512178301811218, 0.468054860830307, 0.4848919212818146, 0.5017289519309998, 0.5185660123825073, 0.5354030728340149, 0.5522401332855225]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 8.0, 9.0, 24.0, 40.0, 53.0, 99.0, 160.0, 282.0, 599.0, 1293.0, 2973.0, 8292.0, 27667.0, 121163.0, 459747.0, 327614.0, 70787.0, 17681.0, 5806.0, 2265.0, 937.0, 459.0, 230.0, 137.0, 78.0, 54.0, 37.0, 18.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.21875, -1.1827239990234375, -1.146697998046875, -1.1106719970703125, -1.07464599609375, -1.0386199951171875, -1.002593994140625, -0.9665679931640625, -0.9305419921875, -0.8945159912109375, -0.858489990234375, -0.8224639892578125, -0.78643798828125, -0.7504119873046875, -0.714385986328125, -0.6783599853515625, -0.642333984375, -0.6063079833984375, -0.570281982421875, -0.5342559814453125, -0.49822998046875, -0.4622039794921875, -0.426177978515625, -0.3901519775390625, -0.3541259765625, -0.3180999755859375, -0.282073974609375, -0.2460479736328125, -0.21002197265625, -0.1739959716796875, -0.137969970703125, -0.1019439697265625, -0.06591796875, -0.0298919677734375, 0.006134033203125, 0.0421600341796875, 0.07818603515625, 0.1142120361328125, 0.150238037109375, 0.1862640380859375, 0.2222900390625, 0.2583160400390625, 0.294342041015625, 0.3303680419921875, 0.36639404296875, 0.4024200439453125, 0.438446044921875, 0.4744720458984375, 0.510498046875, 0.5465240478515625, 0.582550048828125, 0.6185760498046875, 0.65460205078125, 0.6906280517578125, 0.726654052734375, 0.7626800537109375, 0.7987060546875, 0.8347320556640625, 0.870758056640625, 0.9067840576171875, 0.94281005859375, 0.9788360595703125, 1.014862060546875, 1.0508880615234375, 1.0869140625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 2.0, 4.0, 6.0, 9.0, 10.0, 12.0, 18.0, 19.0, 29.0, 34.0, 44.0, 40.0, 45.0, 49.0, 81.0, 51.0, 81.0, 54.0, 59.0, 60.0, 41.0, 32.0, 44.0, 33.0, 33.0, 23.0, 23.0, 17.0, 16.0, 12.0, 5.0, 6.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.250244140625, -0.24322128295898438, -0.23619842529296875, -0.22917556762695312, -0.2221527099609375, -0.21512985229492188, -0.20810699462890625, -0.20108413696289062, -0.194061279296875, -0.18703842163085938, -0.18001556396484375, -0.17299270629882812, -0.1659698486328125, -0.15894699096679688, -0.15192413330078125, -0.14490127563476562, -0.13787841796875, -0.13085556030273438, -0.12383270263671875, -0.11680984497070312, -0.1097869873046875, -0.10276412963867188, -0.09574127197265625, -0.08871841430664062, -0.081695556640625, -0.07467269897460938, -0.06764984130859375, -0.060626983642578125, -0.0536041259765625, -0.046581268310546875, -0.03955841064453125, -0.032535552978515625, -0.0255126953125, -0.018489837646484375, -0.01146697998046875, -0.004444122314453125, 0.0025787353515625, 0.009601593017578125, 0.01662445068359375, 0.023647308349609375, 0.030670166015625, 0.037693023681640625, 0.04471588134765625, 0.051738739013671875, 0.0587615966796875, 0.06578445434570312, 0.07280731201171875, 0.07983016967773438, 0.08685302734375, 0.09387588500976562, 0.10089874267578125, 0.10792160034179688, 0.1149444580078125, 0.12196731567382812, 0.12899017333984375, 0.13601303100585938, 0.143035888671875, 0.15005874633789062, 0.15708160400390625, 0.16410446166992188, 0.1711273193359375, 0.17815017700195312, 0.18517303466796875, 0.19219589233398438, 0.19921875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 7.0, 13.0, 16.0, 20.0, 31.0, 64.0, 87.0, 171.0, 304.0, 533.0, 1132.0, 2558.0, 6953.0, 25900.0, 155830.0, 645897.0, 169274.0, 27243.0, 7436.0, 2709.0, 1106.0, 537.0, 315.0, 150.0, 96.0, 65.0, 28.0, 28.0, 21.0, 12.0, 7.0, 2.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3134765625, -1.2718048095703125, -1.230133056640625, -1.1884613037109375, -1.14678955078125, -1.1051177978515625, -1.063446044921875, -1.0217742919921875, -0.9801025390625, -0.9384307861328125, -0.896759033203125, -0.8550872802734375, -0.81341552734375, -0.7717437744140625, -0.730072021484375, -0.6884002685546875, -0.646728515625, -0.6050567626953125, -0.563385009765625, -0.5217132568359375, -0.48004150390625, -0.4383697509765625, -0.396697998046875, -0.3550262451171875, -0.3133544921875, -0.2716827392578125, -0.230010986328125, -0.1883392333984375, -0.14666748046875, -0.1049957275390625, -0.063323974609375, -0.0216522216796875, 0.02001953125, 0.0616912841796875, 0.103363037109375, 0.1450347900390625, 0.18670654296875, 0.2283782958984375, 0.270050048828125, 0.3117218017578125, 0.3533935546875, 0.3950653076171875, 0.436737060546875, 0.4784088134765625, 0.52008056640625, 0.5617523193359375, 0.603424072265625, 0.6450958251953125, 0.686767578125, 0.7284393310546875, 0.770111083984375, 0.8117828369140625, 0.85345458984375, 0.8951263427734375, 0.936798095703125, 0.9784698486328125, 1.0201416015625, 1.0618133544921875, 1.103485107421875, 1.1451568603515625, 1.18682861328125, 1.2285003662109375, 1.270172119140625, 1.3118438720703125, 1.353515625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 6.0, 7.0, 4.0, 11.0, 9.0, 19.0, 21.0, 35.0, 36.0, 46.0, 50.0, 45.0, 65.0, 65.0, 68.0, 78.0, 42.0, 64.0, 48.0, 35.0, 36.0, 41.0, 35.0, 31.0, 25.0, 23.0, 11.0, 9.0, 11.0, 9.0, 8.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2158203125, -1.1701507568359375, -1.124481201171875, -1.0788116455078125, -1.03314208984375, -0.9874725341796875, -0.941802978515625, -0.8961334228515625, -0.8504638671875, -0.8047943115234375, -0.759124755859375, -0.7134552001953125, -0.66778564453125, -0.6221160888671875, -0.576446533203125, -0.5307769775390625, -0.485107421875, -0.4394378662109375, -0.393768310546875, -0.3480987548828125, -0.30242919921875, -0.2567596435546875, -0.211090087890625, -0.1654205322265625, -0.1197509765625, -0.0740814208984375, -0.028411865234375, 0.0172576904296875, 0.06292724609375, 0.1085968017578125, 0.154266357421875, 0.1999359130859375, 0.24560546875, 0.2912750244140625, 0.336944580078125, 0.3826141357421875, 0.42828369140625, 0.4739532470703125, 0.519622802734375, 0.5652923583984375, 0.6109619140625, 0.6566314697265625, 0.702301025390625, 0.7479705810546875, 0.79364013671875, 0.8393096923828125, 0.884979248046875, 0.9306488037109375, 0.976318359375, 1.0219879150390625, 1.067657470703125, 1.1133270263671875, 1.15899658203125, 1.2046661376953125, 1.250335693359375, 1.2960052490234375, 1.3416748046875, 1.3873443603515625, 1.433013916015625, 1.4786834716796875, 1.52435302734375, 1.5700225830078125, 1.615692138671875, 1.6613616943359375, 1.70703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 7.0, 12.0, 26.0, 32.0, 51.0, 81.0, 149.0, 255.0, 552.0, 1403.0, 5127.0, 47268.0, 929906.0, 55516.0, 5530.0, 1456.0, 534.0, 279.0, 141.0, 92.0, 48.0, 26.0, 14.0, 12.0, 11.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.841796875, -1.7833709716796875, -1.724945068359375, -1.6665191650390625, -1.60809326171875, -1.5496673583984375, -1.491241455078125, -1.4328155517578125, -1.3743896484375, -1.3159637451171875, -1.257537841796875, -1.1991119384765625, -1.14068603515625, -1.0822601318359375, -1.023834228515625, -0.9654083251953125, -0.906982421875, -0.8485565185546875, -0.790130615234375, -0.7317047119140625, -0.67327880859375, -0.6148529052734375, -0.556427001953125, -0.4980010986328125, -0.4395751953125, -0.3811492919921875, -0.322723388671875, -0.2642974853515625, -0.20587158203125, -0.1474456787109375, -0.089019775390625, -0.0305938720703125, 0.02783203125, 0.0862579345703125, 0.144683837890625, 0.2031097412109375, 0.26153564453125, 0.3199615478515625, 0.378387451171875, 0.4368133544921875, 0.4952392578125, 0.5536651611328125, 0.612091064453125, 0.6705169677734375, 0.72894287109375, 0.7873687744140625, 0.845794677734375, 0.9042205810546875, 0.962646484375, 1.0210723876953125, 1.079498291015625, 1.1379241943359375, 1.19635009765625, 1.2547760009765625, 1.313201904296875, 1.3716278076171875, 1.4300537109375, 1.4884796142578125, 1.546905517578125, 1.6053314208984375, 1.66375732421875, 1.7221832275390625, 1.780609130859375, 1.8390350341796875, 1.8974609375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 9.0, 16.0, 22.0, 36.0, 58.0, 108.0, 120.0, 144.0, 161.0, 110.0, 112.0, 47.0, 28.0, 15.0, 10.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0003917217254638672, -0.0003816969692707062, -0.00037167221307754517, -0.00036164745688438416, -0.00035162270069122314, -0.00034159794449806213, -0.0003315731883049011, -0.0003215484321117401, -0.0003115236759185791, -0.0003014989197254181, -0.0002914741635322571, -0.00028144940733909607, -0.00027142465114593506, -0.00026139989495277405, -0.00025137513875961304, -0.00024135038256645203, -0.00023132562637329102, -0.00022130087018013, -0.000211276113986969, -0.00020125135779380798, -0.00019122660160064697, -0.00018120184540748596, -0.00017117708921432495, -0.00016115233302116394, -0.00015112757682800293, -0.00014110282063484192, -0.0001310780644416809, -0.0001210533082485199, -0.00011102855205535889, -0.00010100379586219788, -9.097903966903687e-05, -8.095428347587585e-05, -7.092952728271484e-05, -6.090477108955383e-05, -5.088001489639282e-05, -4.085525870323181e-05, -3.08305025100708e-05, -2.080574631690979e-05, -1.078099012374878e-05, -7.562339305877686e-07, 9.268522262573242e-06, 1.9293278455734253e-05, 2.9318034648895264e-05, 3.9342790842056274e-05, 4.9367547035217285e-05, 5.9392303228378296e-05, 6.94170594215393e-05, 7.944181561470032e-05, 8.946657180786133e-05, 9.949132800102234e-05, 0.00010951608419418335, 0.00011954084038734436, 0.00012956559658050537, 0.00013959035277366638, 0.0001496151089668274, 0.0001596398651599884, 0.00016966462135314941, 0.00017968937754631042, 0.00018971413373947144, 0.00019973888993263245, 0.00020976364612579346, 0.00021978840231895447, 0.00022981315851211548, 0.0002398379147052765, 0.0002498626708984375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 5.0, 4.0, 8.0, 19.0, 12.0, 22.0, 34.0, 63.0, 96.0, 132.0, 268.0, 594.0, 1499.0, 5156.0, 36704.0, 840866.0, 148387.0, 10534.0, 2395.0, 838.0, 369.0, 204.0, 115.0, 59.0, 35.0, 36.0, 13.0, 22.0, 11.0, 14.0, 5.0, 5.0, 10.0, 3.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1259765625, -1.083831787109375, -1.04168701171875, -0.999542236328125, -0.9573974609375, -0.915252685546875, -0.87310791015625, -0.830963134765625, -0.788818359375, -0.746673583984375, -0.70452880859375, -0.662384033203125, -0.6202392578125, -0.578094482421875, -0.53594970703125, -0.493804931640625, -0.45166015625, -0.409515380859375, -0.36737060546875, -0.325225830078125, -0.2830810546875, -0.240936279296875, -0.19879150390625, -0.156646728515625, -0.114501953125, -0.072357177734375, -0.03021240234375, 0.011932373046875, 0.0540771484375, 0.096221923828125, 0.13836669921875, 0.180511474609375, 0.22265625, 0.264801025390625, 0.30694580078125, 0.349090576171875, 0.3912353515625, 0.433380126953125, 0.47552490234375, 0.517669677734375, 0.559814453125, 0.601959228515625, 0.64410400390625, 0.686248779296875, 0.7283935546875, 0.770538330078125, 0.81268310546875, 0.854827880859375, 0.89697265625, 0.939117431640625, 0.98126220703125, 1.023406982421875, 1.0655517578125, 1.107696533203125, 1.14984130859375, 1.191986083984375, 1.234130859375, 1.276275634765625, 1.31842041015625, 1.360565185546875, 1.4027099609375, 1.444854736328125, 1.48699951171875, 1.529144287109375, 1.5712890625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 1.0, 5.0, 3.0, 5.0, 9.0, 9.0, 16.0, 19.0, 35.0, 52.0, 79.0, 136.0, 218.0, 144.0, 78.0, 56.0, 39.0, 35.0, 14.0, 9.0, 8.0, 9.0, 3.0, 7.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6767578125, -1.6282806396484375, -1.579803466796875, -1.5313262939453125, -1.48284912109375, -1.4343719482421875, -1.385894775390625, -1.3374176025390625, -1.2889404296875, -1.2404632568359375, -1.191986083984375, -1.1435089111328125, -1.09503173828125, -1.0465545654296875, -0.998077392578125, -0.9496002197265625, -0.901123046875, -0.8526458740234375, -0.804168701171875, -0.7556915283203125, -0.70721435546875, -0.6587371826171875, -0.610260009765625, -0.5617828369140625, -0.5133056640625, -0.4648284912109375, -0.416351318359375, -0.3678741455078125, -0.31939697265625, -0.2709197998046875, -0.222442626953125, -0.1739654541015625, -0.12548828125, -0.0770111083984375, -0.028533935546875, 0.0199432373046875, 0.06842041015625, 0.1168975830078125, 0.165374755859375, 0.2138519287109375, 0.2623291015625, 0.3108062744140625, 0.359283447265625, 0.4077606201171875, 0.45623779296875, 0.5047149658203125, 0.553192138671875, 0.6016693115234375, 0.650146484375, 0.6986236572265625, 0.747100830078125, 0.7955780029296875, 0.84405517578125, 0.8925323486328125, 0.941009521484375, 0.9894866943359375, 1.0379638671875, 1.0864410400390625, 1.134918212890625, 1.1833953857421875, 1.23187255859375, 1.2803497314453125, 1.328826904296875, 1.3773040771484375, 1.42578125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 10.0, 40.0, 93.0, 266.0, 328.0, 172.0, 56.0, 23.0, 12.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.725555419921875, -37.84878158569336, -36.97201156616211, -36.095237731933594, -35.218467712402344, -34.34169387817383, -33.46492385864258, -32.58815002441406, -31.711380004882812, -30.83460807800293, -29.957836151123047, -29.081064224243164, -28.20429229736328, -27.3275203704834, -26.450748443603516, -25.573974609375, -24.697202682495117, -23.820430755615234, -22.94365882873535, -22.06688690185547, -21.190114974975586, -20.313343048095703, -19.436569213867188, -18.559799194335938, -17.683025360107422, -16.80625343322754, -15.929481506347656, -15.052709579467773, -14.17593765258789, -13.299165725708008, -12.422392845153809, -11.545620918273926, -10.668851852416992, -9.79207992553711, -8.915307998657227, -8.038536071777344, -7.161763668060303, -6.28499174118042, -5.408219337463379, -4.531447410583496, -3.6546754837036133, -2.7779035568237305, -1.9011313915252686, -1.0243592262268066, -0.14758729934692383, 0.729184627532959, 1.60595703125, 2.482728958129883, 3.3595008850097656, 4.236272811889648, 5.113044738769531, 5.989817142486572, 6.866589069366455, 7.743360996246338, 8.620133399963379, 9.496905326843262, 10.373677253723145, 11.250449180603027, 12.12722110748291, 13.00399398803711, 13.880765914916992, 14.757537841796875, 15.634309768676758, 16.51108169555664, 17.387853622436523]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 11.0, 3.0, 6.0, 15.0, 22.0, 20.0, 19.0, 30.0, 40.0, 39.0, 30.0, 44.0, 69.0, 49.0, 53.0, 60.0, 61.0, 48.0, 54.0, 41.0, 47.0, 35.0, 24.0, 34.0, 29.0, 23.0, 24.0, 15.0, 11.0, 10.0, 7.0, 4.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.49945068359375, -8.242652893066406, -7.985855579376221, -7.729058265686035, -7.47226095199585, -7.215463638305664, -6.95866584777832, -6.701868534088135, -6.445071220397949, -6.188273906707764, -5.93147611618042, -5.674678802490234, -5.417881488800049, -5.161084175109863, -4.9042863845825195, -4.647489070892334, -4.39069128036499, -4.133893966674805, -3.87709641456604, -3.6202988624572754, -3.36350154876709, -3.106703996658325, -2.8499064445495605, -2.593109130859375, -2.3363115787506104, -2.0795140266418457, -1.8227167129516602, -1.5659191608428955, -1.3091217279434204, -1.0523242950439453, -0.7955267429351807, -0.5387293100357056, -0.28193187713623047, -0.025134414434432983, 0.2316630482673645, 0.4884605407714844, 0.7452579736709595, 1.0020554065704346, 1.2588529586791992, 1.5156503915786743, 1.7724478244781494, 2.029245376586914, 2.2860426902770996, 2.5428402423858643, 2.799637794494629, 3.0564351081848145, 3.313232660293579, 3.5700302124023438, 3.8268275260925293, 4.083624839782715, 4.340422630310059, 4.597219944000244, 4.85401725769043, 5.110815048217773, 5.367612361907959, 5.6244096755981445, 5.881207466125488, 6.138004779815674, 6.394802570343018, 6.651599884033203, 6.908397197723389, 7.165194511413574, 7.421992301940918, 7.6787896156311035, 7.935586929321289]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 4.0, 8.0, 7.0, 5.0, 10.0, 22.0, 25.0, 38.0, 48.0, 80.0, 108.0, 184.0, 334.0, 523.0, 995.0, 2051.0, 5204.0, 17251.0, 111564.0, 3899512.0, 127724.0, 18574.0, 5412.0, 2103.0, 1049.0, 551.0, 310.0, 181.0, 113.0, 81.0, 62.0, 31.0, 24.0, 21.0, 23.0, 8.0, 8.0, 4.0, 9.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.439453125, -1.3907012939453125, -1.341949462890625, -1.2931976318359375, -1.24444580078125, -1.1956939697265625, -1.146942138671875, -1.0981903076171875, -1.0494384765625, -1.0006866455078125, -0.951934814453125, -0.9031829833984375, -0.85443115234375, -0.8056793212890625, -0.756927490234375, -0.7081756591796875, -0.659423828125, -0.6106719970703125, -0.561920166015625, -0.5131683349609375, -0.46441650390625, -0.4156646728515625, -0.366912841796875, -0.3181610107421875, -0.2694091796875, -0.2206573486328125, -0.171905517578125, -0.1231536865234375, -0.07440185546875, -0.0256500244140625, 0.023101806640625, 0.0718536376953125, 0.12060546875, 0.1693572998046875, 0.218109130859375, 0.2668609619140625, 0.31561279296875, 0.3643646240234375, 0.413116455078125, 0.4618682861328125, 0.5106201171875, 0.5593719482421875, 0.608123779296875, 0.6568756103515625, 0.70562744140625, 0.7543792724609375, 0.803131103515625, 0.8518829345703125, 0.900634765625, 0.9493865966796875, 0.998138427734375, 1.0468902587890625, 1.09564208984375, 1.1443939208984375, 1.193145751953125, 1.2418975830078125, 1.2906494140625, 1.3394012451171875, 1.388153076171875, 1.4369049072265625, 1.48565673828125, 1.5344085693359375, 1.583160400390625, 1.6319122314453125, 1.6806640625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 8.0, 5.0, 9.0, 16.0, 11.0, 10.0, 17.0, 24.0, 28.0, 36.0, 47.0, 50.0, 54.0, 72.0, 56.0, 75.0, 72.0, 71.0, 67.0, 66.0, 43.0, 29.0, 31.0, 22.0, 20.0, 10.0, 6.0, 10.0, 9.0, 9.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.33349609375, -0.3246021270751953, -0.3157081604003906, -0.30681419372558594, -0.29792022705078125, -0.28902626037597656, -0.2801322937011719, -0.2712383270263672, -0.2623443603515625, -0.2534503936767578, -0.24455642700195312, -0.23566246032714844, -0.22676849365234375, -0.21787452697753906, -0.20898056030273438, -0.2000865936279297, -0.191192626953125, -0.1822986602783203, -0.17340469360351562, -0.16451072692871094, -0.15561676025390625, -0.14672279357910156, -0.13782882690429688, -0.1289348602294922, -0.1200408935546875, -0.11114692687988281, -0.10225296020507812, -0.09335899353027344, -0.08446502685546875, -0.07557106018066406, -0.06667709350585938, -0.05778312683105469, -0.04888916015625, -0.03999519348144531, -0.031101226806640625, -0.022207260131835938, -0.01331329345703125, -0.0044193267822265625, 0.004474639892578125, 0.013368606567382812, 0.0222625732421875, 0.031156539916992188, 0.040050506591796875, 0.04894447326660156, 0.05783843994140625, 0.06673240661621094, 0.07562637329101562, 0.08452033996582031, 0.093414306640625, 0.10230827331542969, 0.11120223999023438, 0.12009620666503906, 0.12899017333984375, 0.13788414001464844, 0.14677810668945312, 0.1556720733642578, 0.1645660400390625, 0.1734600067138672, 0.18235397338867188, 0.19124794006347656, 0.20014190673828125, 0.20903587341308594, 0.21792984008789062, 0.2268238067626953, 0.2357177734375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 5.0, 8.0, 18.0, 30.0, 27.0, 34.0, 66.0, 101.0, 127.0, 191.0, 361.0, 654.0, 1242.0, 2750.0, 7687.0, 29712.0, 237143.0, 3777321.0, 108283.0, 18492.0, 5522.0, 2064.0, 1038.0, 565.0, 297.0, 159.0, 135.0, 76.0, 40.0, 42.0, 22.0, 11.0, 13.0, 13.0, 7.0, 10.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6884765625, -1.632843017578125, -1.57720947265625, -1.521575927734375, -1.4659423828125, -1.410308837890625, -1.35467529296875, -1.299041748046875, -1.243408203125, -1.187774658203125, -1.13214111328125, -1.076507568359375, -1.0208740234375, -0.965240478515625, -0.90960693359375, -0.853973388671875, -0.79833984375, -0.742706298828125, -0.68707275390625, -0.631439208984375, -0.5758056640625, -0.520172119140625, -0.46453857421875, -0.408905029296875, -0.353271484375, -0.297637939453125, -0.24200439453125, -0.186370849609375, -0.1307373046875, -0.075103759765625, -0.01947021484375, 0.036163330078125, 0.091796875, 0.147430419921875, 0.20306396484375, 0.258697509765625, 0.3143310546875, 0.369964599609375, 0.42559814453125, 0.481231689453125, 0.536865234375, 0.592498779296875, 0.64813232421875, 0.703765869140625, 0.7593994140625, 0.815032958984375, 0.87066650390625, 0.926300048828125, 0.98193359375, 1.037567138671875, 1.09320068359375, 1.148834228515625, 1.2044677734375, 1.260101318359375, 1.31573486328125, 1.371368408203125, 1.427001953125, 1.482635498046875, 1.53826904296875, 1.593902587890625, 1.6495361328125, 1.705169677734375, 1.76080322265625, 1.816436767578125, 1.8720703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 12.0, 15.0, 33.0, 73.0, 212.0, 2214.0, 1150.0, 171.0, 70.0, 48.0, 32.0, 13.0, 11.0, 6.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35888671875, -0.33892822265625, -0.3189697265625, -0.29901123046875, -0.279052734375, -0.25909423828125, -0.2391357421875, -0.21917724609375, -0.19921875, -0.17926025390625, -0.1593017578125, -0.13934326171875, -0.119384765625, -0.09942626953125, -0.0794677734375, -0.05950927734375, -0.03955078125, -0.01959228515625, 0.0003662109375, 0.02032470703125, 0.040283203125, 0.06024169921875, 0.0802001953125, 0.10015869140625, 0.1201171875, 0.14007568359375, 0.1600341796875, 0.17999267578125, 0.199951171875, 0.21990966796875, 0.2398681640625, 0.25982666015625, 0.27978515625, 0.29974365234375, 0.3197021484375, 0.33966064453125, 0.359619140625, 0.37957763671875, 0.3995361328125, 0.41949462890625, 0.439453125, 0.45941162109375, 0.4793701171875, 0.49932861328125, 0.519287109375, 0.53924560546875, 0.5592041015625, 0.57916259765625, 0.59912109375, 0.61907958984375, 0.6390380859375, 0.65899658203125, 0.678955078125, 0.69891357421875, 0.7188720703125, 0.73883056640625, 0.7587890625, 0.77874755859375, 0.7987060546875, 0.81866455078125, 0.838623046875, 0.85858154296875, 0.8785400390625, 0.89849853515625, 0.91845703125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 24.0, 43.0, 127.0, 206.0, 240.0, 163.0, 99.0, 50.0, 28.0, 9.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.364908695220947, -4.2325334548950195, -4.100157737731934, -3.9677822589874268, -3.83540678024292, -3.703031301498413, -3.5706558227539062, -3.4382803440093994, -3.3059048652648926, -3.1735293865203857, -3.041153907775879, -2.908778429031372, -2.7764029502868652, -2.6440274715423584, -2.5116519927978516, -2.3792765140533447, -2.246901035308838, -2.114525556564331, -1.9821500778198242, -1.8497745990753174, -1.7173991203308105, -1.5850236415863037, -1.4526481628417969, -1.32027268409729, -1.1878972053527832, -1.0555217266082764, -0.9231462478637695, -0.7907707691192627, -0.6583952903747559, -0.526019811630249, -0.3936443328857422, -0.26126885414123535, -0.12889385223388672, 0.003481626510620117, 0.13585710525512695, 0.2682325839996338, 0.4006080627441406, 0.5329835414886475, 0.6653590202331543, 0.7977344989776611, 0.930109977722168, 1.0624854564666748, 1.1948609352111816, 1.3272364139556885, 1.4596118927001953, 1.5919873714447021, 1.724362850189209, 1.8567383289337158, 1.9891138076782227, 2.1214892864227295, 2.2538647651672363, 2.386240243911743, 2.51861572265625, 2.650991201400757, 2.7833666801452637, 2.9157421588897705, 3.0481176376342773, 3.180493116378784, 3.312868595123291, 3.445244073867798, 3.5776195526123047, 3.7099950313568115, 3.8423705101013184, 3.974745988845825, 4.107121467590332]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 2.0, 5.0, 6.0, 9.0, 9.0, 21.0, 18.0, 25.0, 20.0, 24.0, 29.0, 38.0, 37.0, 32.0, 33.0, 43.0, 36.0, 47.0, 44.0, 41.0, 37.0, 33.0, 48.0, 33.0, 50.0, 39.0, 38.0, 38.0, 33.0, 28.0, 23.0, 21.0, 13.0, 10.0, 6.0, 8.0, 11.0, 9.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6801671981811523, -1.6221437454223633, -1.5641201734542847, -1.5060967206954956, -1.448073148727417, -1.390049695968628, -1.3320262432098389, -1.2740026712417603, -1.2159790992736816, -1.1579556465148926, -1.099932074546814, -1.041908621788025, -0.9838850498199463, -0.9258615970611572, -0.8678380846977234, -0.8098145723342896, -0.7517911195755005, -0.6937676072120667, -0.6357440948486328, -0.5777206420898438, -0.5196970701217651, -0.4616735875606537, -0.40365010499954224, -0.3456265926361084, -0.28760308027267456, -0.22957956790924072, -0.17155607044696808, -0.11353257298469543, -0.0555090606212616, 0.002514451742172241, 0.06053793430328369, 0.11856144666671753, 0.17658495903015137, 0.2346084713935852, 0.29263198375701904, 0.3506554663181305, 0.40867897868156433, 0.46670249104499817, 0.5247259736061096, 0.5827494859695435, 0.6407729983329773, 0.6987965106964111, 0.756820023059845, 0.8148435354232788, 0.8728669881820679, 0.9308905601501465, 0.9889140129089355, 1.0469374656677246, 1.1049610376358032, 1.1629844903945923, 1.221008062362671, 1.27903151512146, 1.3370550870895386, 1.3950785398483276, 1.4531021118164062, 1.5111255645751953, 1.5691490173339844, 1.6271724700927734, 1.685196042060852, 1.7432194948196411, 1.8012430667877197, 1.8592665195465088, 1.9172899723052979, 1.9753135442733765, 2.033337116241455]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 6.0, 11.0, 19.0, 31.0, 38.0, 53.0, 89.0, 165.0, 229.0, 416.0, 696.0, 1340.0, 2917.0, 6454.0, 17067.0, 51743.0, 174446.0, 410033.0, 261431.0, 79774.0, 24733.0, 8992.0, 3842.0, 1807.0, 957.0, 522.0, 281.0, 171.0, 84.0, 68.0, 39.0, 33.0, 27.0, 13.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.767578125, -0.740814208984375, -0.71405029296875, -0.687286376953125, -0.6605224609375, -0.633758544921875, -0.60699462890625, -0.580230712890625, -0.553466796875, -0.526702880859375, -0.49993896484375, -0.473175048828125, -0.4464111328125, -0.419647216796875, -0.39288330078125, -0.366119384765625, -0.33935546875, -0.312591552734375, -0.28582763671875, -0.259063720703125, -0.2322998046875, -0.205535888671875, -0.17877197265625, -0.152008056640625, -0.125244140625, -0.098480224609375, -0.07171630859375, -0.044952392578125, -0.0181884765625, 0.008575439453125, 0.03533935546875, 0.062103271484375, 0.0888671875, 0.115631103515625, 0.14239501953125, 0.169158935546875, 0.1959228515625, 0.222686767578125, 0.24945068359375, 0.276214599609375, 0.302978515625, 0.329742431640625, 0.35650634765625, 0.383270263671875, 0.4100341796875, 0.436798095703125, 0.46356201171875, 0.490325927734375, 0.51708984375, 0.543853759765625, 0.57061767578125, 0.597381591796875, 0.6241455078125, 0.650909423828125, 0.67767333984375, 0.704437255859375, 0.731201171875, 0.757965087890625, 0.78472900390625, 0.811492919921875, 0.8382568359375, 0.865020751953125, 0.89178466796875, 0.918548583984375, 0.9453125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 1.0, 5.0, 4.0, 6.0, 5.0, 4.0, 11.0, 18.0, 12.0, 17.0, 19.0, 23.0, 20.0, 32.0, 41.0, 41.0, 34.0, 36.0, 55.0, 65.0, 61.0, 62.0, 46.0, 44.0, 50.0, 55.0, 34.0, 31.0, 25.0, 24.0, 17.0, 23.0, 18.0, 11.0, 10.0, 7.0, 6.0, 12.0, 4.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.325439453125, -0.3160552978515625, -0.306671142578125, -0.2972869873046875, -0.28790283203125, -0.2785186767578125, -0.269134521484375, -0.2597503662109375, -0.2503662109375, -0.2409820556640625, -0.231597900390625, -0.2222137451171875, -0.21282958984375, -0.2034454345703125, -0.194061279296875, -0.1846771240234375, -0.17529296875, -0.1659088134765625, -0.156524658203125, -0.1471405029296875, -0.13775634765625, -0.1283721923828125, -0.118988037109375, -0.1096038818359375, -0.1002197265625, -0.0908355712890625, -0.081451416015625, -0.0720672607421875, -0.06268310546875, -0.0532989501953125, -0.043914794921875, -0.0345306396484375, -0.025146484375, -0.0157623291015625, -0.006378173828125, 0.0030059814453125, 0.01239013671875, 0.0217742919921875, 0.031158447265625, 0.0405426025390625, 0.0499267578125, 0.0593109130859375, 0.068695068359375, 0.0780792236328125, 0.08746337890625, 0.0968475341796875, 0.106231689453125, 0.1156158447265625, 0.125, 0.1343841552734375, 0.143768310546875, 0.1531524658203125, 0.16253662109375, 0.1719207763671875, 0.181304931640625, 0.1906890869140625, 0.2000732421875, 0.2094573974609375, 0.218841552734375, 0.2282257080078125, 0.23760986328125, 0.2469940185546875, 0.256378173828125, 0.2657623291015625, 0.275146484375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 3.0, 10.0, 6.0, 10.0, 13.0, 21.0, 32.0, 64.0, 103.0, 148.0, 355.0, 662.0, 1590.0, 4399.0, 23648.0, 495296.0, 491178.0, 23780.0, 4335.0, 1408.0, 680.0, 336.0, 167.0, 104.0, 81.0, 42.0, 23.0, 19.0, 12.0, 4.0, 8.0, 5.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.44921875, -2.370208740234375, -2.29119873046875, -2.212188720703125, -2.1331787109375, -2.054168701171875, -1.97515869140625, -1.896148681640625, -1.817138671875, -1.738128662109375, -1.65911865234375, -1.580108642578125, -1.5010986328125, -1.422088623046875, -1.34307861328125, -1.264068603515625, -1.18505859375, -1.106048583984375, -1.02703857421875, -0.948028564453125, -0.8690185546875, -0.790008544921875, -0.71099853515625, -0.631988525390625, -0.552978515625, -0.473968505859375, -0.39495849609375, -0.315948486328125, -0.2369384765625, -0.157928466796875, -0.07891845703125, 9.1552734375e-05, 0.0791015625, 0.158111572265625, 0.23712158203125, 0.316131591796875, 0.3951416015625, 0.474151611328125, 0.55316162109375, 0.632171630859375, 0.711181640625, 0.790191650390625, 0.86920166015625, 0.948211669921875, 1.0272216796875, 1.106231689453125, 1.18524169921875, 1.264251708984375, 1.34326171875, 1.422271728515625, 1.50128173828125, 1.580291748046875, 1.6593017578125, 1.738311767578125, 1.81732177734375, 1.896331787109375, 1.975341796875, 2.054351806640625, 2.13336181640625, 2.212371826171875, 2.2913818359375, 2.370391845703125, 2.44940185546875, 2.528411865234375, 2.607421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 10.0, 4.0, 13.0, 8.0, 20.0, 20.0, 29.0, 28.0, 30.0, 40.0, 49.0, 48.0, 70.0, 74.0, 79.0, 57.0, 69.0, 59.0, 56.0, 27.0, 41.0, 35.0, 24.0, 22.0, 24.0, 16.0, 13.0, 6.0, 4.0, 8.0, 7.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.951171875, -2.863861083984375, -2.77655029296875, -2.689239501953125, -2.6019287109375, -2.514617919921875, -2.42730712890625, -2.339996337890625, -2.252685546875, -2.165374755859375, -2.07806396484375, -1.990753173828125, -1.9034423828125, -1.816131591796875, -1.72882080078125, -1.641510009765625, -1.55419921875, -1.466888427734375, -1.37957763671875, -1.292266845703125, -1.2049560546875, -1.117645263671875, -1.03033447265625, -0.943023681640625, -0.855712890625, -0.768402099609375, -0.68109130859375, -0.593780517578125, -0.5064697265625, -0.419158935546875, -0.33184814453125, -0.244537353515625, -0.1572265625, -0.069915771484375, 0.01739501953125, 0.104705810546875, 0.1920166015625, 0.279327392578125, 0.36663818359375, 0.453948974609375, 0.541259765625, 0.628570556640625, 0.71588134765625, 0.803192138671875, 0.8905029296875, 0.977813720703125, 1.06512451171875, 1.152435302734375, 1.23974609375, 1.327056884765625, 1.41436767578125, 1.501678466796875, 1.5889892578125, 1.676300048828125, 1.76361083984375, 1.850921630859375, 1.938232421875, 2.025543212890625, 2.11285400390625, 2.200164794921875, 2.2874755859375, 2.374786376953125, 2.46209716796875, 2.549407958984375, 2.63671875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 3.0, 6.0, 12.0, 15.0, 14.0, 33.0, 48.0, 66.0, 137.0, 312.0, 770.0, 4061.0, 1024783.0, 16086.0, 1345.0, 462.0, 153.0, 93.0, 53.0, 35.0, 22.0, 12.0, 7.0, 6.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.609375, -8.3538818359375, -8.098388671875, -7.8428955078125, -7.58740234375, -7.3319091796875, -7.076416015625, -6.8209228515625, -6.5654296875, -6.3099365234375, -6.054443359375, -5.7989501953125, -5.54345703125, -5.2879638671875, -5.032470703125, -4.7769775390625, -4.521484375, -4.2659912109375, -4.010498046875, -3.7550048828125, -3.49951171875, -3.2440185546875, -2.988525390625, -2.7330322265625, -2.4775390625, -2.2220458984375, -1.966552734375, -1.7110595703125, -1.45556640625, -1.2000732421875, -0.944580078125, -0.6890869140625, -0.43359375, -0.1781005859375, 0.077392578125, 0.3328857421875, 0.58837890625, 0.8438720703125, 1.099365234375, 1.3548583984375, 1.6103515625, 1.8658447265625, 2.121337890625, 2.3768310546875, 2.63232421875, 2.8878173828125, 3.143310546875, 3.3988037109375, 3.654296875, 3.9097900390625, 4.165283203125, 4.4207763671875, 4.67626953125, 4.9317626953125, 5.187255859375, 5.4427490234375, 5.6982421875, 5.9537353515625, 6.209228515625, 6.4647216796875, 6.72021484375, 6.9757080078125, 7.231201171875, 7.4866943359375, 7.7421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 17.0, 20.0, 41.0, 102.0, 149.0, 212.0, 203.0, 130.0, 61.0, 33.0, 10.0, 12.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004134178161621094, -0.0004032682627439499, -0.0003931187093257904, -0.0003829691559076309, -0.00037281960248947144, -0.00036267004907131195, -0.00035252049565315247, -0.000342370942234993, -0.0003322213888168335, -0.000322071835398674, -0.0003119222819805145, -0.00030177272856235504, -0.00029162317514419556, -0.00028147362172603607, -0.0002713240683078766, -0.0002611745148897171, -0.0002510249614715576, -0.00024087540805339813, -0.00023072585463523865, -0.00022057630121707916, -0.00021042674779891968, -0.0002002771943807602, -0.0001901276409626007, -0.00017997808754444122, -0.00016982853412628174, -0.00015967898070812225, -0.00014952942728996277, -0.00013937987387180328, -0.0001292303204536438, -0.00011908076703548431, -0.00010893121361732483, -9.878166019916534e-05, -8.863210678100586e-05, -7.848255336284637e-05, -6.833299994468689e-05, -5.8183446526527405e-05, -4.803389310836792e-05, -3.7884339690208435e-05, -2.773478627204895e-05, -1.7585232853889465e-05, -7.4356794357299805e-06, 2.7138739824295044e-06, 1.286342740058899e-05, 2.3012980818748474e-05, 3.316253423690796e-05, 4.3312087655067444e-05, 5.346164107322693e-05, 6.361119449138641e-05, 7.37607479095459e-05, 8.391030132770538e-05, 9.405985474586487e-05, 0.00010420940816402435, 0.00011435896158218384, 0.00012450851500034332, 0.0001346580684185028, 0.0001448076218366623, 0.00015495717525482178, 0.00016510672867298126, 0.00017525628209114075, 0.00018540583550930023, 0.00019555538892745972, 0.0002057049423456192, 0.0002158544957637787, 0.00022600404918193817, 0.00023615360260009766]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 2.0, 14.0, 21.0, 31.0, 64.0, 114.0, 273.0, 753.0, 3655.0, 71098.0, 959598.0, 10669.0, 1491.0, 404.0, 172.0, 81.0, 29.0, 26.0, 11.0, 14.0, 14.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8828125, -4.758392333984375, -4.63397216796875, -4.509552001953125, -4.3851318359375, -4.260711669921875, -4.13629150390625, -4.011871337890625, -3.887451171875, -3.763031005859375, -3.63861083984375, -3.514190673828125, -3.3897705078125, -3.265350341796875, -3.14093017578125, -3.016510009765625, -2.89208984375, -2.767669677734375, -2.64324951171875, -2.518829345703125, -2.3944091796875, -2.269989013671875, -2.14556884765625, -2.021148681640625, -1.896728515625, -1.772308349609375, -1.64788818359375, -1.523468017578125, -1.3990478515625, -1.274627685546875, -1.15020751953125, -1.025787353515625, -0.9013671875, -0.776947021484375, -0.65252685546875, -0.528106689453125, -0.4036865234375, -0.279266357421875, -0.15484619140625, -0.030426025390625, 0.093994140625, 0.218414306640625, 0.34283447265625, 0.467254638671875, 0.5916748046875, 0.716094970703125, 0.84051513671875, 0.964935302734375, 1.08935546875, 1.213775634765625, 1.33819580078125, 1.462615966796875, 1.5870361328125, 1.711456298828125, 1.83587646484375, 1.960296630859375, 2.084716796875, 2.209136962890625, 2.33355712890625, 2.457977294921875, 2.5823974609375, 2.706817626953125, 2.83123779296875, 2.955657958984375, 3.080078125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 8.0, 6.0, 15.0, 47.0, 158.0, 406.0, 235.0, 61.0, 19.0, 9.0, 5.0, 2.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.51171875, -6.37213134765625, -6.2325439453125, -6.09295654296875, -5.953369140625, -5.81378173828125, -5.6741943359375, -5.53460693359375, -5.39501953125, -5.25543212890625, -5.1158447265625, -4.97625732421875, -4.836669921875, -4.69708251953125, -4.5574951171875, -4.41790771484375, -4.2783203125, -4.13873291015625, -3.9991455078125, -3.85955810546875, -3.719970703125, -3.58038330078125, -3.4407958984375, -3.30120849609375, -3.16162109375, -3.02203369140625, -2.8824462890625, -2.74285888671875, -2.603271484375, -2.46368408203125, -2.3240966796875, -2.18450927734375, -2.044921875, -1.90533447265625, -1.7657470703125, -1.62615966796875, -1.486572265625, -1.34698486328125, -1.2073974609375, -1.06781005859375, -0.92822265625, -0.78863525390625, -0.6490478515625, -0.50946044921875, -0.369873046875, -0.23028564453125, -0.0906982421875, 0.04888916015625, 0.1884765625, 0.32806396484375, 0.4676513671875, 0.60723876953125, 0.746826171875, 0.88641357421875, 1.0260009765625, 1.16558837890625, 1.30517578125, 1.44476318359375, 1.5843505859375, 1.72393798828125, 1.863525390625, 2.00311279296875, 2.1427001953125, 2.28228759765625, 2.421875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 38.0, 125.0, 353.0, 313.0, 116.0, 37.0, 16.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.729516983032227, -19.12299919128418, -17.516481399536133, -15.909964561462402, -14.303447723388672, -12.696929931640625, -11.090412139892578, -9.483895301818848, -7.877377510070801, -6.270860195159912, -4.664342880249023, -3.0578250885009766, -1.451307773590088, 0.15520954132080078, 1.7617273330688477, 3.368244171142578, 4.974761962890625, 6.581279277801514, 8.187796592712402, 9.79431438446045, 11.40083122253418, 13.007349014282227, 14.613866806030273, 16.220382690429688, 17.826900482177734, 19.43341827392578, 21.039936065673828, 22.646453857421875, 24.25296974182129, 25.859487533569336, 27.466005325317383, 29.072521209716797, 30.67904281616211, 32.285560607910156, 33.8920783996582, 35.49859619140625, 37.1051139831543, 38.711631774902344, 40.318145751953125, 41.92466354370117, 43.53118133544922, 45.137699127197266, 46.74421691894531, 48.35073471069336, 49.957252502441406, 51.56376647949219, 53.1702880859375, 54.77680206298828, 56.383323669433594, 57.98984146118164, 59.59635925292969, 61.202877044677734, 62.80939483642578, 64.41590881347656, 66.02243041992188, 67.62894439697266, 69.23545837402344, 70.84197235107422, 72.44849395751953, 74.05500793457031, 75.66152954101562, 77.2680435180664, 78.87456512451172, 80.4810791015625, 82.08760070800781]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 3.0, 4.0, 6.0, 8.0, 14.0, 10.0, 15.0, 14.0, 23.0, 30.0, 30.0, 28.0, 23.0, 40.0, 35.0, 45.0, 50.0, 48.0, 56.0, 61.0, 52.0, 47.0, 43.0, 34.0, 33.0, 40.0, 28.0, 38.0, 22.0, 18.0, 24.0, 15.0, 15.0, 13.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-15.148448944091797, -14.728678703308105, -14.308908462524414, -13.889138221740723, -13.469367980957031, -13.049596786499023, -12.629826545715332, -12.21005630493164, -11.79028606414795, -11.370515823364258, -10.950745582580566, -10.530975341796875, -10.111204147338867, -9.691434860229492, -9.271663665771484, -8.851893424987793, -8.432123184204102, -8.01235294342041, -7.592582702636719, -7.172811985015869, -6.753041744232178, -6.333271503448486, -5.913500785827637, -5.493730545043945, -5.073960304260254, -4.6541900634765625, -4.234419822692871, -3.8146491050720215, -3.39487886428833, -2.9751086235046387, -2.555338144302368, -2.1355676651000977, -1.7157974243164062, -1.2960270643234253, -0.8762567043304443, -0.4564863443374634, -0.03671598434448242, 0.383054256439209, 0.8028247356414795, 1.22259521484375, 1.6423654556274414, 2.062135696411133, 2.4819061756134033, 2.901676654815674, 3.3214468955993652, 3.7412171363830566, 4.160987854003906, 4.580758094787598, 5.000528335571289, 5.4202985763549805, 5.840068817138672, 6.2598395347595215, 6.679609775543213, 7.099380016326904, 7.519150733947754, 7.938920974731445, 8.358691215515137, 8.778461456298828, 9.19823169708252, 9.618001937866211, 10.037773132324219, 10.457542419433594, 10.877313613891602, 11.297083854675293, 11.716854095458984]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 7.0, 13.0, 22.0, 22.0, 43.0, 153.0, 453.0, 2756.0, 3999609.0, 188577.0, 2013.0, 374.0, 134.0, 47.0, 29.0, 18.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78515625, -5.50897216796875, -5.2327880859375, -4.95660400390625, -4.680419921875, -4.40423583984375, -4.1280517578125, -3.85186767578125, -3.57568359375, -3.29949951171875, -3.0233154296875, -2.74713134765625, -2.470947265625, -2.19476318359375, -1.9185791015625, -1.64239501953125, -1.3662109375, -1.09002685546875, -0.8138427734375, -0.53765869140625, -0.261474609375, 0.01470947265625, 0.2908935546875, 0.56707763671875, 0.84326171875, 1.11944580078125, 1.3956298828125, 1.67181396484375, 1.947998046875, 2.22418212890625, 2.5003662109375, 2.77655029296875, 3.052734375, 3.32891845703125, 3.6051025390625, 3.88128662109375, 4.157470703125, 4.43365478515625, 4.7098388671875, 4.98602294921875, 5.26220703125, 5.53839111328125, 5.8145751953125, 6.09075927734375, 6.366943359375, 6.64312744140625, 6.9193115234375, 7.19549560546875, 7.4716796875, 7.74786376953125, 8.0240478515625, 8.30023193359375, 8.576416015625, 8.85260009765625, 9.1287841796875, 9.40496826171875, 9.68115234375, 9.95733642578125, 10.2335205078125, 10.50970458984375, 10.785888671875, 11.06207275390625, 11.3382568359375, 11.61444091796875, 11.890625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 12.0, 9.0, 12.0, 10.0, 10.0, 34.0, 25.0, 36.0, 48.0, 55.0, 85.0, 98.0, 81.0, 90.0, 85.0, 68.0, 56.0, 49.0, 32.0, 26.0, 20.0, 10.0, 12.0, 12.0, 5.0, 3.0, 1.0, 2.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.68359375, -0.6663055419921875, -0.649017333984375, -0.6317291259765625, -0.61444091796875, -0.5971527099609375, -0.579864501953125, -0.5625762939453125, -0.5452880859375, -0.5279998779296875, -0.510711669921875, -0.4934234619140625, -0.47613525390625, -0.4588470458984375, -0.441558837890625, -0.4242706298828125, -0.406982421875, -0.3896942138671875, -0.372406005859375, -0.3551177978515625, -0.33782958984375, -0.3205413818359375, -0.303253173828125, -0.2859649658203125, -0.2686767578125, -0.2513885498046875, -0.234100341796875, -0.2168121337890625, -0.19952392578125, -0.1822357177734375, -0.164947509765625, -0.1476593017578125, -0.13037109375, -0.1130828857421875, -0.095794677734375, -0.0785064697265625, -0.06121826171875, -0.0439300537109375, -0.026641845703125, -0.0093536376953125, 0.0079345703125, 0.0252227783203125, 0.042510986328125, 0.0597991943359375, 0.07708740234375, 0.0943756103515625, 0.111663818359375, 0.1289520263671875, 0.146240234375, 0.1635284423828125, 0.180816650390625, 0.1981048583984375, 0.21539306640625, 0.2326812744140625, 0.249969482421875, 0.2672576904296875, 0.2845458984375, 0.3018341064453125, 0.319122314453125, 0.3364105224609375, 0.35369873046875, 0.3709869384765625, 0.388275146484375, 0.4055633544921875, 0.4228515625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 11.0, 9.0, 10.0, 12.0, 31.0, 28.0, 43.0, 68.0, 76.0, 102.0, 151.0, 290.0, 500.0, 1155.0, 3282.0, 13456.0, 119528.0, 3986913.0, 55284.0, 8815.0, 2417.0, 936.0, 432.0, 209.0, 145.0, 101.0, 66.0, 67.0, 38.0, 22.0, 19.0, 20.0, 12.0, 9.0, 9.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.0234375, -2.935455322265625, -2.84747314453125, -2.759490966796875, -2.6715087890625, -2.583526611328125, -2.49554443359375, -2.407562255859375, -2.319580078125, -2.231597900390625, -2.14361572265625, -2.055633544921875, -1.9676513671875, -1.879669189453125, -1.79168701171875, -1.703704833984375, -1.61572265625, -1.527740478515625, -1.43975830078125, -1.351776123046875, -1.2637939453125, -1.175811767578125, -1.08782958984375, -0.999847412109375, -0.911865234375, -0.823883056640625, -0.73590087890625, -0.647918701171875, -0.5599365234375, -0.471954345703125, -0.38397216796875, -0.295989990234375, -0.2080078125, -0.120025634765625, -0.03204345703125, 0.055938720703125, 0.1439208984375, 0.231903076171875, 0.31988525390625, 0.407867431640625, 0.495849609375, 0.583831787109375, 0.67181396484375, 0.759796142578125, 0.8477783203125, 0.935760498046875, 1.02374267578125, 1.111724853515625, 1.19970703125, 1.287689208984375, 1.37567138671875, 1.463653564453125, 1.5516357421875, 1.639617919921875, 1.72760009765625, 1.815582275390625, 1.903564453125, 1.991546630859375, 2.07952880859375, 2.167510986328125, 2.2554931640625, 2.343475341796875, 2.43145751953125, 2.519439697265625, 2.607421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 6.0, 9.0, 16.0, 20.0, 28.0, 67.0, 147.0, 625.0, 2824.0, 177.0, 73.0, 24.0, 23.0, 11.0, 8.0, 5.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.716796875, -0.6989021301269531, -0.6810073852539062, -0.6631126403808594, -0.6452178955078125, -0.6273231506347656, -0.6094284057617188, -0.5915336608886719, -0.573638916015625, -0.5557441711425781, -0.5378494262695312, -0.5199546813964844, -0.5020599365234375, -0.4841651916503906, -0.46627044677734375, -0.4483757019042969, -0.43048095703125, -0.4125862121582031, -0.39469146728515625, -0.3767967224121094, -0.3589019775390625, -0.3410072326660156, -0.32311248779296875, -0.3052177429199219, -0.287322998046875, -0.2694282531738281, -0.25153350830078125, -0.23363876342773438, -0.2157440185546875, -0.19784927368164062, -0.17995452880859375, -0.16205978393554688, -0.1441650390625, -0.12627029418945312, -0.10837554931640625, -0.09048080444335938, -0.0725860595703125, -0.054691314697265625, -0.03679656982421875, -0.018901824951171875, -0.001007080078125, 0.016887664794921875, 0.03478240966796875, 0.052677154541015625, 0.0705718994140625, 0.08846664428710938, 0.10636138916015625, 0.12425613403320312, 0.14215087890625, 0.16004562377929688, 0.17794036865234375, 0.19583511352539062, 0.2137298583984375, 0.23162460327148438, 0.24951934814453125, 0.2674140930175781, 0.285308837890625, 0.3032035827636719, 0.32109832763671875, 0.3389930725097656, 0.3568878173828125, 0.3747825622558594, 0.39267730712890625, 0.4105720520019531, 0.428466796875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 7.0, 10.0, 17.0, 25.0, 34.0, 50.0, 75.0, 106.0, 116.0, 119.0, 123.0, 105.0, 76.0, 54.0, 31.0, 25.0, 16.0, 6.0, 6.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3647809028625488, -1.3026100397109985, -1.2404391765594482, -1.1782681941986084, -1.116097331047058, -1.0539264678955078, -0.9917556047439575, -0.9295847415924072, -0.8674138188362122, -0.8052429556846619, -0.7430720329284668, -0.6809011697769165, -0.6187303066253662, -0.5565593838691711, -0.49438852071762085, -0.43221762776374817, -0.3700467348098755, -0.3078758418560028, -0.24570496380329132, -0.18353408575057983, -0.12136319279670715, -0.05919229984283447, 0.0029785633087158203, 0.0651494562625885, 0.12732034921646118, 0.18949124217033386, 0.25166213512420654, 0.31383299827575684, 0.3760038912296295, 0.4381747841835022, 0.5003456473350525, 0.5625165700912476, 0.6246874332427979, 0.6868582963943481, 0.7490292191505432, 0.8112000823020935, 0.8733710050582886, 0.9355418682098389, 0.9977127313613892, 1.0598835945129395, 1.1220545768737793, 1.1842254400253296, 1.2463963031768799, 1.3085672855377197, 1.37073814868927, 1.4329090118408203, 1.4950798749923706, 1.557250738143921, 1.6194216012954712, 1.6815924644470215, 1.7437633275985718, 1.805934190750122, 1.868105173110962, 1.9302760362625122, 1.9924468994140625, 2.0546178817749023, 2.116788625717163, 2.178959608078003, 2.2411303520202637, 2.3033013343811035, 2.3654720783233643, 2.427643060684204, 2.489813804626465, 2.5519847869873047, 2.6141557693481445]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 3.0, 6.0, 8.0, 7.0, 11.0, 11.0, 11.0, 9.0, 17.0, 20.0, 30.0, 22.0, 21.0, 34.0, 43.0, 61.0, 38.0, 47.0, 42.0, 48.0, 41.0, 50.0, 42.0, 38.0, 40.0, 37.0, 35.0, 28.0, 29.0, 33.0, 29.0, 18.0, 22.0, 18.0, 8.0, 11.0, 7.0, 7.0, 8.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9708364605903625, -0.9387990832328796, -0.9067617058753967, -0.874724268913269, -0.8426868915557861, -0.8106495141983032, -0.7786121368408203, -0.7465747594833374, -0.7145373821258545, -0.6825000047683716, -0.6504626274108887, -0.6184252500534058, -0.5863878130912781, -0.5543504357337952, -0.5223130583763123, -0.49027568101882935, -0.45823824405670166, -0.42620086669921875, -0.39416345953941345, -0.36212608218193054, -0.33008867502212524, -0.29805129766464233, -0.2660139203071594, -0.23397652804851532, -0.20193913578987122, -0.1699017435312271, -0.137864351272583, -0.1058269739151001, -0.073789581656456, -0.04175218939781189, -0.00971481204032898, 0.022322580218315125, 0.054360032081604004, 0.08639742434024811, 0.11843480914831161, 0.15047219395637512, 0.18250958621501923, 0.21454697847366333, 0.24658435583114624, 0.27862173318862915, 0.31065914034843445, 0.34269651770591736, 0.37473392486572266, 0.40677130222320557, 0.4388086795806885, 0.4708460867404938, 0.5028834342956543, 0.534920871257782, 0.5669582486152649, 0.5989956259727478, 0.6310330033302307, 0.6630704402923584, 0.6951078176498413, 0.7271451950073242, 0.7591825723648071, 0.79121994972229, 0.823257327079773, 0.8552947044372559, 0.8873320817947388, 0.9193694591522217, 0.9514068961143494, 0.9834442734718323, 1.01548171043396, 1.0475190877914429, 1.0795564651489258]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 7.0, 4.0, 3.0, 9.0, 24.0, 17.0, 33.0, 46.0, 58.0, 95.0, 172.0, 336.0, 608.0, 1376.0, 3890.0, 14998.0, 97538.0, 652818.0, 237409.0, 29119.0, 6180.0, 2026.0, 817.0, 413.0, 212.0, 112.0, 73.0, 58.0, 34.0, 12.0, 19.0, 8.0, 5.0, 7.0, 5.0, 5.0, 2.0, 1.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.81640625, -1.7640533447265625, -1.711700439453125, -1.6593475341796875, -1.60699462890625, -1.5546417236328125, -1.502288818359375, -1.4499359130859375, -1.3975830078125, -1.3452301025390625, -1.292877197265625, -1.2405242919921875, -1.18817138671875, -1.1358184814453125, -1.083465576171875, -1.0311126708984375, -0.978759765625, -0.9264068603515625, -0.874053955078125, -0.8217010498046875, -0.76934814453125, -0.7169952392578125, -0.664642333984375, -0.6122894287109375, -0.5599365234375, -0.5075836181640625, -0.455230712890625, -0.4028778076171875, -0.35052490234375, -0.2981719970703125, -0.245819091796875, -0.1934661865234375, -0.14111328125, -0.0887603759765625, -0.036407470703125, 0.0159454345703125, 0.06829833984375, 0.1206512451171875, 0.173004150390625, 0.2253570556640625, 0.2777099609375, 0.3300628662109375, 0.382415771484375, 0.4347686767578125, 0.48712158203125, 0.5394744873046875, 0.591827392578125, 0.6441802978515625, 0.696533203125, 0.7488861083984375, 0.801239013671875, 0.8535919189453125, 0.90594482421875, 0.9582977294921875, 1.010650634765625, 1.0630035400390625, 1.1153564453125, 1.1677093505859375, 1.220062255859375, 1.2724151611328125, 1.32476806640625, 1.3771209716796875, 1.429473876953125, 1.4818267822265625, 1.5341796875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 1.0, 5.0, 5.0, 16.0, 13.0, 14.0, 10.0, 27.0, 30.0, 37.0, 42.0, 71.0, 83.0, 85.0, 86.0, 81.0, 82.0, 68.0, 64.0, 46.0, 34.0, 26.0, 27.0, 11.0, 14.0, 10.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66455078125, -0.6459121704101562, -0.6272735595703125, -0.6086349487304688, -0.589996337890625, -0.5713577270507812, -0.5527191162109375, -0.5340805053710938, -0.51544189453125, -0.49680328369140625, -0.4781646728515625, -0.45952606201171875, -0.440887451171875, -0.42224884033203125, -0.4036102294921875, -0.38497161865234375, -0.3663330078125, -0.34769439697265625, -0.3290557861328125, -0.31041717529296875, -0.291778564453125, -0.27313995361328125, -0.2545013427734375, -0.23586273193359375, -0.21722412109375, -0.19858551025390625, -0.1799468994140625, -0.16130828857421875, -0.142669677734375, -0.12403106689453125, -0.1053924560546875, -0.08675384521484375, -0.068115234375, -0.04947662353515625, -0.0308380126953125, -0.01219940185546875, 0.006439208984375, 0.02507781982421875, 0.0437164306640625, 0.06235504150390625, 0.08099365234375, 0.09963226318359375, 0.1182708740234375, 0.13690948486328125, 0.155548095703125, 0.17418670654296875, 0.1928253173828125, 0.21146392822265625, 0.2301025390625, 0.24874114990234375, 0.2673797607421875, 0.28601837158203125, 0.304656982421875, 0.32329559326171875, 0.3419342041015625, 0.36057281494140625, 0.37921142578125, 0.39785003662109375, 0.4164886474609375, 0.43512725830078125, 0.453765869140625, 0.47240447998046875, 0.4910430908203125, 0.5096817016601562, 0.5283203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 14.0, 17.0, 15.0, 22.0, 40.0, 56.0, 113.0, 179.0, 303.0, 607.0, 1521.0, 5922.0, 107157.0, 886234.0, 40057.0, 3891.0, 1208.0, 518.0, 253.0, 142.0, 93.0, 51.0, 46.0, 29.0, 21.0, 11.0, 8.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.033203125, -2.9449462890625, -2.856689453125, -2.7684326171875, -2.68017578125, -2.5919189453125, -2.503662109375, -2.4154052734375, -2.3271484375, -2.2388916015625, -2.150634765625, -2.0623779296875, -1.97412109375, -1.8858642578125, -1.797607421875, -1.7093505859375, -1.62109375, -1.5328369140625, -1.444580078125, -1.3563232421875, -1.26806640625, -1.1798095703125, -1.091552734375, -1.0032958984375, -0.9150390625, -0.8267822265625, -0.738525390625, -0.6502685546875, -0.56201171875, -0.4737548828125, -0.385498046875, -0.2972412109375, -0.208984375, -0.1207275390625, -0.032470703125, 0.0557861328125, 0.14404296875, 0.2322998046875, 0.320556640625, 0.4088134765625, 0.4970703125, 0.5853271484375, 0.673583984375, 0.7618408203125, 0.85009765625, 0.9383544921875, 1.026611328125, 1.1148681640625, 1.203125, 1.2913818359375, 1.379638671875, 1.4678955078125, 1.55615234375, 1.6444091796875, 1.732666015625, 1.8209228515625, 1.9091796875, 1.9974365234375, 2.085693359375, 2.1739501953125, 2.26220703125, 2.3504638671875, 2.438720703125, 2.5269775390625, 2.615234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 15.0, 15.0, 20.0, 19.0, 15.0, 33.0, 49.0, 50.0, 52.0, 56.0, 50.0, 46.0, 63.0, 76.0, 68.0, 50.0, 52.0, 50.0, 49.0, 34.0, 21.0, 34.0, 21.0, 14.0, 13.0, 12.0, 5.0, 7.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.88671875, -2.796661376953125, -2.70660400390625, -2.616546630859375, -2.5264892578125, -2.436431884765625, -2.34637451171875, -2.256317138671875, -2.166259765625, -2.076202392578125, -1.98614501953125, -1.896087646484375, -1.8060302734375, -1.715972900390625, -1.62591552734375, -1.535858154296875, -1.44580078125, -1.355743408203125, -1.26568603515625, -1.175628662109375, -1.0855712890625, -0.995513916015625, -0.90545654296875, -0.815399169921875, -0.725341796875, -0.635284423828125, -0.54522705078125, -0.455169677734375, -0.3651123046875, -0.275054931640625, -0.18499755859375, -0.094940185546875, -0.0048828125, 0.085174560546875, 0.17523193359375, 0.265289306640625, 0.3553466796875, 0.445404052734375, 0.53546142578125, 0.625518798828125, 0.715576171875, 0.805633544921875, 0.89569091796875, 0.985748291015625, 1.0758056640625, 1.165863037109375, 1.25592041015625, 1.345977783203125, 1.43603515625, 1.526092529296875, 1.61614990234375, 1.706207275390625, 1.7962646484375, 1.886322021484375, 1.97637939453125, 2.066436767578125, 2.156494140625, 2.246551513671875, 2.33660888671875, 2.426666259765625, 2.5167236328125, 2.606781005859375, 2.69683837890625, 2.786895751953125, 2.876953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 4.0, 11.0, 19.0, 15.0, 22.0, 37.0, 53.0, 120.0, 190.0, 403.0, 1028.0, 4065.0, 47713.0, 918499.0, 69311.0, 4876.0, 1205.0, 430.0, 234.0, 107.0, 67.0, 37.0, 25.0, 15.0, 13.0, 11.0, 9.0, 7.0, 4.0, 5.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5615234375, -1.5086822509765625, -1.455841064453125, -1.4029998779296875, -1.35015869140625, -1.2973175048828125, -1.244476318359375, -1.1916351318359375, -1.1387939453125, -1.0859527587890625, -1.033111572265625, -0.9802703857421875, -0.92742919921875, -0.8745880126953125, -0.821746826171875, -0.7689056396484375, -0.716064453125, -0.6632232666015625, -0.610382080078125, -0.5575408935546875, -0.50469970703125, -0.4518585205078125, -0.399017333984375, -0.3461761474609375, -0.2933349609375, -0.2404937744140625, -0.187652587890625, -0.1348114013671875, -0.08197021484375, -0.0291290283203125, 0.023712158203125, 0.0765533447265625, 0.12939453125, 0.1822357177734375, 0.235076904296875, 0.2879180908203125, 0.34075927734375, 0.3936004638671875, 0.446441650390625, 0.4992828369140625, 0.5521240234375, 0.6049652099609375, 0.657806396484375, 0.7106475830078125, 0.76348876953125, 0.8163299560546875, 0.869171142578125, 0.9220123291015625, 0.974853515625, 1.0276947021484375, 1.080535888671875, 1.1333770751953125, 1.18621826171875, 1.2390594482421875, 1.291900634765625, 1.3447418212890625, 1.3975830078125, 1.4504241943359375, 1.503265380859375, 1.5561065673828125, 1.60894775390625, 1.6617889404296875, 1.714630126953125, 1.7674713134765625, 1.8203125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 7.0, 4.0, 11.0, 13.0, 21.0, 32.0, 44.0, 49.0, 63.0, 76.0, 106.0, 112.0, 116.0, 83.0, 69.0, 41.0, 40.0, 31.0, 34.0, 9.0, 9.0, 7.0, 6.0, 6.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010001659393310547, -9.610876441001892e-05, -9.220093488693237e-05, -8.829310536384583e-05, -8.438527584075928e-05, -8.047744631767273e-05, -7.656961679458618e-05, -7.266178727149963e-05, -6.875395774841309e-05, -6.484612822532654e-05, -6.093829870223999e-05, -5.703046917915344e-05, -5.3122639656066895e-05, -4.921481013298035e-05, -4.53069806098938e-05, -4.139915108680725e-05, -3.74913215637207e-05, -3.3583492040634155e-05, -2.9675662517547607e-05, -2.576783299446106e-05, -2.1860003471374512e-05, -1.7952173948287964e-05, -1.4044344425201416e-05, -1.0136514902114868e-05, -6.22868537902832e-06, -2.3208558559417725e-06, 1.5869736671447754e-06, 5.494803190231323e-06, 9.402632713317871e-06, 1.3310462236404419e-05, 1.7218291759490967e-05, 2.1126121282577515e-05, 2.5033950805664062e-05, 2.894178032875061e-05, 3.284960985183716e-05, 3.6757439374923706e-05, 4.0665268898010254e-05, 4.45730984210968e-05, 4.848092794418335e-05, 5.23887574672699e-05, 5.6296586990356445e-05, 6.020441651344299e-05, 6.411224603652954e-05, 6.802007555961609e-05, 7.192790508270264e-05, 7.583573460578918e-05, 7.974356412887573e-05, 8.365139365196228e-05, 8.755922317504883e-05, 9.146705269813538e-05, 9.537488222122192e-05, 9.928271174430847e-05, 0.00010319054126739502, 0.00010709837079048157, 0.00011100620031356812, 0.00011491402983665466, 0.00011882185935974121, 0.00012272968888282776, 0.0001266375184059143, 0.00013054534792900085, 0.0001344531774520874, 0.00013836100697517395, 0.0001422688364982605, 0.00014617666602134705, 0.0001500844955444336]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 11.0, 13.0, 20.0, 34.0, 59.0, 89.0, 187.0, 412.0, 1037.0, 3604.0, 25811.0, 827105.0, 178200.0, 8739.0, 1920.0, 683.0, 286.0, 136.0, 73.0, 38.0, 24.0, 13.0, 20.0, 9.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.578125, -1.5232696533203125, -1.468414306640625, -1.4135589599609375, -1.35870361328125, -1.3038482666015625, -1.248992919921875, -1.1941375732421875, -1.1392822265625, -1.0844268798828125, -1.029571533203125, -0.9747161865234375, -0.91986083984375, -0.8650054931640625, -0.810150146484375, -0.7552947998046875, -0.700439453125, -0.6455841064453125, -0.590728759765625, -0.5358734130859375, -0.48101806640625, -0.4261627197265625, -0.371307373046875, -0.3164520263671875, -0.2615966796875, -0.2067413330078125, -0.151885986328125, -0.0970306396484375, -0.04217529296875, 0.0126800537109375, 0.067535400390625, 0.1223907470703125, 0.17724609375, 0.2321014404296875, 0.286956787109375, 0.3418121337890625, 0.39666748046875, 0.4515228271484375, 0.506378173828125, 0.5612335205078125, 0.6160888671875, 0.6709442138671875, 0.725799560546875, 0.7806549072265625, 0.83551025390625, 0.8903656005859375, 0.945220947265625, 1.0000762939453125, 1.054931640625, 1.1097869873046875, 1.164642333984375, 1.2194976806640625, 1.27435302734375, 1.3292083740234375, 1.384063720703125, 1.4389190673828125, 1.4937744140625, 1.5486297607421875, 1.603485107421875, 1.6583404541015625, 1.71319580078125, 1.7680511474609375, 1.822906494140625, 1.8777618408203125, 1.9326171875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 9.0, 15.0, 12.0, 34.0, 48.0, 70.0, 110.0, 137.0, 141.0, 106.0, 93.0, 70.0, 70.0, 33.0, 16.0, 8.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2705078125, -1.225677490234375, -1.18084716796875, -1.136016845703125, -1.0911865234375, -1.046356201171875, -1.00152587890625, -0.956695556640625, -0.911865234375, -0.867034912109375, -0.82220458984375, -0.777374267578125, -0.7325439453125, -0.687713623046875, -0.64288330078125, -0.598052978515625, -0.55322265625, -0.508392333984375, -0.46356201171875, -0.418731689453125, -0.3739013671875, -0.329071044921875, -0.28424072265625, -0.239410400390625, -0.194580078125, -0.149749755859375, -0.10491943359375, -0.060089111328125, -0.0152587890625, 0.029571533203125, 0.07440185546875, 0.119232177734375, 0.1640625, 0.208892822265625, 0.25372314453125, 0.298553466796875, 0.3433837890625, 0.388214111328125, 0.43304443359375, 0.477874755859375, 0.522705078125, 0.567535400390625, 0.61236572265625, 0.657196044921875, 0.7020263671875, 0.746856689453125, 0.79168701171875, 0.836517333984375, 0.88134765625, 0.926177978515625, 0.97100830078125, 1.015838623046875, 1.0606689453125, 1.105499267578125, 1.15032958984375, 1.195159912109375, 1.239990234375, 1.284820556640625, 1.32965087890625, 1.374481201171875, 1.4193115234375, 1.464141845703125, 1.50897216796875, 1.553802490234375, 1.5986328125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [4.0, 3.0, 9.0, 86.0, 364.0, 400.0, 115.0, 21.0, 4.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.907175064086914, -5.5349040031433105, -4.162632942199707, -2.7903618812561035, -1.4180908203125, -0.045819759368896484, 1.326451301574707, 2.6987228393554688, 4.070993423461914, 5.443264484405518, 6.815535545349121, 8.187807083129883, 9.560077667236328, 10.932348251342773, 12.304619789123535, 13.676891326904297, 15.049161911010742, 16.421432495117188, 17.793704986572266, 19.16597557067871, 20.538246154785156, 21.9105167388916, 23.282787322998047, 24.655059814453125, 26.02733039855957, 27.399600982666016, 28.771873474121094, 30.14414405822754, 31.516414642333984, 32.88868713378906, 34.260955810546875, 35.63322830200195, 37.00550079345703, 38.37777328491211, 39.75004196166992, 41.122314453125, 42.49458312988281, 43.86685562133789, 45.23912811279297, 46.61139678955078, 47.98366928100586, 49.35594177246094, 50.72821044921875, 52.10048294067383, 53.472755432128906, 54.84502410888672, 56.2172966003418, 57.589569091796875, 58.96183776855469, 60.334110260009766, 61.70637893676758, 63.078651428222656, 64.45092010498047, 65.82319641113281, 67.19546508789062, 68.56773376464844, 69.94000244140625, 71.31227111816406, 72.6845474243164, 74.05681610107422, 75.42908477783203, 76.80136108398438, 78.17362976074219, 79.5458984375, 80.91817474365234]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 7.0, 8.0, 10.0, 18.0, 19.0, 13.0, 29.0, 28.0, 33.0, 27.0, 39.0, 41.0, 45.0, 41.0, 54.0, 36.0, 53.0, 47.0, 49.0, 51.0, 43.0, 34.0, 31.0, 38.0, 31.0, 35.0, 20.0, 14.0, 18.0, 16.0, 11.0, 12.0, 15.0, 8.0, 4.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.314973831176758, -8.042481422424316, -7.769989967346191, -7.49749755859375, -7.225005626678467, -6.952513694763184, -6.680021286010742, -6.407529354095459, -6.135037422180176, -5.862545490264893, -5.590053558349609, -5.317561149597168, -5.045069217681885, -4.772577285766602, -4.50008487701416, -4.227592945098877, -3.9551010131835938, -3.6826090812683105, -3.4101169109344482, -3.137624740600586, -2.8651328086853027, -2.5926408767700195, -2.3201487064361572, -2.047656536102295, -1.7751646041870117, -1.502672553062439, -1.2301805019378662, -0.9576884508132935, -0.6851963996887207, -0.41270434856414795, -0.1402122974395752, 0.13227975368499756, 0.4047718048095703, 0.6772638559341431, 0.9497559070587158, 1.2222479581832886, 1.4947400093078613, 1.767232060432434, 2.039724111557007, 2.312216281890869, 2.5847082138061523, 2.8572001457214355, 3.129692316055298, 3.40218448638916, 3.6746764183044434, 3.9471683502197266, 4.219660758972168, 4.492152690887451, 4.764644622802734, 5.037136554718018, 5.309628486633301, 5.582120895385742, 5.854612827301025, 6.127104759216309, 6.39959716796875, 6.672089099884033, 6.944581031799316, 7.2170729637146, 7.489564895629883, 7.762057304382324, 8.034549713134766, 8.30704116821289, 8.579533576965332, 8.852025032043457, 9.124517440795898]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 9.0, 5.0, 5.0, 6.0, 16.0, 42.0, 85.0, 149.0, 351.0, 977.0, 4549.0, 77850.0, 4081546.0, 24864.0, 2655.0, 640.0, 252.0, 129.0, 84.0, 25.0, 21.0, 11.0, 5.0, 2.0, 6.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.322265625, -2.213470458984375, -2.10467529296875, -1.995880126953125, -1.8870849609375, -1.778289794921875, -1.66949462890625, -1.560699462890625, -1.451904296875, -1.343109130859375, -1.23431396484375, -1.125518798828125, -1.0167236328125, -0.907928466796875, -0.79913330078125, -0.690338134765625, -0.58154296875, -0.472747802734375, -0.36395263671875, -0.255157470703125, -0.1463623046875, -0.037567138671875, 0.07122802734375, 0.180023193359375, 0.288818359375, 0.397613525390625, 0.50640869140625, 0.615203857421875, 0.7239990234375, 0.832794189453125, 0.94158935546875, 1.050384521484375, 1.1591796875, 1.267974853515625, 1.37677001953125, 1.485565185546875, 1.5943603515625, 1.703155517578125, 1.81195068359375, 1.920745849609375, 2.029541015625, 2.138336181640625, 2.24713134765625, 2.355926513671875, 2.4647216796875, 2.573516845703125, 2.68231201171875, 2.791107177734375, 2.89990234375, 3.008697509765625, 3.11749267578125, 3.226287841796875, 3.3350830078125, 3.443878173828125, 3.55267333984375, 3.661468505859375, 3.770263671875, 3.879058837890625, 3.98785400390625, 4.096649169921875, 4.2054443359375, 4.314239501953125, 4.42303466796875, 4.531829833984375, 4.640625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 9.0, 11.0, 18.0, 10.0, 8.0, 33.0, 55.0, 60.0, 82.0, 123.0, 103.0, 107.0, 97.0, 89.0, 52.0, 44.0, 32.0, 20.0, 14.0, 7.0, 8.0, 4.0, 12.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9404296875, -0.9162673950195312, -0.8921051025390625, -0.8679428100585938, -0.843780517578125, -0.8196182250976562, -0.7954559326171875, -0.7712936401367188, -0.74713134765625, -0.7229690551757812, -0.6988067626953125, -0.6746444702148438, -0.650482177734375, -0.6263198852539062, -0.6021575927734375, -0.5779953002929688, -0.5538330078125, -0.5296707153320312, -0.5055084228515625, -0.48134613037109375, -0.457183837890625, -0.43302154541015625, -0.4088592529296875, -0.38469696044921875, -0.36053466796875, -0.33637237548828125, -0.3122100830078125, -0.28804779052734375, -0.263885498046875, -0.23972320556640625, -0.2155609130859375, -0.19139862060546875, -0.167236328125, -0.14307403564453125, -0.1189117431640625, -0.09474945068359375, -0.070587158203125, -0.04642486572265625, -0.0222625732421875, 0.00189971923828125, 0.02606201171875, 0.05022430419921875, 0.0743865966796875, 0.09854888916015625, 0.122711181640625, 0.14687347412109375, 0.1710357666015625, 0.19519805908203125, 0.2193603515625, 0.24352264404296875, 0.2676849365234375, 0.29184722900390625, 0.316009521484375, 0.34017181396484375, 0.3643341064453125, 0.38849639892578125, 0.41265869140625, 0.43682098388671875, 0.4609832763671875, 0.48514556884765625, 0.509307861328125, 0.5334701538085938, 0.5576324462890625, 0.5817947387695312, 0.60595703125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 5.0, 7.0, 12.0, 19.0, 19.0, 26.0, 51.0, 54.0, 102.0, 139.0, 232.0, 384.0, 670.0, 1123.0, 2284.0, 5189.0, 13064.0, 41481.0, 212586.0, 3572672.0, 270757.0, 47754.0, 14437.0, 5668.0, 2470.0, 1253.0, 666.0, 398.0, 277.0, 154.0, 105.0, 68.0, 44.0, 41.0, 15.0, 14.0, 4.0, 18.0, 3.0, 2.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.98681640625, -0.9555435180664062, -0.9242706298828125, -0.8929977416992188, -0.861724853515625, -0.8304519653320312, -0.7991790771484375, -0.7679061889648438, -0.73663330078125, -0.7053604125976562, -0.6740875244140625, -0.6428146362304688, -0.611541748046875, -0.5802688598632812, -0.5489959716796875, -0.5177230834960938, -0.4864501953125, -0.45517730712890625, -0.4239044189453125, -0.39263153076171875, -0.361358642578125, -0.33008575439453125, -0.2988128662109375, -0.26753997802734375, -0.23626708984375, -0.20499420166015625, -0.1737213134765625, -0.14244842529296875, -0.111175537109375, -0.07990264892578125, -0.0486297607421875, -0.01735687255859375, 0.013916015625, 0.04518890380859375, 0.0764617919921875, 0.10773468017578125, 0.139007568359375, 0.17028045654296875, 0.2015533447265625, 0.23282623291015625, 0.26409912109375, 0.29537200927734375, 0.3266448974609375, 0.35791778564453125, 0.389190673828125, 0.42046356201171875, 0.4517364501953125, 0.48300933837890625, 0.5142822265625, 0.5455551147460938, 0.5768280029296875, 0.6081008911132812, 0.639373779296875, 0.6706466674804688, 0.7019195556640625, 0.7331924438476562, 0.76446533203125, 0.7957382202148438, 0.8270111083984375, 0.8582839965820312, 0.889556884765625, 0.9208297729492188, 0.9521026611328125, 0.9833755493164062, 1.0146484375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 7.0, 5.0, 4.0, 8.0, 10.0, 22.0, 25.0, 44.0, 50.0, 82.0, 138.0, 217.0, 612.0, 2102.0, 291.0, 171.0, 98.0, 58.0, 37.0, 21.0, 20.0, 17.0, 7.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.37060546875, -0.3559112548828125, -0.341217041015625, -0.3265228271484375, -0.31182861328125, -0.2971343994140625, -0.282440185546875, -0.2677459716796875, -0.2530517578125, -0.2383575439453125, -0.223663330078125, -0.2089691162109375, -0.19427490234375, -0.1795806884765625, -0.164886474609375, -0.1501922607421875, -0.135498046875, -0.1208038330078125, -0.106109619140625, -0.0914154052734375, -0.07672119140625, -0.0620269775390625, -0.047332763671875, -0.0326385498046875, -0.0179443359375, -0.0032501220703125, 0.011444091796875, 0.0261383056640625, 0.04083251953125, 0.0555267333984375, 0.070220947265625, 0.0849151611328125, 0.099609375, 0.1143035888671875, 0.128997802734375, 0.1436920166015625, 0.15838623046875, 0.1730804443359375, 0.187774658203125, 0.2024688720703125, 0.2171630859375, 0.2318572998046875, 0.246551513671875, 0.2612457275390625, 0.27593994140625, 0.2906341552734375, 0.305328369140625, 0.3200225830078125, 0.334716796875, 0.3494110107421875, 0.364105224609375, 0.3787994384765625, 0.39349365234375, 0.4081878662109375, 0.422882080078125, 0.4375762939453125, 0.4522705078125, 0.4669647216796875, 0.481658935546875, 0.4963531494140625, 0.51104736328125, 0.5257415771484375, 0.540435791015625, 0.5551300048828125, 0.56982421875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 12.0, 21.0, 22.0, 54.0, 92.0, 128.0, 161.0, 163.0, 156.0, 89.0, 35.0, 21.0, 15.0, 12.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.486344337463379, -4.369661808013916, -4.252979278564453, -4.136297225952148, -4.0196146965026855, -3.9029321670532227, -3.7862496376037598, -3.669567346572876, -3.552884817123413, -3.43620228767395, -3.3195199966430664, -3.2028374671936035, -3.0861551761627197, -2.969472646713257, -2.852790355682373, -2.73610782623291, -2.6194252967834473, -2.5027427673339844, -2.3860604763031006, -2.2693779468536377, -2.152695655822754, -2.036013126373291, -1.9193307161331177, -1.8026483058929443, -1.6859660148620605, -1.5692836046218872, -1.4526011943817139, -1.335918664932251, -1.2192362546920776, -1.1025538444519043, -0.985871434211731, -0.8691889643669128, -0.7525064945220947, -0.6358240842819214, -0.5191416144371033, -0.40245920419692993, -0.2857767641544342, -0.16909432411193848, -0.05241191387176514, 0.06427055597305298, 0.18095296621322632, 0.29763540625572205, 0.4143178462982178, 0.5310002565383911, 0.6476826667785645, 0.7643651366233826, 0.8810475468635559, 0.997730016708374, 1.1144124269485474, 1.2310948371887207, 1.347777247428894, 1.4644596576690674, 1.5811421871185303, 1.6978245973587036, 1.814507007598877, 1.9311895370483398, 2.0478718280792236, 2.1645543575286865, 2.2812366485595703, 2.397919178009033, 2.514601469039917, 2.63128399848938, 2.7479662895202637, 2.8646488189697266, 2.9813313484191895]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 10.0, 5.0, 7.0, 5.0, 11.0, 9.0, 19.0, 14.0, 21.0, 12.0, 40.0, 32.0, 42.0, 32.0, 36.0, 48.0, 51.0, 49.0, 40.0, 43.0, 44.0, 47.0, 46.0, 39.0, 32.0, 34.0, 36.0, 42.0, 30.0, 32.0, 15.0, 14.0, 11.0, 11.0, 9.0, 4.0, 6.0, 9.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.395074486732483, -1.343608021736145, -1.2921415567398071, -1.2406750917434692, -1.189208745956421, -1.137742280960083, -1.0862758159637451, -1.0348093509674072, -0.9833428859710693, -0.9318764209747314, -0.8804099559783936, -0.8289435505867004, -0.7774770855903625, -0.7260106205940247, -0.6745442152023315, -0.6230777502059937, -0.5716112852096558, -0.5201448202133179, -0.46867838501930237, -0.41721194982528687, -0.365745484828949, -0.3142790198326111, -0.2628125846385956, -0.21134614944458008, -0.1598796844482422, -0.10841323435306549, -0.056946784257888794, -0.005480334162712097, 0.0459861159324646, 0.09745258092880249, 0.148919016122818, 0.2003854513168335, 0.25185203552246094, 0.30331850051879883, 0.35478493571281433, 0.40625137090682983, 0.4577178359031677, 0.5091843008995056, 0.5606507062911987, 0.6121171712875366, 0.6635836362838745, 0.7150501012802124, 0.7665165662765503, 0.8179829716682434, 0.8694494366645813, 0.9209159016609192, 0.9723823070526123, 1.0238487720489502, 1.075315237045288, 1.126781702041626, 1.1782481670379639, 1.2297146320343018, 1.2811810970306396, 1.3326475620269775, 1.3841139078140259, 1.4355803728103638, 1.4870468378067017, 1.5385133028030396, 1.5899797677993774, 1.6414462327957153, 1.6929125785827637, 1.7443790435791016, 1.7958455085754395, 1.8473119735717773, 1.8987784385681152]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 4.0, 12.0, 9.0, 10.0, 22.0, 19.0, 40.0, 81.0, 130.0, 244.0, 450.0, 1121.0, 2885.0, 9750.0, 43321.0, 246839.0, 578945.0, 130105.0, 24620.0, 6227.0, 2072.0, 803.0, 363.0, 210.0, 95.0, 70.0, 38.0, 25.0, 14.0, 12.0, 7.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.80859375, -1.7613983154296875, -1.714202880859375, -1.6670074462890625, -1.61981201171875, -1.5726165771484375, -1.525421142578125, -1.4782257080078125, -1.4310302734375, -1.3838348388671875, -1.336639404296875, -1.2894439697265625, -1.24224853515625, -1.1950531005859375, -1.147857666015625, -1.1006622314453125, -1.053466796875, -1.0062713623046875, -0.959075927734375, -0.9118804931640625, -0.86468505859375, -0.8174896240234375, -0.770294189453125, -0.7230987548828125, -0.6759033203125, -0.6287078857421875, -0.581512451171875, -0.5343170166015625, -0.48712158203125, -0.4399261474609375, -0.392730712890625, -0.3455352783203125, -0.29833984375, -0.2511444091796875, -0.203948974609375, -0.1567535400390625, -0.10955810546875, -0.0623626708984375, -0.015167236328125, 0.0320281982421875, 0.0792236328125, 0.1264190673828125, 0.173614501953125, 0.2208099365234375, 0.26800537109375, 0.3152008056640625, 0.362396240234375, 0.4095916748046875, 0.456787109375, 0.5039825439453125, 0.551177978515625, 0.5983734130859375, 0.64556884765625, 0.6927642822265625, 0.739959716796875, 0.7871551513671875, 0.8343505859375, 0.8815460205078125, 0.928741455078125, 0.9759368896484375, 1.02313232421875, 1.0703277587890625, 1.117523193359375, 1.1647186279296875, 1.2119140625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 10.0, 3.0, 2.0, 8.0, 13.0, 15.0, 20.0, 25.0, 45.0, 49.0, 63.0, 73.0, 79.0, 91.0, 96.0, 83.0, 89.0, 69.0, 43.0, 32.0, 19.0, 24.0, 16.0, 13.0, 9.0, 10.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.84228515625, -0.82122802734375, -0.8001708984375, -0.77911376953125, -0.758056640625, -0.73699951171875, -0.7159423828125, -0.69488525390625, -0.673828125, -0.65277099609375, -0.6317138671875, -0.61065673828125, -0.589599609375, -0.56854248046875, -0.5474853515625, -0.52642822265625, -0.50537109375, -0.48431396484375, -0.4632568359375, -0.44219970703125, -0.421142578125, -0.40008544921875, -0.3790283203125, -0.35797119140625, -0.3369140625, -0.31585693359375, -0.2947998046875, -0.27374267578125, -0.252685546875, -0.23162841796875, -0.2105712890625, -0.18951416015625, -0.16845703125, -0.14739990234375, -0.1263427734375, -0.10528564453125, -0.084228515625, -0.06317138671875, -0.0421142578125, -0.02105712890625, 0.0, 0.02105712890625, 0.0421142578125, 0.06317138671875, 0.084228515625, 0.10528564453125, 0.1263427734375, 0.14739990234375, 0.16845703125, 0.18951416015625, 0.2105712890625, 0.23162841796875, 0.252685546875, 0.27374267578125, 0.2947998046875, 0.31585693359375, 0.3369140625, 0.35797119140625, 0.3790283203125, 0.40008544921875, 0.421142578125, 0.44219970703125, 0.4632568359375, 0.48431396484375, 0.50537109375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 8.0, 3.0, 6.0, 7.0, 10.0, 11.0, 27.0, 23.0, 33.0, 55.0, 86.0, 117.0, 183.0, 246.0, 402.0, 850.0, 2090.0, 7330.0, 60843.0, 777041.0, 179297.0, 14177.0, 3034.0, 1152.0, 590.0, 344.0, 167.0, 133.0, 93.0, 65.0, 20.0, 28.0, 22.0, 19.0, 8.0, 8.0, 5.0, 5.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.244140625, -2.17547607421875, -2.1068115234375, -2.03814697265625, -1.969482421875, -1.90081787109375, -1.8321533203125, -1.76348876953125, -1.69482421875, -1.62615966796875, -1.5574951171875, -1.48883056640625, -1.420166015625, -1.35150146484375, -1.2828369140625, -1.21417236328125, -1.1455078125, -1.07684326171875, -1.0081787109375, -0.93951416015625, -0.870849609375, -0.80218505859375, -0.7335205078125, -0.66485595703125, -0.59619140625, -0.52752685546875, -0.4588623046875, -0.39019775390625, -0.321533203125, -0.25286865234375, -0.1842041015625, -0.11553955078125, -0.046875, 0.02178955078125, 0.0904541015625, 0.15911865234375, 0.227783203125, 0.29644775390625, 0.3651123046875, 0.43377685546875, 0.50244140625, 0.57110595703125, 0.6397705078125, 0.70843505859375, 0.777099609375, 0.84576416015625, 0.9144287109375, 0.98309326171875, 1.0517578125, 1.12042236328125, 1.1890869140625, 1.25775146484375, 1.326416015625, 1.39508056640625, 1.4637451171875, 1.53240966796875, 1.60107421875, 1.66973876953125, 1.7384033203125, 1.80706787109375, 1.875732421875, 1.94439697265625, 2.0130615234375, 2.08172607421875, 2.150390625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 4.0, 6.0, 10.0, 12.0, 11.0, 11.0, 16.0, 22.0, 16.0, 28.0, 26.0, 35.0, 38.0, 36.0, 42.0, 48.0, 48.0, 57.0, 38.0, 57.0, 65.0, 39.0, 48.0, 45.0, 46.0, 35.0, 26.0, 23.0, 13.0, 19.0, 14.0, 12.0, 8.0, 11.0, 5.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.89453125, -1.8339080810546875, -1.773284912109375, -1.7126617431640625, -1.65203857421875, -1.5914154052734375, -1.530792236328125, -1.4701690673828125, -1.4095458984375, -1.3489227294921875, -1.288299560546875, -1.2276763916015625, -1.16705322265625, -1.1064300537109375, -1.045806884765625, -0.9851837158203125, -0.924560546875, -0.8639373779296875, -0.803314208984375, -0.7426910400390625, -0.68206787109375, -0.6214447021484375, -0.560821533203125, -0.5001983642578125, -0.4395751953125, -0.3789520263671875, -0.318328857421875, -0.2577056884765625, -0.19708251953125, -0.1364593505859375, -0.075836181640625, -0.0152130126953125, 0.04541015625, 0.1060333251953125, 0.166656494140625, 0.2272796630859375, 0.28790283203125, 0.3485260009765625, 0.409149169921875, 0.4697723388671875, 0.5303955078125, 0.5910186767578125, 0.651641845703125, 0.7122650146484375, 0.77288818359375, 0.8335113525390625, 0.894134521484375, 0.9547576904296875, 1.015380859375, 1.0760040283203125, 1.136627197265625, 1.1972503662109375, 1.25787353515625, 1.3184967041015625, 1.379119873046875, 1.4397430419921875, 1.5003662109375, 1.5609893798828125, 1.621612548828125, 1.6822357177734375, 1.74285888671875, 1.8034820556640625, 1.864105224609375, 1.9247283935546875, 1.9853515625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 8.0, 7.0, 17.0, 15.0, 27.0, 56.0, 129.0, 277.0, 753.0, 3022.0, 26744.0, 809715.0, 196744.0, 8667.0, 1529.0, 478.0, 168.0, 89.0, 54.0, 23.0, 14.0, 7.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1103515625, -1.07647705078125, -1.0426025390625, -1.00872802734375, -0.974853515625, -0.94097900390625, -0.9071044921875, -0.87322998046875, -0.83935546875, -0.80548095703125, -0.7716064453125, -0.73773193359375, -0.703857421875, -0.66998291015625, -0.6361083984375, -0.60223388671875, -0.568359375, -0.53448486328125, -0.5006103515625, -0.46673583984375, -0.432861328125, -0.39898681640625, -0.3651123046875, -0.33123779296875, -0.29736328125, -0.26348876953125, -0.2296142578125, -0.19573974609375, -0.161865234375, -0.12799072265625, -0.0941162109375, -0.06024169921875, -0.0263671875, 0.00750732421875, 0.0413818359375, 0.07525634765625, 0.109130859375, 0.14300537109375, 0.1768798828125, 0.21075439453125, 0.24462890625, 0.27850341796875, 0.3123779296875, 0.34625244140625, 0.380126953125, 0.41400146484375, 0.4478759765625, 0.48175048828125, 0.515625, 0.54949951171875, 0.5833740234375, 0.61724853515625, 0.651123046875, 0.68499755859375, 0.7188720703125, 0.75274658203125, 0.78662109375, 0.82049560546875, 0.8543701171875, 0.88824462890625, 0.922119140625, 0.95599365234375, 0.9898681640625, 1.02374267578125, 1.0576171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 0.0, 3.0, 8.0, 6.0, 6.0, 11.0, 12.0, 15.0, 14.0, 18.0, 24.0, 24.0, 22.0, 23.0, 47.0, 32.0, 43.0, 72.0, 96.0, 84.0, 89.0, 60.0, 45.0, 36.0, 32.0, 38.0, 23.0, 21.0, 18.0, 20.0, 15.0, 11.0, 11.0, 5.0, 1.0, 7.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.988380432128906e-05, -8.699577301740646e-05, -8.410774171352386e-05, -8.121971040964127e-05, -7.833167910575867e-05, -7.544364780187607e-05, -7.255561649799347e-05, -6.966758519411087e-05, -6.677955389022827e-05, -6.389152258634567e-05, -6.1003491282463074e-05, -5.8115459978580475e-05, -5.5227428674697876e-05, -5.233939737081528e-05, -4.945136606693268e-05, -4.656333476305008e-05, -4.367530345916748e-05, -4.078727215528488e-05, -3.789924085140228e-05, -3.5011209547519684e-05, -3.2123178243637085e-05, -2.9235146939754486e-05, -2.6347115635871887e-05, -2.345908433198929e-05, -2.057105302810669e-05, -1.768302172422409e-05, -1.4794990420341492e-05, -1.1906959116458893e-05, -9.018927812576294e-06, -6.130896508693695e-06, -3.242865204811096e-06, -3.548339009284973e-07, 2.5331974029541016e-06, 5.4212287068367004e-06, 8.3092600107193e-06, 1.1197291314601898e-05, 1.4085322618484497e-05, 1.6973353922367096e-05, 1.9861385226249695e-05, 2.2749416530132294e-05, 2.5637447834014893e-05, 2.852547913789749e-05, 3.141351044178009e-05, 3.430154174566269e-05, 3.718957304954529e-05, 4.007760435342789e-05, 4.2965635657310486e-05, 4.5853666961193085e-05, 4.8741698265075684e-05, 5.162972956895828e-05, 5.451776087284088e-05, 5.740579217672348e-05, 6.029382348060608e-05, 6.318185478448868e-05, 6.606988608837128e-05, 6.895791739225388e-05, 7.184594869613647e-05, 7.473398000001907e-05, 7.762201130390167e-05, 8.051004260778427e-05, 8.339807391166687e-05, 8.628610521554947e-05, 8.917413651943207e-05, 9.206216782331467e-05, 9.495019912719727e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 14.0, 15.0, 29.0, 47.0, 63.0, 110.0, 195.0, 436.0, 1005.0, 3326.0, 25459.0, 751939.0, 251046.0, 11279.0, 2137.0, 709.0, 333.0, 170.0, 99.0, 60.0, 30.0, 19.0, 14.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0771484375, -1.044342041015625, -1.01153564453125, -0.978729248046875, -0.9459228515625, -0.913116455078125, -0.88031005859375, -0.847503662109375, -0.814697265625, -0.781890869140625, -0.74908447265625, -0.716278076171875, -0.6834716796875, -0.650665283203125, -0.61785888671875, -0.585052490234375, -0.55224609375, -0.519439697265625, -0.48663330078125, -0.453826904296875, -0.4210205078125, -0.388214111328125, -0.35540771484375, -0.322601318359375, -0.289794921875, -0.256988525390625, -0.22418212890625, -0.191375732421875, -0.1585693359375, -0.125762939453125, -0.09295654296875, -0.060150146484375, -0.02734375, 0.005462646484375, 0.03826904296875, 0.071075439453125, 0.1038818359375, 0.136688232421875, 0.16949462890625, 0.202301025390625, 0.235107421875, 0.267913818359375, 0.30072021484375, 0.333526611328125, 0.3663330078125, 0.399139404296875, 0.43194580078125, 0.464752197265625, 0.49755859375, 0.530364990234375, 0.56317138671875, 0.595977783203125, 0.6287841796875, 0.661590576171875, 0.69439697265625, 0.727203369140625, 0.760009765625, 0.792816162109375, 0.82562255859375, 0.858428955078125, 0.8912353515625, 0.924041748046875, 0.95684814453125, 0.989654541015625, 1.0224609375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 6.0, 7.0, 7.0, 14.0, 23.0, 25.0, 30.0, 40.0, 73.0, 94.0, 110.0, 129.0, 116.0, 92.0, 82.0, 51.0, 25.0, 31.0, 14.0, 8.0, 11.0, 6.0, 4.0, 4.0, 4.0, 0.0, 3.0], "bins": [-1.158203125, -1.1342811584472656, -1.1103591918945312, -1.0864372253417969, -1.0625152587890625, -1.0385932922363281, -1.0146713256835938, -0.9907493591308594, -0.966827392578125, -0.9429054260253906, -0.9189834594726562, -0.8950614929199219, -0.8711395263671875, -0.8472175598144531, -0.8232955932617188, -0.7993736267089844, -0.77545166015625, -0.7515296936035156, -0.7276077270507812, -0.7036857604980469, -0.6797637939453125, -0.6558418273925781, -0.6319198608398438, -0.6079978942871094, -0.584075927734375, -0.5601539611816406, -0.5362319946289062, -0.5123100280761719, -0.4883880615234375, -0.4644660949707031, -0.44054412841796875, -0.4166221618652344, -0.3927001953125, -0.3687782287597656, -0.34485626220703125, -0.3209342956542969, -0.2970123291015625, -0.2730903625488281, -0.24916839599609375, -0.22524642944335938, -0.201324462890625, -0.17740249633789062, -0.15348052978515625, -0.12955856323242188, -0.1056365966796875, -0.08171463012695312, -0.05779266357421875, -0.033870697021484375, -0.00994873046875, 0.013973236083984375, 0.03789520263671875, 0.061817169189453125, 0.0857391357421875, 0.10966110229492188, 0.13358306884765625, 0.15750503540039062, 0.181427001953125, 0.20534896850585938, 0.22927093505859375, 0.2531929016113281, 0.2771148681640625, 0.3010368347167969, 0.32495880126953125, 0.3488807678222656, 0.372802734375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 23.0, 79.0, 227.0, 345.0, 215.0, 80.0, 20.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.49342918395996, -17.704021453857422, -16.914615631103516, -16.125207901000977, -15.335800170898438, -14.546393394470215, -13.756986618041992, -12.967578887939453, -12.17817211151123, -11.388765335083008, -10.599357604980469, -9.809950828552246, -9.020544052124023, -8.231136322021484, -7.441729545593262, -6.652322292327881, -5.8629150390625, -5.073507785797119, -4.284100532531738, -3.4946937561035156, -2.7052865028381348, -1.915879249572754, -1.1264724731445312, -0.3370652198791504, 0.45234203338623047, 1.2417491674423218, 2.031156301498413, 2.820563316345215, 3.6099705696105957, 4.399377822875977, 5.188784599304199, 5.97819185256958, 6.767601013183594, 7.557008266448975, 8.346415519714355, 9.135822296142578, 9.925230026245117, 10.71463680267334, 11.504043579101562, 12.293451309204102, 13.082858085632324, 13.872264862060547, 14.661672592163086, 15.451079368591309, 16.24048614501953, 17.02989387512207, 17.81930160522461, 18.608707427978516, 19.398115158081055, 20.187522888183594, 20.9769287109375, 21.76633644104004, 22.555744171142578, 23.345149993896484, 24.134557723999023, 24.923965454101562, 25.71337127685547, 26.502779006958008, 27.292184829711914, 28.081592559814453, 28.871000289916992, 29.66040802001953, 30.449813842773438, 31.239221572875977, 32.028629302978516]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 8.0, 7.0, 10.0, 5.0, 10.0, 12.0, 17.0, 22.0, 17.0, 27.0, 28.0, 34.0, 47.0, 49.0, 62.0, 45.0, 40.0, 56.0, 53.0, 60.0, 66.0, 51.0, 51.0, 32.0, 38.0, 34.0, 22.0, 12.0, 15.0, 14.0, 12.0, 15.0, 6.0, 7.0, 4.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.913366317749023, -9.619521141052246, -9.325675964355469, -9.031831741333008, -8.73798656463623, -8.444141387939453, -8.150296211242676, -7.856451511383057, -7.5626068115234375, -7.26876163482666, -6.974916934967041, -6.681071758270264, -6.3872270584106445, -6.093381881713867, -5.79953670501709, -5.505692005157471, -5.211846828460693, -4.918001651763916, -4.624156951904297, -4.3303117752075195, -4.0364670753479, -3.742621898651123, -3.448776960372925, -3.1549320220947266, -2.8610870838165283, -2.56724214553833, -2.273397207260132, -1.979552149772644, -1.6857072114944458, -1.3918622732162476, -1.0980172157287598, -0.8041722774505615, -0.5103273391723633, -0.21648237109184265, 0.07736259698867798, 0.371207594871521, 0.6650525331497192, 0.9588974714279175, 1.2527425289154053, 1.5465874671936035, 1.8404324054718018, 2.13427734375, 2.4281222820281982, 2.7219672203063965, 3.015812397003174, 3.309657096862793, 3.6035022735595703, 3.8973472118377686, 4.191192150115967, 4.485037326812744, 4.778882026672363, 5.072727203369141, 5.36657190322876, 5.660417079925537, 5.954261779785156, 6.248106956481934, 6.541952133178711, 6.835797309875488, 7.129642009735107, 7.423487186431885, 7.717331886291504, 8.011177062988281, 8.305022239685059, 8.598867416381836, 8.892711639404297]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 6.0, 9.0, 14.0, 17.0, 21.0, 36.0, 64.0, 102.0, 143.0, 223.0, 444.0, 880.0, 1813.0, 4411.0, 12963.0, 49672.0, 366633.0, 3251899.0, 428027.0, 55123.0, 13511.0, 4577.0, 1896.0, 781.0, 398.0, 244.0, 120.0, 73.0, 54.0, 27.0, 16.0, 18.0, 11.0, 12.0, 8.0, 5.0, 7.0, 6.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68359375, -0.6587600708007812, -0.6339263916015625, -0.6090927124023438, -0.584259033203125, -0.5594253540039062, -0.5345916748046875, -0.5097579956054688, -0.48492431640625, -0.46009063720703125, -0.4352569580078125, -0.41042327880859375, -0.385589599609375, -0.36075592041015625, -0.3359222412109375, -0.31108856201171875, -0.2862548828125, -0.26142120361328125, -0.2365875244140625, -0.21175384521484375, -0.186920166015625, -0.16208648681640625, -0.1372528076171875, -0.11241912841796875, -0.08758544921875, -0.06275177001953125, -0.0379180908203125, -0.01308441162109375, 0.011749267578125, 0.03658294677734375, 0.0614166259765625, 0.08625030517578125, 0.111083984375, 0.13591766357421875, 0.1607513427734375, 0.18558502197265625, 0.210418701171875, 0.23525238037109375, 0.2600860595703125, 0.28491973876953125, 0.30975341796875, 0.33458709716796875, 0.3594207763671875, 0.38425445556640625, 0.409088134765625, 0.43392181396484375, 0.4587554931640625, 0.48358917236328125, 0.5084228515625, 0.5332565307617188, 0.5580902099609375, 0.5829238891601562, 0.607757568359375, 0.6325912475585938, 0.6574249267578125, 0.6822586059570312, 0.70709228515625, 0.7319259643554688, 0.7567596435546875, 0.7815933227539062, 0.806427001953125, 0.8312606811523438, 0.8560943603515625, 0.8809280395507812, 0.90576171875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 4.0, 10.0, 9.0, 14.0, 16.0, 32.0, 29.0, 51.0, 68.0, 71.0, 76.0, 77.0, 127.0, 88.0, 68.0, 80.0, 47.0, 41.0, 27.0, 19.0, 22.0, 7.0, 8.0, 8.0, 0.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75830078125, -0.7393875122070312, -0.7204742431640625, -0.7015609741210938, -0.682647705078125, -0.6637344360351562, -0.6448211669921875, -0.6259078979492188, -0.60699462890625, -0.5880813598632812, -0.5691680908203125, -0.5502548217773438, -0.531341552734375, -0.5124282836914062, -0.4935150146484375, -0.47460174560546875, -0.4556884765625, -0.43677520751953125, -0.4178619384765625, -0.39894866943359375, -0.380035400390625, -0.36112213134765625, -0.3422088623046875, -0.32329559326171875, -0.30438232421875, -0.28546905517578125, -0.2665557861328125, -0.24764251708984375, -0.228729248046875, -0.20981597900390625, -0.1909027099609375, -0.17198944091796875, -0.153076171875, -0.13416290283203125, -0.1152496337890625, -0.09633636474609375, -0.077423095703125, -0.05850982666015625, -0.0395965576171875, -0.02068328857421875, -0.00177001953125, 0.01714324951171875, 0.0360565185546875, 0.05496978759765625, 0.073883056640625, 0.09279632568359375, 0.1117095947265625, 0.13062286376953125, 0.1495361328125, 0.16844940185546875, 0.1873626708984375, 0.20627593994140625, 0.225189208984375, 0.24410247802734375, 0.2630157470703125, 0.28192901611328125, 0.30084228515625, 0.31975555419921875, 0.3386688232421875, 0.35758209228515625, 0.376495361328125, 0.39540863037109375, 0.4143218994140625, 0.43323516845703125, 0.4521484375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 6.0, 12.0, 10.0, 15.0, 27.0, 25.0, 48.0, 57.0, 101.0, 148.0, 271.0, 464.0, 963.0, 1970.0, 4260.0, 10504.0, 30689.0, 135564.0, 1444999.0, 2310902.0, 191926.0, 39172.0, 12640.0, 4830.0, 2207.0, 1073.0, 577.0, 310.0, 185.0, 103.0, 80.0, 40.0, 31.0, 23.0, 12.0, 11.0, 6.0, 3.0, 5.0, 5.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.76220703125, -0.7410888671875, -0.719970703125, -0.6988525390625, -0.677734375, -0.6566162109375, -0.635498046875, -0.6143798828125, -0.59326171875, -0.5721435546875, -0.551025390625, -0.5299072265625, -0.5087890625, -0.4876708984375, -0.466552734375, -0.4454345703125, -0.42431640625, -0.4031982421875, -0.382080078125, -0.3609619140625, -0.33984375, -0.3187255859375, -0.297607421875, -0.2764892578125, -0.25537109375, -0.2342529296875, -0.213134765625, -0.1920166015625, -0.1708984375, -0.1497802734375, -0.128662109375, -0.1075439453125, -0.08642578125, -0.0653076171875, -0.044189453125, -0.0230712890625, -0.001953125, 0.0191650390625, 0.040283203125, 0.0614013671875, 0.08251953125, 0.1036376953125, 0.124755859375, 0.1458740234375, 0.1669921875, 0.1881103515625, 0.209228515625, 0.2303466796875, 0.25146484375, 0.2725830078125, 0.293701171875, 0.3148193359375, 0.3359375, 0.3570556640625, 0.378173828125, 0.3992919921875, 0.42041015625, 0.4415283203125, 0.462646484375, 0.4837646484375, 0.5048828125, 0.5260009765625, 0.547119140625, 0.5682373046875, 0.58935546875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 4.0, 2.0, 6.0, 9.0, 11.0, 18.0, 27.0, 32.0, 56.0, 126.0, 192.0, 367.0, 675.0, 967.0, 697.0, 349.0, 227.0, 118.0, 69.0, 27.0, 26.0, 15.0, 11.0, 9.0, 7.0, 9.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.037109375, -1.0042266845703125, -0.971343994140625, -0.9384613037109375, -0.90557861328125, -0.8726959228515625, -0.839813232421875, -0.8069305419921875, -0.7740478515625, -0.7411651611328125, -0.708282470703125, -0.6753997802734375, -0.64251708984375, -0.6096343994140625, -0.576751708984375, -0.5438690185546875, -0.510986328125, -0.4781036376953125, -0.445220947265625, -0.4123382568359375, -0.37945556640625, -0.3465728759765625, -0.313690185546875, -0.2808074951171875, -0.2479248046875, -0.2150421142578125, -0.182159423828125, -0.1492767333984375, -0.11639404296875, -0.0835113525390625, -0.050628662109375, -0.0177459716796875, 0.01513671875, 0.0480194091796875, 0.080902099609375, 0.1137847900390625, 0.14666748046875, 0.1795501708984375, 0.212432861328125, 0.2453155517578125, 0.2781982421875, 0.3110809326171875, 0.343963623046875, 0.3768463134765625, 0.40972900390625, 0.4426116943359375, 0.475494384765625, 0.5083770751953125, 0.541259765625, 0.5741424560546875, 0.607025146484375, 0.6399078369140625, 0.67279052734375, 0.7056732177734375, 0.738555908203125, 0.7714385986328125, 0.8043212890625, 0.8372039794921875, 0.870086669921875, 0.9029693603515625, 0.93585205078125, 0.9687347412109375, 1.001617431640625, 1.0345001220703125, 1.0673828125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 11.0, 3.0, 12.0, 25.0, 44.0, 92.0, 149.0, 208.0, 162.0, 129.0, 89.0, 36.0, 21.0, 9.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.519721984863281, -11.229414939880371, -10.939107894897461, -10.64880084991455, -10.35849380493164, -10.06818675994873, -9.77787971496582, -9.48757266998291, -9.197265625, -8.90695858001709, -8.61665153503418, -8.32634449005127, -8.03603744506836, -7.745730400085449, -7.455423355102539, -7.165116310119629, -6.874809741973877, -6.584502696990967, -6.294195652008057, -6.0038886070251465, -5.713581562042236, -5.423274517059326, -5.132967948913574, -4.842660903930664, -4.552353858947754, -4.262046813964844, -3.9717397689819336, -3.6814327239990234, -3.3911256790161133, -3.100818634033203, -2.810511827468872, -2.520204782485962, -2.2298970222473145, -1.9395899772644043, -1.6492829322814941, -1.3589760065078735, -1.0686689615249634, -0.7783619165420532, -0.4880549907684326, -0.19774794578552246, 0.0925590991973877, 0.38286611437797546, 0.6731731295585632, 0.9634801149368286, 1.2537871599197388, 1.544094204902649, 1.8344011306762695, 2.1247081756591797, 2.41501522064209, 2.705322265625, 2.99562931060791, 3.2859363555908203, 3.5762434005737305, 3.8665504455566406, 4.156857490539551, 4.447164535522461, 4.737471580505371, 5.027778625488281, 5.318085670471191, 5.608392715454102, 5.898699760437012, 6.189006805419922, 6.479313850402832, 6.769620895385742, 7.059927463531494]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 3.0, 5.0, 10.0, 14.0, 6.0, 11.0, 16.0, 19.0, 27.0, 25.0, 18.0, 26.0, 38.0, 38.0, 45.0, 43.0, 54.0, 48.0, 50.0, 53.0, 47.0, 47.0, 38.0, 39.0, 38.0, 35.0, 32.0, 31.0, 18.0, 20.0, 18.0, 16.0, 16.0, 9.0, 11.0, 14.0, 7.0, 3.0, 3.0, 2.0, 7.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-4.58216667175293, -4.451664924621582, -4.321163654327393, -4.190661907196045, -4.060160160064697, -3.9296586513519287, -3.79915714263916, -3.6686553955078125, -3.538153886795044, -3.4076523780822754, -3.2771506309509277, -3.146649122238159, -3.0161476135253906, -2.885645866394043, -2.7551443576812744, -2.624642848968506, -2.494141101837158, -2.3636395931243896, -2.233137845993042, -2.1026363372802734, -1.9721347093582153, -1.8416330814361572, -1.7111315727233887, -1.5806299448013306, -1.4501283168792725, -1.3196266889572144, -1.1891250610351562, -1.0586235523223877, -0.9281219244003296, -0.7976202964782715, -0.6671187281608582, -0.5366171598434448, -0.4061152935028076, -0.2756136953830719, -0.14511209726333618, -0.014610499143600464, 0.11589109897613525, 0.24639272689819336, 0.3768942952156067, 0.50739586353302, 0.6378974914550781, 0.7683991193771362, 0.8989006876945496, 1.029402256011963, 1.159903883934021, 1.290405511856079, 1.4209070205688477, 1.5514086484909058, 1.6819102764129639, 1.812411904335022, 1.94291353225708, 2.0734150409698486, 2.203916549682617, 2.334418296813965, 2.4649198055267334, 2.595421314239502, 2.7259230613708496, 2.856424570083618, 2.986926317214966, 3.1174278259277344, 3.247929573059082, 3.3784310817718506, 3.508932590484619, 3.639434337615967, 3.7699358463287354]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 0.0, 5.0, 4.0, 6.0, 10.0, 8.0, 15.0, 25.0, 48.0, 77.0, 114.0, 193.0, 364.0, 645.0, 1268.0, 2477.0, 5353.0, 13145.0, 39068.0, 145327.0, 481797.0, 259412.0, 64611.0, 20312.0, 7586.0, 3294.0, 1517.0, 804.0, 430.0, 240.0, 137.0, 88.0, 54.0, 42.0, 19.0, 17.0, 12.0, 12.0, 6.0, 6.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.861328125, -0.8323287963867188, -0.8033294677734375, -0.7743301391601562, -0.745330810546875, -0.7163314819335938, -0.6873321533203125, -0.6583328247070312, -0.62933349609375, -0.6003341674804688, -0.5713348388671875, -0.5423355102539062, -0.513336181640625, -0.48433685302734375, -0.4553375244140625, -0.42633819580078125, -0.3973388671875, -0.36833953857421875, -0.3393402099609375, -0.31034088134765625, -0.281341552734375, -0.25234222412109375, -0.2233428955078125, -0.19434356689453125, -0.16534423828125, -0.13634490966796875, -0.1073455810546875, -0.07834625244140625, -0.049346923828125, -0.02034759521484375, 0.0086517333984375, 0.03765106201171875, 0.066650390625, 0.09564971923828125, 0.1246490478515625, 0.15364837646484375, 0.182647705078125, 0.21164703369140625, 0.2406463623046875, 0.26964569091796875, 0.29864501953125, 0.32764434814453125, 0.3566436767578125, 0.38564300537109375, 0.414642333984375, 0.44364166259765625, 0.4726409912109375, 0.5016403198242188, 0.5306396484375, 0.5596389770507812, 0.5886383056640625, 0.6176376342773438, 0.646636962890625, 0.6756362915039062, 0.7046356201171875, 0.7336349487304688, 0.76263427734375, 0.7916336059570312, 0.8206329345703125, 0.8496322631835938, 0.878631591796875, 0.9076309204101562, 0.9366302490234375, 0.9656295776367188, 0.99462890625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 3.0, 11.0, 7.0, 12.0, 21.0, 25.0, 34.0, 36.0, 31.0, 55.0, 50.0, 56.0, 74.0, 69.0, 70.0, 67.0, 58.0, 58.0, 46.0, 46.0, 35.0, 28.0, 21.0, 19.0, 21.0, 9.0, 8.0, 7.0, 6.0, 6.0, 0.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.56103515625, -0.5479621887207031, -0.5348892211914062, -0.5218162536621094, -0.5087432861328125, -0.4956703186035156, -0.48259735107421875, -0.4695243835449219, -0.456451416015625, -0.4433784484863281, -0.43030548095703125, -0.4172325134277344, -0.4041595458984375, -0.3910865783691406, -0.37801361083984375, -0.3649406433105469, -0.35186767578125, -0.3387947082519531, -0.32572174072265625, -0.3126487731933594, -0.2995758056640625, -0.2865028381347656, -0.27342987060546875, -0.2603569030761719, -0.247283935546875, -0.23421096801757812, -0.22113800048828125, -0.20806503295898438, -0.1949920654296875, -0.18191909790039062, -0.16884613037109375, -0.15577316284179688, -0.1427001953125, -0.12962722778320312, -0.11655426025390625, -0.10348129272460938, -0.0904083251953125, -0.07733535766601562, -0.06426239013671875, -0.051189422607421875, -0.038116455078125, -0.025043487548828125, -0.01197052001953125, 0.001102447509765625, 0.0141754150390625, 0.027248382568359375, 0.04032135009765625, 0.053394317626953125, 0.06646728515625, 0.07954025268554688, 0.09261322021484375, 0.10568618774414062, 0.1187591552734375, 0.13183212280273438, 0.14490509033203125, 0.15797805786132812, 0.171051025390625, 0.18412399291992188, 0.19719696044921875, 0.21026992797851562, 0.2233428955078125, 0.23641586303710938, 0.24948883056640625, 0.2625617980957031, 0.275634765625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 4.0, 20.0, 9.0, 30.0, 43.0, 57.0, 94.0, 173.0, 321.0, 564.0, 1390.0, 4474.0, 37987.0, 882308.0, 109981.0, 7568.0, 1861.0, 710.0, 365.0, 182.0, 136.0, 75.0, 56.0, 40.0, 27.0, 13.0, 15.0, 9.0, 11.0, 6.0, 1.0, 5.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.666015625, -2.59124755859375, -2.5164794921875, -2.44171142578125, -2.366943359375, -2.29217529296875, -2.2174072265625, -2.14263916015625, -2.06787109375, -1.99310302734375, -1.9183349609375, -1.84356689453125, -1.768798828125, -1.69403076171875, -1.6192626953125, -1.54449462890625, -1.4697265625, -1.39495849609375, -1.3201904296875, -1.24542236328125, -1.170654296875, -1.09588623046875, -1.0211181640625, -0.94635009765625, -0.87158203125, -0.79681396484375, -0.7220458984375, -0.64727783203125, -0.572509765625, -0.49774169921875, -0.4229736328125, -0.34820556640625, -0.2734375, -0.19866943359375, -0.1239013671875, -0.04913330078125, 0.025634765625, 0.10040283203125, 0.1751708984375, 0.24993896484375, 0.32470703125, 0.39947509765625, 0.4742431640625, 0.54901123046875, 0.623779296875, 0.69854736328125, 0.7733154296875, 0.84808349609375, 0.9228515625, 0.99761962890625, 1.0723876953125, 1.14715576171875, 1.221923828125, 1.29669189453125, 1.3714599609375, 1.44622802734375, 1.52099609375, 1.59576416015625, 1.6705322265625, 1.74530029296875, 1.820068359375, 1.89483642578125, 1.9696044921875, 2.04437255859375, 2.119140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 1.0, 2.0, 7.0, 6.0, 11.0, 8.0, 3.0, 11.0, 13.0, 15.0, 26.0, 29.0, 36.0, 33.0, 47.0, 44.0, 53.0, 44.0, 55.0, 62.0, 42.0, 51.0, 51.0, 40.0, 48.0, 38.0, 39.0, 26.0, 34.0, 21.0, 15.0, 12.0, 12.0, 8.0, 14.0, 4.0, 9.0, 1.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-1.49609375, -1.4463043212890625, -1.396514892578125, -1.3467254638671875, -1.29693603515625, -1.2471466064453125, -1.197357177734375, -1.1475677490234375, -1.0977783203125, -1.0479888916015625, -0.998199462890625, -0.9484100341796875, -0.89862060546875, -0.8488311767578125, -0.799041748046875, -0.7492523193359375, -0.699462890625, -0.6496734619140625, -0.599884033203125, -0.5500946044921875, -0.50030517578125, -0.4505157470703125, -0.400726318359375, -0.3509368896484375, -0.3011474609375, -0.2513580322265625, -0.201568603515625, -0.1517791748046875, -0.10198974609375, -0.0522003173828125, -0.002410888671875, 0.0473785400390625, 0.09716796875, 0.1469573974609375, 0.196746826171875, 0.2465362548828125, 0.29632568359375, 0.3461151123046875, 0.395904541015625, 0.4456939697265625, 0.4954833984375, 0.5452728271484375, 0.595062255859375, 0.6448516845703125, 0.69464111328125, 0.7444305419921875, 0.794219970703125, 0.8440093994140625, 0.893798828125, 0.9435882568359375, 0.993377685546875, 1.0431671142578125, 1.09295654296875, 1.1427459716796875, 1.192535400390625, 1.2423248291015625, 1.2921142578125, 1.3419036865234375, 1.391693115234375, 1.4414825439453125, 1.49127197265625, 1.5410614013671875, 1.590850830078125, 1.6406402587890625, 1.6904296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 11.0, 12.0, 28.0, 33.0, 72.0, 135.0, 288.0, 735.0, 3718.0, 77909.0, 943017.0, 19599.0, 2050.0, 535.0, 204.0, 76.0, 45.0, 29.0, 15.0, 13.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.79296875, -1.748504638671875, -1.70404052734375, -1.659576416015625, -1.6151123046875, -1.570648193359375, -1.52618408203125, -1.481719970703125, -1.437255859375, -1.392791748046875, -1.34832763671875, -1.303863525390625, -1.2593994140625, -1.214935302734375, -1.17047119140625, -1.126007080078125, -1.08154296875, -1.037078857421875, -0.99261474609375, -0.948150634765625, -0.9036865234375, -0.859222412109375, -0.81475830078125, -0.770294189453125, -0.725830078125, -0.681365966796875, -0.63690185546875, -0.592437744140625, -0.5479736328125, -0.503509521484375, -0.45904541015625, -0.414581298828125, -0.3701171875, -0.325653076171875, -0.28118896484375, -0.236724853515625, -0.1922607421875, -0.147796630859375, -0.10333251953125, -0.058868408203125, -0.014404296875, 0.030059814453125, 0.07452392578125, 0.118988037109375, 0.1634521484375, 0.207916259765625, 0.25238037109375, 0.296844482421875, 0.34130859375, 0.385772705078125, 0.43023681640625, 0.474700927734375, 0.5191650390625, 0.563629150390625, 0.60809326171875, 0.652557373046875, 0.697021484375, 0.741485595703125, 0.78594970703125, 0.830413818359375, 0.8748779296875, 0.919342041015625, 0.96380615234375, 1.008270263671875, 1.052734375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 10.0, 12.0, 6.0, 3.0, 12.0, 12.0, 18.0, 21.0, 17.0, 31.0, 34.0, 48.0, 75.0, 72.0, 92.0, 106.0, 80.0, 72.0, 52.0, 44.0, 32.0, 20.0, 17.0, 16.0, 6.0, 10.0, 10.0, 3.0, 10.0, 7.0, 8.0, 7.0, 4.0, 1.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-9.673833847045898e-05, -9.375158697366714e-05, -9.07648354768753e-05, -8.777808398008347e-05, -8.479133248329163e-05, -8.180458098649979e-05, -7.881782948970795e-05, -7.583107799291611e-05, -7.284432649612427e-05, -6.985757499933243e-05, -6.687082350254059e-05, -6.388407200574875e-05, -6.089732050895691e-05, -5.791056901216507e-05, -5.492381751537323e-05, -5.193706601858139e-05, -4.895031452178955e-05, -4.596356302499771e-05, -4.297681152820587e-05, -3.999006003141403e-05, -3.700330853462219e-05, -3.401655703783035e-05, -3.102980554103851e-05, -2.8043054044246674e-05, -2.5056302547454834e-05, -2.2069551050662994e-05, -1.9082799553871155e-05, -1.6096048057079315e-05, -1.3109296560287476e-05, -1.0122545063495636e-05, -7.135793566703796e-06, -4.149042069911957e-06, -1.1622905731201172e-06, 1.8244609236717224e-06, 4.811212420463562e-06, 7.797963917255402e-06, 1.0784715414047241e-05, 1.377146691083908e-05, 1.675821840763092e-05, 1.974496990442276e-05, 2.27317214012146e-05, 2.571847289800644e-05, 2.870522439479828e-05, 3.169197589159012e-05, 3.467872738838196e-05, 3.76654788851738e-05, 4.065223038196564e-05, 4.363898187875748e-05, 4.6625733375549316e-05, 4.9612484872341156e-05, 5.2599236369132996e-05, 5.5585987865924835e-05, 5.8572739362716675e-05, 6.155949085950851e-05, 6.454624235630035e-05, 6.75329938530922e-05, 7.051974534988403e-05, 7.350649684667587e-05, 7.649324834346771e-05, 7.947999984025955e-05, 8.246675133705139e-05, 8.545350283384323e-05, 8.844025433063507e-05, 9.142700582742691e-05, 9.441375732421875e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 7.0, 8.0, 9.0, 13.0, 24.0, 56.0, 82.0, 191.0, 482.0, 1331.0, 7966.0, 669384.0, 360678.0, 6426.0, 1166.0, 353.0, 182.0, 83.0, 52.0, 30.0, 12.0, 7.0, 9.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2685546875, -1.2196807861328125, -1.170806884765625, -1.1219329833984375, -1.07305908203125, -1.0241851806640625, -0.975311279296875, -0.9264373779296875, -0.8775634765625, -0.8286895751953125, -0.779815673828125, -0.7309417724609375, -0.68206787109375, -0.6331939697265625, -0.584320068359375, -0.5354461669921875, -0.486572265625, -0.4376983642578125, -0.388824462890625, -0.3399505615234375, -0.29107666015625, -0.2422027587890625, -0.193328857421875, -0.1444549560546875, -0.0955810546875, -0.0467071533203125, 0.002166748046875, 0.0510406494140625, 0.09991455078125, 0.1487884521484375, 0.197662353515625, 0.2465362548828125, 0.29541015625, 0.3442840576171875, 0.393157958984375, 0.4420318603515625, 0.49090576171875, 0.5397796630859375, 0.588653564453125, 0.6375274658203125, 0.6864013671875, 0.7352752685546875, 0.784149169921875, 0.8330230712890625, 0.88189697265625, 0.9307708740234375, 0.979644775390625, 1.0285186767578125, 1.077392578125, 1.1262664794921875, 1.175140380859375, 1.2240142822265625, 1.27288818359375, 1.3217620849609375, 1.370635986328125, 1.4195098876953125, 1.4683837890625, 1.5172576904296875, 1.566131591796875, 1.6150054931640625, 1.66387939453125, 1.7127532958984375, 1.761627197265625, 1.8105010986328125, 1.859375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 7.0, 13.0, 18.0, 16.0, 27.0, 51.0, 62.0, 106.0, 145.0, 165.0, 142.0, 81.0, 42.0, 36.0, 15.0, 23.0, 14.0, 11.0, 5.0, 4.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.483642578125, -0.4555778503417969, -0.42751312255859375, -0.3994483947753906, -0.3713836669921875, -0.3433189392089844, -0.31525421142578125, -0.2871894836425781, -0.259124755859375, -0.23106002807617188, -0.20299530029296875, -0.17493057250976562, -0.1468658447265625, -0.11880111694335938, -0.09073638916015625, -0.06267166137695312, -0.03460693359375, -0.006542205810546875, 0.02152252197265625, 0.049587249755859375, 0.0776519775390625, 0.10571670532226562, 0.13378143310546875, 0.16184616088867188, 0.189910888671875, 0.21797561645507812, 0.24604034423828125, 0.2741050720214844, 0.3021697998046875, 0.3302345275878906, 0.35829925537109375, 0.3863639831542969, 0.4144287109375, 0.4424934387207031, 0.47055816650390625, 0.4986228942871094, 0.5266876220703125, 0.5547523498535156, 0.5828170776367188, 0.6108818054199219, 0.638946533203125, 0.6670112609863281, 0.6950759887695312, 0.7231407165527344, 0.7512054443359375, 0.7792701721191406, 0.8073348999023438, 0.8353996276855469, 0.86346435546875, 0.8915290832519531, 0.9195938110351562, 0.9476585388183594, 0.9757232666015625, 1.0037879943847656, 1.0318527221679688, 1.0599174499511719, 1.087982177734375, 1.1160469055175781, 1.1441116333007812, 1.1721763610839844, 1.2002410888671875, 1.2283058166503906, 1.2563705444335938, 1.2844352722167969, 1.3125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 14.0, 19.0, 54.0, 122.0, 220.0, 261.0, 172.0, 83.0, 24.0, 15.0, 5.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.999593734741211, -8.596375465393066, -8.193158149719238, -7.789939880371094, -7.386722087860107, -6.983504295349121, -6.580286502838135, -6.177068710327148, -5.773850440979004, -5.370632648468018, -4.967414855957031, -4.564196586608887, -4.1609787940979, -3.757761001586914, -3.3545432090759277, -2.9513251781463623, -2.548107624053955, -2.1448898315429688, -1.7416718006134033, -1.338454008102417, -0.9352360963821411, -0.5320181846618652, -0.1288003921508789, 0.2744176387786865, 0.6776354312896729, 1.0808533430099487, 1.4840712547302246, 1.887289047241211, 2.2905068397521973, 2.6937248706817627, 3.096942663192749, 3.5001606941223145, 3.903378486633301, 4.306596279144287, 4.709814071655273, 5.113032341003418, 5.516250133514404, 5.919467926025391, 6.322685718536377, 6.725903511047363, 7.129121780395508, 7.532339572906494, 7.9355573654174805, 8.338775634765625, 8.741992950439453, 9.145211219787598, 9.548429489135742, 9.95164680480957, 10.354864120483398, 10.758082389831543, 11.161299705505371, 11.564517974853516, 11.967735290527344, 12.370953559875488, 12.774171829223633, 13.177389144897461, 13.580607414245605, 13.98382568359375, 14.387042999267578, 14.790261268615723, 15.19347858428955, 15.596696853637695, 15.999914169311523, 16.403133392333984, 16.806350708007812]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 8.0, 5.0, 7.0, 10.0, 14.0, 18.0, 21.0, 23.0, 28.0, 26.0, 33.0, 48.0, 61.0, 61.0, 48.0, 75.0, 55.0, 46.0, 51.0, 61.0, 51.0, 45.0, 39.0, 22.0, 29.0, 24.0, 18.0, 18.0, 11.0, 12.0, 15.0, 4.0, 5.0, 4.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.69635009765625, -8.46436882019043, -8.23238754272461, -8.000406265258789, -7.768424987792969, -7.536443710327148, -7.304462432861328, -7.072481632232666, -6.840500354766846, -6.608519077301025, -6.376537799835205, -6.144556522369385, -5.9125752449035645, -5.680594444274902, -5.448613166809082, -5.216631889343262, -4.984650611877441, -4.752669334411621, -4.520688056945801, -4.2887067794799805, -4.05672550201416, -3.824744462966919, -3.5927631855010986, -3.3607821464538574, -3.128800392150879, -2.8968191146850586, -2.6648378372192383, -2.432856559753418, -2.2008755207061768, -1.9688942432403564, -1.7369129657745361, -1.5049318075180054, -1.2729506492614746, -1.0409693717956543, -0.8089882135391235, -0.5770069360733032, -0.3450257182121277, -0.11304450035095215, 0.11893677711486816, 0.3509179353713989, 0.5828992128372192, 0.8148804306983948, 1.0468616485595703, 1.2788429260253906, 1.510824203491211, 1.7428053617477417, 1.974786639213562, 2.2067677974700928, 2.438749074935913, 2.6707303524017334, 2.9027116298675537, 3.134692668914795, 3.3666739463806152, 3.5986552238464355, 3.830636501312256, 4.062617778778076, 4.2945990562438965, 4.526580333709717, 4.758561611175537, 4.990542888641357, 5.222524166107178, 5.45450496673584, 5.68648624420166, 5.9184675216674805, 6.150448799133301]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 6.0, 15.0, 5.0, 11.0, 13.0, 12.0, 21.0, 32.0, 33.0, 48.0, 64.0, 84.0, 103.0, 152.0, 270.0, 1464.0, 899557.0, 3289645.0, 1746.0, 318.0, 171.0, 137.0, 93.0, 70.0, 49.0, 46.0, 28.0, 19.0, 17.0, 10.0, 11.0, 6.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.20703125, -4.08343505859375, -3.9598388671875, -3.83624267578125, -3.712646484375, -3.58905029296875, -3.4654541015625, -3.34185791015625, -3.21826171875, -3.09466552734375, -2.9710693359375, -2.84747314453125, -2.723876953125, -2.60028076171875, -2.4766845703125, -2.35308837890625, -2.2294921875, -2.10589599609375, -1.9822998046875, -1.85870361328125, -1.735107421875, -1.61151123046875, -1.4879150390625, -1.36431884765625, -1.24072265625, -1.11712646484375, -0.9935302734375, -0.86993408203125, -0.746337890625, -0.62274169921875, -0.4991455078125, -0.37554931640625, -0.251953125, -0.12835693359375, -0.0047607421875, 0.11883544921875, 0.242431640625, 0.36602783203125, 0.4896240234375, 0.61322021484375, 0.73681640625, 0.86041259765625, 0.9840087890625, 1.10760498046875, 1.231201171875, 1.35479736328125, 1.4783935546875, 1.60198974609375, 1.7255859375, 1.84918212890625, 1.9727783203125, 2.09637451171875, 2.219970703125, 2.34356689453125, 2.4671630859375, 2.59075927734375, 2.71435546875, 2.83795166015625, 2.9615478515625, 3.08514404296875, 3.208740234375, 3.33233642578125, 3.4559326171875, 3.57952880859375, 3.703125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 9.0, 4.0, 12.0, 14.0, 21.0, 28.0, 34.0, 40.0, 45.0, 37.0, 52.0, 67.0, 68.0, 85.0, 58.0, 56.0, 73.0, 53.0, 50.0, 32.0, 35.0, 32.0, 26.0, 18.0, 15.0, 15.0, 8.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0], "bins": [-0.54638671875, -0.5341529846191406, -0.5219192504882812, -0.5096855163574219, -0.4974517822265625, -0.4852180480957031, -0.47298431396484375, -0.4607505798339844, -0.448516845703125, -0.4362831115722656, -0.42404937744140625, -0.4118156433105469, -0.3995819091796875, -0.3873481750488281, -0.37511444091796875, -0.3628807067871094, -0.35064697265625, -0.3384132385253906, -0.32617950439453125, -0.3139457702636719, -0.3017120361328125, -0.2894783020019531, -0.27724456787109375, -0.2650108337402344, -0.252777099609375, -0.24054336547851562, -0.22830963134765625, -0.21607589721679688, -0.2038421630859375, -0.19160842895507812, -0.17937469482421875, -0.16714096069335938, -0.1549072265625, -0.14267349243164062, -0.13043975830078125, -0.11820602416992188, -0.1059722900390625, -0.09373855590820312, -0.08150482177734375, -0.06927108764648438, -0.057037353515625, -0.044803619384765625, -0.03256988525390625, -0.020336151123046875, -0.0081024169921875, 0.004131317138671875, 0.01636505126953125, 0.028598785400390625, 0.04083251953125, 0.053066253662109375, 0.06529998779296875, 0.07753372192382812, 0.0897674560546875, 0.10200119018554688, 0.11423492431640625, 0.12646865844726562, 0.138702392578125, 0.15093612670898438, 0.16316986083984375, 0.17540359497070312, 0.1876373291015625, 0.19987106323242188, 0.21210479736328125, 0.22433853149414062, 0.236572265625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 6.0, 17.0, 21.0, 51.0, 83.0, 100.0, 241.0, 505.0, 1055.0, 2759.0, 7846.0, 28633.0, 158720.0, 2469389.0, 1387056.0, 105769.0, 21235.0, 6467.0, 2452.0, 979.0, 428.0, 229.0, 105.0, 54.0, 32.0, 21.0, 11.0, 8.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58251953125, -0.5623626708984375, -0.542205810546875, -0.5220489501953125, -0.50189208984375, -0.4817352294921875, -0.461578369140625, -0.4414215087890625, -0.4212646484375, -0.4011077880859375, -0.380950927734375, -0.3607940673828125, -0.34063720703125, -0.3204803466796875, -0.300323486328125, -0.2801666259765625, -0.260009765625, -0.2398529052734375, -0.219696044921875, -0.1995391845703125, -0.17938232421875, -0.1592254638671875, -0.139068603515625, -0.1189117431640625, -0.0987548828125, -0.0785980224609375, -0.058441162109375, -0.0382843017578125, -0.01812744140625, 0.0020294189453125, 0.022186279296875, 0.0423431396484375, 0.0625, 0.0826568603515625, 0.102813720703125, 0.1229705810546875, 0.14312744140625, 0.1632843017578125, 0.183441162109375, 0.2035980224609375, 0.2237548828125, 0.2439117431640625, 0.264068603515625, 0.2842254638671875, 0.30438232421875, 0.3245391845703125, 0.344696044921875, 0.3648529052734375, 0.385009765625, 0.4051666259765625, 0.425323486328125, 0.4454803466796875, 0.46563720703125, 0.4857940673828125, 0.505950927734375, 0.5261077880859375, 0.5462646484375, 0.5664215087890625, 0.586578369140625, 0.6067352294921875, 0.62689208984375, 0.6470489501953125, 0.667205810546875, 0.6873626708984375, 0.70751953125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 4.0, 13.0, 11.0, 21.0, 25.0, 54.0, 78.0, 102.0, 189.0, 349.0, 663.0, 960.0, 683.0, 377.0, 187.0, 128.0, 70.0, 50.0, 30.0, 16.0, 15.0, 15.0, 9.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.90673828125, -0.8832168579101562, -0.8596954345703125, -0.8361740112304688, -0.812652587890625, -0.7891311645507812, -0.7656097412109375, -0.7420883178710938, -0.71856689453125, -0.6950454711914062, -0.6715240478515625, -0.6480026245117188, -0.624481201171875, -0.6009597778320312, -0.5774383544921875, -0.5539169311523438, -0.5303955078125, -0.5068740844726562, -0.4833526611328125, -0.45983123779296875, -0.436309814453125, -0.41278839111328125, -0.3892669677734375, -0.36574554443359375, -0.34222412109375, -0.31870269775390625, -0.2951812744140625, -0.27165985107421875, -0.248138427734375, -0.22461700439453125, -0.2010955810546875, -0.17757415771484375, -0.154052734375, -0.13053131103515625, -0.1070098876953125, -0.08348846435546875, -0.059967041015625, -0.03644561767578125, -0.0129241943359375, 0.01059722900390625, 0.03411865234375, 0.05764007568359375, 0.0811614990234375, 0.10468292236328125, 0.128204345703125, 0.15172576904296875, 0.1752471923828125, 0.19876861572265625, 0.2222900390625, 0.24581146240234375, 0.2693328857421875, 0.29285430908203125, 0.316375732421875, 0.33989715576171875, 0.3634185791015625, 0.38694000244140625, 0.41046142578125, 0.43398284912109375, 0.4575042724609375, 0.48102569580078125, 0.504547119140625, 0.5280685424804688, 0.5515899658203125, 0.5751113891601562, 0.5986328125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 12.0, 44.0, 143.0, 346.0, 281.0, 109.0, 29.0, 15.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.231163024902344, -8.857980728149414, -8.4847993850708, -8.111618041992188, -7.738435745239258, -7.365253925323486, -6.992072105407715, -6.618890285491943, -6.245708465576172, -5.8725266456604, -5.499344825744629, -5.126163005828857, -4.752981185913086, -4.3797993659973145, -4.006617546081543, -3.6334357261657715, -3.26025390625, -2.8870720863342285, -2.513890266418457, -2.1407084465026855, -1.767526626586914, -1.3943448066711426, -1.021162986755371, -0.6479811668395996, -0.2747993469238281, 0.09838247299194336, 0.47156429290771484, 0.8447461128234863, 1.2179279327392578, 1.5911097526550293, 1.9642915725708008, 2.3374733924865723, 2.71065616607666, 3.0838379859924316, 3.457019805908203, 3.8302016258239746, 4.203383445739746, 4.576565265655518, 4.949747085571289, 5.3229289054870605, 5.696110725402832, 6.0692925453186035, 6.442474365234375, 6.8156561851501465, 7.188838005065918, 7.5620198249816895, 7.935201644897461, 8.30838394165039, 8.681565284729004, 9.054746627807617, 9.427928924560547, 9.801111221313477, 10.17429256439209, 10.547473907470703, 10.920656204223633, 11.293838500976562, 11.667019844055176, 12.040201187133789, 12.413383483886719, 12.786565780639648, 13.159747123718262, 13.532928466796875, 13.906110763549805, 14.279293060302734, 14.652474403381348]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 1.0, 5.0, 7.0, 11.0, 17.0, 11.0, 14.0, 20.0, 26.0, 22.0, 32.0, 34.0, 42.0, 52.0, 46.0, 46.0, 57.0, 64.0, 69.0, 53.0, 47.0, 43.0, 43.0, 38.0, 35.0, 24.0, 25.0, 20.0, 22.0, 14.0, 15.0, 17.0, 7.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2577648162841797, -3.151721239089966, -3.045677423477173, -2.939633846282959, -2.833590030670166, -2.727546453475952, -2.6215028762817383, -2.5154590606689453, -2.4094154834747314, -2.3033719062805176, -2.1973280906677246, -2.0912845134735107, -1.9852408170700073, -1.879197120666504, -1.7731534242630005, -1.667109727859497, -1.5610660314559937, -1.4550223350524902, -1.3489786386489868, -1.2429349422454834, -1.1368913650512695, -1.0308476686477661, -0.9248039722442627, -0.818760335445404, -0.7127166390419006, -0.6066729426383972, -0.5006293058395386, -0.39458560943603516, -0.2885419428348541, -0.1824982762336731, -0.07645457983016968, 0.029589056968688965, 0.13563275337219238, 0.2416764199733734, 0.34772008657455444, 0.45376378297805786, 0.5598074197769165, 0.6658511161804199, 0.7718948125839233, 0.877938449382782, 0.9839821457862854, 1.090025782585144, 1.1960694789886475, 1.3021131753921509, 1.4081568717956543, 1.5142004489898682, 1.6202442646026611, 1.726287841796875, 1.8323315382003784, 1.9383752346038818, 2.0444188117980957, 2.1504626274108887, 2.2565062046051025, 2.3625497817993164, 2.4685935974121094, 2.5746371746063232, 2.680680990219116, 2.78672456741333, 2.892768383026123, 2.998811960220337, 3.10485577583313, 3.2108993530273438, 3.3169431686401367, 3.4229867458343506, 3.5290303230285645]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 10.0, 14.0, 14.0, 22.0, 29.0, 48.0, 91.0, 124.0, 176.0, 318.0, 539.0, 985.0, 1675.0, 3467.0, 7235.0, 17817.0, 50057.0, 174481.0, 449983.0, 235683.0, 66171.0, 22211.0, 8842.0, 3980.0, 2004.0, 1030.0, 601.0, 338.0, 208.0, 136.0, 90.0, 59.0, 35.0, 25.0, 12.0, 9.0, 9.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68310546875, -0.6614990234375, -0.639892578125, -0.6182861328125, -0.5966796875, -0.5750732421875, -0.553466796875, -0.5318603515625, -0.51025390625, -0.4886474609375, -0.467041015625, -0.4454345703125, -0.423828125, -0.4022216796875, -0.380615234375, -0.3590087890625, -0.33740234375, -0.3157958984375, -0.294189453125, -0.2725830078125, -0.2509765625, -0.2293701171875, -0.207763671875, -0.1861572265625, -0.16455078125, -0.1429443359375, -0.121337890625, -0.0997314453125, -0.078125, -0.0565185546875, -0.034912109375, -0.0133056640625, 0.00830078125, 0.0299072265625, 0.051513671875, 0.0731201171875, 0.0947265625, 0.1163330078125, 0.137939453125, 0.1595458984375, 0.18115234375, 0.2027587890625, 0.224365234375, 0.2459716796875, 0.267578125, 0.2891845703125, 0.310791015625, 0.3323974609375, 0.35400390625, 0.3756103515625, 0.397216796875, 0.4188232421875, 0.4404296875, 0.4620361328125, 0.483642578125, 0.5052490234375, 0.52685546875, 0.5484619140625, 0.570068359375, 0.5916748046875, 0.61328125, 0.6348876953125, 0.656494140625, 0.6781005859375, 0.69970703125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 3.0, 5.0, 8.0, 11.0, 25.0, 25.0, 31.0, 29.0, 46.0, 56.0, 50.0, 77.0, 60.0, 87.0, 66.0, 78.0, 65.0, 54.0, 53.0, 36.0, 43.0, 29.0, 22.0, 13.0, 13.0, 11.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6044921875, -0.590972900390625, -0.57745361328125, -0.563934326171875, -0.5504150390625, -0.536895751953125, -0.52337646484375, -0.509857177734375, -0.496337890625, -0.482818603515625, -0.46929931640625, -0.455780029296875, -0.4422607421875, -0.428741455078125, -0.41522216796875, -0.401702880859375, -0.38818359375, -0.374664306640625, -0.36114501953125, -0.347625732421875, -0.3341064453125, -0.320587158203125, -0.30706787109375, -0.293548583984375, -0.280029296875, -0.266510009765625, -0.25299072265625, -0.239471435546875, -0.2259521484375, -0.212432861328125, -0.19891357421875, -0.185394287109375, -0.171875, -0.158355712890625, -0.14483642578125, -0.131317138671875, -0.1177978515625, -0.104278564453125, -0.09075927734375, -0.077239990234375, -0.063720703125, -0.050201416015625, -0.03668212890625, -0.023162841796875, -0.0096435546875, 0.003875732421875, 0.01739501953125, 0.030914306640625, 0.04443359375, 0.057952880859375, 0.07147216796875, 0.084991455078125, 0.0985107421875, 0.112030029296875, 0.12554931640625, 0.139068603515625, 0.152587890625, 0.166107177734375, 0.17962646484375, 0.193145751953125, 0.2066650390625, 0.220184326171875, 0.23370361328125, 0.247222900390625, 0.2607421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 6.0, 11.0, 13.0, 17.0, 17.0, 24.0, 24.0, 65.0, 97.0, 132.0, 212.0, 317.0, 654.0, 1341.0, 3719.0, 13464.0, 80277.0, 687980.0, 221563.0, 28241.0, 6286.0, 2074.0, 858.0, 450.0, 250.0, 139.0, 102.0, 54.0, 48.0, 34.0, 23.0, 9.0, 14.0, 4.0, 12.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.07421875, -1.0368194580078125, -0.999420166015625, -0.9620208740234375, -0.92462158203125, -0.8872222900390625, -0.849822998046875, -0.8124237060546875, -0.7750244140625, -0.7376251220703125, -0.700225830078125, -0.6628265380859375, -0.62542724609375, -0.5880279541015625, -0.550628662109375, -0.5132293701171875, -0.475830078125, -0.4384307861328125, -0.401031494140625, -0.3636322021484375, -0.32623291015625, -0.2888336181640625, -0.251434326171875, -0.2140350341796875, -0.1766357421875, -0.1392364501953125, -0.101837158203125, -0.0644378662109375, -0.02703857421875, 0.0103607177734375, 0.047760009765625, 0.0851593017578125, 0.12255859375, 0.1599578857421875, 0.197357177734375, 0.2347564697265625, 0.27215576171875, 0.3095550537109375, 0.346954345703125, 0.3843536376953125, 0.4217529296875, 0.4591522216796875, 0.496551513671875, 0.5339508056640625, 0.57135009765625, 0.6087493896484375, 0.646148681640625, 0.6835479736328125, 0.720947265625, 0.7583465576171875, 0.795745849609375, 0.8331451416015625, 0.87054443359375, 0.9079437255859375, 0.945343017578125, 0.9827423095703125, 1.0201416015625, 1.0575408935546875, 1.094940185546875, 1.1323394775390625, 1.16973876953125, 1.2071380615234375, 1.244537353515625, 1.2819366455078125, 1.3193359375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 4.0, 3.0, 8.0, 4.0, 3.0, 8.0, 7.0, 4.0, 6.0, 10.0, 15.0, 18.0, 23.0, 27.0, 38.0, 28.0, 35.0, 54.0, 37.0, 55.0, 44.0, 60.0, 51.0, 49.0, 53.0, 53.0, 53.0, 47.0, 25.0, 36.0, 31.0, 19.0, 26.0, 15.0, 14.0, 16.0, 5.0, 2.0, 6.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.037109375, -0.995513916015625, -0.95391845703125, -0.912322998046875, -0.8707275390625, -0.829132080078125, -0.78753662109375, -0.745941162109375, -0.704345703125, -0.662750244140625, -0.62115478515625, -0.579559326171875, -0.5379638671875, -0.496368408203125, -0.45477294921875, -0.413177490234375, -0.37158203125, -0.329986572265625, -0.28839111328125, -0.246795654296875, -0.2052001953125, -0.163604736328125, -0.12200927734375, -0.080413818359375, -0.038818359375, 0.002777099609375, 0.04437255859375, 0.085968017578125, 0.1275634765625, 0.169158935546875, 0.21075439453125, 0.252349853515625, 0.2939453125, 0.335540771484375, 0.37713623046875, 0.418731689453125, 0.4603271484375, 0.501922607421875, 0.54351806640625, 0.585113525390625, 0.626708984375, 0.668304443359375, 0.70989990234375, 0.751495361328125, 0.7930908203125, 0.834686279296875, 0.87628173828125, 0.917877197265625, 0.95947265625, 1.001068115234375, 1.04266357421875, 1.084259033203125, 1.1258544921875, 1.167449951171875, 1.20904541015625, 1.250640869140625, 1.292236328125, 1.333831787109375, 1.37542724609375, 1.417022705078125, 1.4586181640625, 1.500213623046875, 1.54180908203125, 1.583404541015625, 1.625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 8.0, 12.0, 24.0, 34.0, 37.0, 89.0, 143.0, 352.0, 982.0, 4323.0, 675608.0, 361373.0, 3915.0, 906.0, 354.0, 157.0, 86.0, 43.0, 33.0, 25.0, 12.0, 9.0, 4.0, 6.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.515625, -2.43695068359375, -2.3582763671875, -2.27960205078125, -2.200927734375, -2.12225341796875, -2.0435791015625, -1.96490478515625, -1.88623046875, -1.80755615234375, -1.7288818359375, -1.65020751953125, -1.571533203125, -1.49285888671875, -1.4141845703125, -1.33551025390625, -1.2568359375, -1.17816162109375, -1.0994873046875, -1.02081298828125, -0.942138671875, -0.86346435546875, -0.7847900390625, -0.70611572265625, -0.62744140625, -0.54876708984375, -0.4700927734375, -0.39141845703125, -0.312744140625, -0.23406982421875, -0.1553955078125, -0.07672119140625, 0.001953125, 0.08062744140625, 0.1593017578125, 0.23797607421875, 0.316650390625, 0.39532470703125, 0.4739990234375, 0.55267333984375, 0.63134765625, 0.71002197265625, 0.7886962890625, 0.86737060546875, 0.946044921875, 1.02471923828125, 1.1033935546875, 1.18206787109375, 1.2607421875, 1.33941650390625, 1.4180908203125, 1.49676513671875, 1.575439453125, 1.65411376953125, 1.7327880859375, 1.81146240234375, 1.89013671875, 1.96881103515625, 2.0474853515625, 2.12615966796875, 2.204833984375, 2.28350830078125, 2.3621826171875, 2.44085693359375, 2.51953125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 1.0, 4.0, 4.0, 4.0, 5.0, 4.0, 1.0, 7.0, 5.0, 8.0, 13.0, 14.0, 13.0, 20.0, 23.0, 26.0, 35.0, 52.0, 93.0, 119.0, 140.0, 127.0, 71.0, 60.0, 30.0, 23.0, 17.0, 17.0, 8.0, 7.0, 12.0, 10.0, 8.0, 3.0, 2.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011861324310302734, -0.0001153433695435524, -0.00011207349598407745, -0.00010880362242460251, -0.00010553374886512756, -0.00010226387530565262, -9.899400174617767e-05, -9.572412818670273e-05, -9.245425462722778e-05, -8.918438106775284e-05, -8.591450750827789e-05, -8.264463394880295e-05, -7.9374760389328e-05, -7.610488682985306e-05, -7.283501327037811e-05, -6.956513971090317e-05, -6.629526615142822e-05, -6.302539259195328e-05, -5.975551903247833e-05, -5.648564547300339e-05, -5.321577191352844e-05, -4.99458983540535e-05, -4.667602479457855e-05, -4.340615123510361e-05, -4.013627767562866e-05, -3.686640411615372e-05, -3.359653055667877e-05, -3.0326656997203827e-05, -2.7056783437728882e-05, -2.3786909878253937e-05, -2.0517036318778992e-05, -1.7247162759304047e-05, -1.3977289199829102e-05, -1.0707415640354156e-05, -7.4375420808792114e-06, -4.167668521404266e-06, -8.977949619293213e-07, 2.3720785975456238e-06, 5.641952157020569e-06, 8.911825716495514e-06, 1.2181699275970459e-05, 1.5451572835445404e-05, 1.872144639492035e-05, 2.1991319954395294e-05, 2.526119351387024e-05, 2.8531067073345184e-05, 3.180094063282013e-05, 3.5070814192295074e-05, 3.834068775177002e-05, 4.1610561311244965e-05, 4.488043487071991e-05, 4.8150308430194855e-05, 5.14201819896698e-05, 5.4690055549144745e-05, 5.795992910861969e-05, 6.122980266809464e-05, 6.449967622756958e-05, 6.776954978704453e-05, 7.103942334651947e-05, 7.430929690599442e-05, 7.757917046546936e-05, 8.08490440249443e-05, 8.411891758441925e-05, 8.73887911438942e-05, 9.065866470336914e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 5.0, 9.0, 13.0, 22.0, 18.0, 43.0, 62.0, 101.0, 199.0, 377.0, 872.0, 2059.0, 9093.0, 660692.0, 363582.0, 7864.0, 1948.0, 758.0, 353.0, 186.0, 105.0, 60.0, 29.0, 30.0, 15.0, 12.0, 7.0, 10.0, 6.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.59765625, -1.5506134033203125, -1.503570556640625, -1.4565277099609375, -1.40948486328125, -1.3624420166015625, -1.315399169921875, -1.2683563232421875, -1.2213134765625, -1.1742706298828125, -1.127227783203125, -1.0801849365234375, -1.03314208984375, -0.9860992431640625, -0.939056396484375, -0.8920135498046875, -0.844970703125, -0.7979278564453125, -0.750885009765625, -0.7038421630859375, -0.65679931640625, -0.6097564697265625, -0.562713623046875, -0.5156707763671875, -0.4686279296875, -0.4215850830078125, -0.374542236328125, -0.3274993896484375, -0.28045654296875, -0.2334136962890625, -0.186370849609375, -0.1393280029296875, -0.09228515625, -0.0452423095703125, 0.001800537109375, 0.0488433837890625, 0.09588623046875, 0.1429290771484375, 0.189971923828125, 0.2370147705078125, 0.2840576171875, 0.3311004638671875, 0.378143310546875, 0.4251861572265625, 0.47222900390625, 0.5192718505859375, 0.566314697265625, 0.6133575439453125, 0.660400390625, 0.7074432373046875, 0.754486083984375, 0.8015289306640625, 0.84857177734375, 0.8956146240234375, 0.942657470703125, 0.9897003173828125, 1.0367431640625, 1.0837860107421875, 1.130828857421875, 1.1778717041015625, 1.22491455078125, 1.2719573974609375, 1.319000244140625, 1.3660430908203125, 1.4130859375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 3.0, 1.0, 5.0, 1.0, 6.0, 9.0, 12.0, 20.0, 47.0, 74.0, 103.0, 159.0, 173.0, 148.0, 96.0, 57.0, 29.0, 19.0, 13.0, 7.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.017578125, -0.9878311157226562, -0.9580841064453125, -0.9283370971679688, -0.898590087890625, -0.8688430786132812, -0.8390960693359375, -0.8093490600585938, -0.77960205078125, -0.7498550415039062, -0.7201080322265625, -0.6903610229492188, -0.660614013671875, -0.6308670043945312, -0.6011199951171875, -0.5713729858398438, -0.5416259765625, -0.5118789672851562, -0.4821319580078125, -0.45238494873046875, -0.422637939453125, -0.39289093017578125, -0.3631439208984375, -0.33339691162109375, -0.30364990234375, -0.27390289306640625, -0.2441558837890625, -0.21440887451171875, -0.184661865234375, -0.15491485595703125, -0.1251678466796875, -0.09542083740234375, -0.065673828125, -0.03592681884765625, -0.0061798095703125, 0.02356719970703125, 0.053314208984375, 0.08306121826171875, 0.1128082275390625, 0.14255523681640625, 0.17230224609375, 0.20204925537109375, 0.2317962646484375, 0.26154327392578125, 0.291290283203125, 0.32103729248046875, 0.3507843017578125, 0.38053131103515625, 0.4102783203125, 0.44002532958984375, 0.4697723388671875, 0.49951934814453125, 0.529266357421875, 0.5590133666992188, 0.5887603759765625, 0.6185073852539062, 0.64825439453125, 0.6780014038085938, 0.7077484130859375, 0.7374954223632812, 0.767242431640625, 0.7969894409179688, 0.8267364501953125, 0.8564834594726562, 0.88623046875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 12.0, 13.0, 42.0, 223.0, 439.0, 204.0, 48.0, 10.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.52410125732422, -29.8038387298584, -29.083574295043945, -28.363311767578125, -27.643049240112305, -26.922786712646484, -26.20252227783203, -25.48225975036621, -24.76199722290039, -24.04173469543457, -23.321470260620117, -22.601207733154297, -21.880945205688477, -21.160682678222656, -20.440418243408203, -19.720155715942383, -18.99989128112793, -18.27962875366211, -17.559364318847656, -16.839101791381836, -16.118839263916016, -15.398575782775879, -14.678312301635742, -13.958049774169922, -13.237786293029785, -12.517522811889648, -11.797260284423828, -11.076996803283691, -10.356733322143555, -9.636470794677734, -8.916207313537598, -8.195943832397461, -7.475681304931641, -6.755418300628662, -6.035155296325684, -5.314891815185547, -4.594628810882568, -3.87436580657959, -3.154102325439453, -2.4338393211364746, -1.713576316833496, -0.993313193321228, -0.27305006980895996, 0.44721317291259766, 1.1674761772155762, 1.8877391815185547, 2.6080026626586914, 3.32826566696167, 4.048528671264648, 4.768791675567627, 5.4890546798706055, 6.209318161010742, 6.929581165313721, 7.649844169616699, 8.370107650756836, 9.090370178222656, 9.810633659362793, 10.53089714050293, 11.25115966796875, 11.971423149108887, 12.691686630249023, 13.411949157714844, 14.13221263885498, 14.852476119995117, 15.572738647460938]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 10.0, 14.0, 18.0, 24.0, 28.0, 44.0, 53.0, 63.0, 59.0, 83.0, 90.0, 104.0, 99.0, 59.0, 56.0, 44.0, 36.0, 33.0, 24.0, 22.0, 13.0, 3.0, 9.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.369007110595703, -5.085866928100586, -4.8027262687683105, -4.519586086273193, -4.236445426940918, -3.953305244445801, -3.6701650619506836, -3.3870246410369873, -3.103884220123291, -2.8207437992095947, -2.5376033782958984, -2.2544631958007812, -1.971322774887085, -1.6881823539733887, -1.405042052268982, -1.1219017505645752, -0.8387613296508789, -0.5556209683418274, -0.2724806070327759, 0.010659754276275635, 0.29380011558532715, 0.5769405364990234, 0.8600808382034302, 1.143221139907837, 1.4263615608215332, 1.7095019817352295, 1.9926422834396362, 2.275782585144043, 2.5589230060577393, 2.8420634269714355, 3.1252036094665527, 3.408344030380249, 3.6914844512939453, 3.9746248722076416, 4.257765293121338, 4.540905475616455, 4.8240461349487305, 5.107186317443848, 5.390326499938965, 5.673466682434082, 5.956607341766357, 6.239747524261475, 6.52288818359375, 6.806028366088867, 7.089168548583984, 7.37230920791626, 7.655449390411377, 7.938590049743652, 8.22173023223877, 8.504870414733887, 8.788010597229004, 9.071151733398438, 9.354291915893555, 9.637432098388672, 9.920572280883789, 10.203712463378906, 10.486852645874023, 10.76999282836914, 11.053133010864258, 11.336274147033691, 11.619414329528809, 11.902554512023926, 12.185694694519043, 12.46883487701416, 12.751976013183594]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 7.0, 15.0, 13.0, 12.0, 19.0, 24.0, 38.0, 80.0, 107.0, 262.0, 641.0, 2039.0, 11023.0, 147101.0, 3599539.0, 408195.0, 20104.0, 3304.0, 920.0, 367.0, 174.0, 100.0, 62.0, 35.0, 26.0, 21.0, 14.0, 11.0, 3.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8056640625, -0.7729644775390625, -0.740264892578125, -0.7075653076171875, -0.67486572265625, -0.6421661376953125, -0.609466552734375, -0.5767669677734375, -0.5440673828125, -0.5113677978515625, -0.478668212890625, -0.4459686279296875, -0.41326904296875, -0.3805694580078125, -0.347869873046875, -0.3151702880859375, -0.282470703125, -0.2497711181640625, -0.217071533203125, -0.1843719482421875, -0.15167236328125, -0.1189727783203125, -0.086273193359375, -0.0535736083984375, -0.0208740234375, 0.0118255615234375, 0.044525146484375, 0.0772247314453125, 0.10992431640625, 0.1426239013671875, 0.175323486328125, 0.2080230712890625, 0.24072265625, 0.2734222412109375, 0.306121826171875, 0.3388214111328125, 0.37152099609375, 0.4042205810546875, 0.436920166015625, 0.4696197509765625, 0.5023193359375, 0.5350189208984375, 0.567718505859375, 0.6004180908203125, 0.63311767578125, 0.6658172607421875, 0.698516845703125, 0.7312164306640625, 0.763916015625, 0.7966156005859375, 0.829315185546875, 0.8620147705078125, 0.89471435546875, 0.9274139404296875, 0.960113525390625, 0.9928131103515625, 1.0255126953125, 1.0582122802734375, 1.090911865234375, 1.1236114501953125, 1.15631103515625, 1.1890106201171875, 1.221710205078125, 1.2544097900390625, 1.287109375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 3.0, 6.0, 10.0, 13.0, 19.0, 25.0, 45.0, 48.0, 61.0, 65.0, 93.0, 78.0, 95.0, 92.0, 78.0, 75.0, 56.0, 40.0, 33.0, 23.0, 21.0, 9.0, 4.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.309814453125, -0.2952003479003906, -0.28058624267578125, -0.2659721374511719, -0.2513580322265625, -0.23674392700195312, -0.22212982177734375, -0.20751571655273438, -0.192901611328125, -0.17828750610351562, -0.16367340087890625, -0.14905929565429688, -0.1344451904296875, -0.11983108520507812, -0.10521697998046875, -0.09060287475585938, -0.07598876953125, -0.061374664306640625, -0.04676055908203125, -0.032146453857421875, -0.0175323486328125, -0.002918243408203125, 0.01169586181640625, 0.026309967041015625, 0.040924072265625, 0.055538177490234375, 0.07015228271484375, 0.08476638793945312, 0.0993804931640625, 0.11399459838867188, 0.12860870361328125, 0.14322280883789062, 0.1578369140625, 0.17245101928710938, 0.18706512451171875, 0.20167922973632812, 0.2162933349609375, 0.23090744018554688, 0.24552154541015625, 0.2601356506347656, 0.274749755859375, 0.2893638610839844, 0.30397796630859375, 0.3185920715332031, 0.3332061767578125, 0.3478202819824219, 0.36243438720703125, 0.3770484924316406, 0.39166259765625, 0.4062767028808594, 0.42089080810546875, 0.4355049133300781, 0.4501190185546875, 0.4647331237792969, 0.47934722900390625, 0.4939613342285156, 0.508575439453125, 0.5231895446777344, 0.5378036499023438, 0.5524177551269531, 0.5670318603515625, 0.5816459655761719, 0.5962600708007812, 0.6108741760253906, 0.62548828125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 10.0, 21.0, 27.0, 44.0, 61.0, 74.0, 164.0, 252.0, 513.0, 1252.0, 4329.0, 27729.0, 492662.0, 3497188.0, 155050.0, 11823.0, 2050.0, 551.0, 218.0, 118.0, 71.0, 28.0, 22.0, 10.0, 13.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.375, -1.3432769775390625, -1.311553955078125, -1.2798309326171875, -1.24810791015625, -1.2163848876953125, -1.184661865234375, -1.1529388427734375, -1.1212158203125, -1.0894927978515625, -1.057769775390625, -1.0260467529296875, -0.99432373046875, -0.9626007080078125, -0.930877685546875, -0.8991546630859375, -0.867431640625, -0.8357086181640625, -0.803985595703125, -0.7722625732421875, -0.74053955078125, -0.7088165283203125, -0.677093505859375, -0.6453704833984375, -0.6136474609375, -0.5819244384765625, -0.550201416015625, -0.5184783935546875, -0.48675537109375, -0.4550323486328125, -0.423309326171875, -0.3915863037109375, -0.35986328125, -0.3281402587890625, -0.296417236328125, -0.2646942138671875, -0.23297119140625, -0.2012481689453125, -0.169525146484375, -0.1378021240234375, -0.1060791015625, -0.0743560791015625, -0.042633056640625, -0.0109100341796875, 0.02081298828125, 0.0525360107421875, 0.084259033203125, 0.1159820556640625, 0.147705078125, 0.1794281005859375, 0.211151123046875, 0.2428741455078125, 0.27459716796875, 0.3063201904296875, 0.338043212890625, 0.3697662353515625, 0.4014892578125, 0.4332122802734375, 0.464935302734375, 0.4966583251953125, 0.52838134765625, 0.5601043701171875, 0.591827392578125, 0.6235504150390625, 0.6552734375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 11.0, 10.0, 20.0, 24.0, 33.0, 59.0, 107.0, 154.0, 238.0, 440.0, 789.0, 857.0, 560.0, 336.0, 165.0, 105.0, 66.0, 37.0, 29.0, 8.0, 7.0, 10.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.4951171875, -1.4635009765625, -1.431884765625, -1.4002685546875, -1.36865234375, -1.3370361328125, -1.305419921875, -1.2738037109375, -1.2421875, -1.2105712890625, -1.178955078125, -1.1473388671875, -1.11572265625, -1.0841064453125, -1.052490234375, -1.0208740234375, -0.9892578125, -0.9576416015625, -0.926025390625, -0.8944091796875, -0.86279296875, -0.8311767578125, -0.799560546875, -0.7679443359375, -0.736328125, -0.7047119140625, -0.673095703125, -0.6414794921875, -0.60986328125, -0.5782470703125, -0.546630859375, -0.5150146484375, -0.4833984375, -0.4517822265625, -0.420166015625, -0.3885498046875, -0.35693359375, -0.3253173828125, -0.293701171875, -0.2620849609375, -0.23046875, -0.1988525390625, -0.167236328125, -0.1356201171875, -0.10400390625, -0.0723876953125, -0.040771484375, -0.0091552734375, 0.0224609375, 0.0540771484375, 0.085693359375, 0.1173095703125, 0.14892578125, 0.1805419921875, 0.212158203125, 0.2437744140625, 0.275390625, 0.3070068359375, 0.338623046875, 0.3702392578125, 0.40185546875, 0.4334716796875, 0.465087890625, 0.4967041015625, 0.5283203125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 5.0, 9.0, 8.0, 10.0, 34.0, 48.0, 107.0, 182.0, 211.0, 188.0, 95.0, 49.0, 15.0, 16.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.270851135253906, -7.964827537536621, -7.658803939819336, -7.352780342102051, -7.046756744384766, -6.7407331466674805, -6.4347100257873535, -6.128686428070068, -5.822662830352783, -5.516639232635498, -5.210615634918213, -4.904592037200928, -4.598568916320801, -4.292545318603516, -3.9865217208862305, -3.6804981231689453, -3.37447452545166, -3.068450927734375, -2.76242733001709, -2.456403970718384, -2.1503803730010986, -1.8443567752838135, -1.5383332967758179, -1.2323098182678223, -0.9262862205505371, -0.6202626824378967, -0.31423914432525635, -0.008215606212615967, 0.2978079319000244, 0.6038315296173096, 0.9098550081253052, 1.2158784866333008, 1.5219030380249023, 1.8279266357421875, 2.1339502334594727, 2.4399735927581787, 2.745997190475464, 3.052020788192749, 3.358044147491455, 3.6640677452087402, 3.9700913429260254, 4.2761149406433105, 4.582138538360596, 4.888162136077881, 5.194185256958008, 5.500208854675293, 5.806232452392578, 6.112256050109863, 6.418279647827148, 6.724303245544434, 7.030326843261719, 7.336350440979004, 7.642374038696289, 7.948397636413574, 8.25442123413086, 8.560443878173828, 8.86646842956543, 9.172492027282715, 9.478515625, 9.784539222717285, 10.09056282043457, 10.396586418151855, 10.70261001586914, 11.00863265991211, 11.314656257629395]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 7.0, 4.0, 13.0, 5.0, 13.0, 20.0, 21.0, 20.0, 29.0, 37.0, 44.0, 49.0, 48.0, 60.0, 51.0, 49.0, 57.0, 69.0, 62.0, 59.0, 52.0, 54.0, 42.0, 23.0, 23.0, 22.0, 21.0, 18.0, 9.0, 4.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3762922286987305, -6.173606872558594, -5.970921039581299, -5.768235683441162, -5.565550327301025, -5.3628644943237305, -5.160179138183594, -4.957493782043457, -4.75480842590332, -4.552123069763184, -4.349437236785889, -4.146751880645752, -3.9440665245056152, -3.7413809299468994, -3.5386953353881836, -3.336009979248047, -3.133324146270752, -2.930638551712036, -2.7279531955718994, -2.5252676010131836, -2.322582244873047, -2.119896650314331, -1.9172110557556152, -1.714525580406189, -1.5118401050567627, -1.3091546297073364, -1.1064691543579102, -0.9037835597991943, -0.7010980844497681, -0.4984126091003418, -0.295727014541626, -0.09304153919219971, 0.10964393615722656, 0.3123294413089752, 0.5150149464607239, 0.7177004814147949, 0.9203859567642212, 1.1230714321136475, 1.3257570266723633, 1.5284425020217896, 1.7311279773712158, 1.933813452720642, 2.1364989280700684, 2.339184522628784, 2.5418701171875, 2.7445554733276367, 2.9472410678863525, 3.1499266624450684, 3.352612018585205, 3.555297613143921, 3.7579829692840576, 3.9606685638427734, 4.16335391998291, 4.366039276123047, 4.568725109100342, 4.7714104652404785, 4.974096298217773, 5.17678165435791, 5.379467487335205, 5.582152843475342, 5.7848381996154785, 5.987524032592773, 6.19020938873291, 6.392894744873047, 6.595580101013184]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 10.0, 12.0, 9.0, 39.0, 58.0, 105.0, 237.0, 510.0, 1350.0, 4362.0, 17132.0, 89414.0, 464819.0, 381403.0, 69617.0, 13862.0, 3530.0, 1144.0, 481.0, 202.0, 108.0, 70.0, 29.0, 15.0, 9.0, 15.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70556640625, -0.6701583862304688, -0.6347503662109375, -0.5993423461914062, -0.563934326171875, -0.5285263061523438, -0.4931182861328125, -0.45771026611328125, -0.42230224609375, -0.38689422607421875, -0.3514862060546875, -0.31607818603515625, -0.280670166015625, -0.24526214599609375, -0.2098541259765625, -0.17444610595703125, -0.1390380859375, -0.10363006591796875, -0.0682220458984375, -0.03281402587890625, 0.002593994140625, 0.03800201416015625, 0.0734100341796875, 0.10881805419921875, 0.14422607421875, 0.17963409423828125, 0.2150421142578125, 0.25045013427734375, 0.285858154296875, 0.32126617431640625, 0.3566741943359375, 0.39208221435546875, 0.427490234375, 0.46289825439453125, 0.4983062744140625, 0.5337142944335938, 0.569122314453125, 0.6045303344726562, 0.6399383544921875, 0.6753463745117188, 0.71075439453125, 0.7461624145507812, 0.7815704345703125, 0.8169784545898438, 0.852386474609375, 0.8877944946289062, 0.9232025146484375, 0.9586105346679688, 0.9940185546875, 1.0294265747070312, 1.0648345947265625, 1.1002426147460938, 1.135650634765625, 1.1710586547851562, 1.2064666748046875, 1.2418746948242188, 1.27728271484375, 1.3126907348632812, 1.3480987548828125, 1.3835067749023438, 1.418914794921875, 1.4543228149414062, 1.4897308349609375, 1.5251388549804688, 1.560546875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 7.0, 6.0, 11.0, 11.0, 11.0, 22.0, 25.0, 23.0, 19.0, 42.0, 29.0, 45.0, 41.0, 37.0, 42.0, 47.0, 45.0, 64.0, 46.0, 52.0, 51.0, 46.0, 40.0, 36.0, 41.0, 29.0, 19.0, 18.0, 22.0, 16.0, 6.0, 11.0, 8.0, 4.0, 6.0, 2.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3330078125, -0.3242053985595703, -0.3154029846191406, -0.30660057067871094, -0.29779815673828125, -0.28899574279785156, -0.2801933288574219, -0.2713909149169922, -0.2625885009765625, -0.2537860870361328, -0.24498367309570312, -0.23618125915527344, -0.22737884521484375, -0.21857643127441406, -0.20977401733398438, -0.2009716033935547, -0.192169189453125, -0.1833667755126953, -0.17456436157226562, -0.16576194763183594, -0.15695953369140625, -0.14815711975097656, -0.13935470581054688, -0.1305522918701172, -0.1217498779296875, -0.11294746398925781, -0.10414505004882812, -0.09534263610839844, -0.08654022216796875, -0.07773780822753906, -0.06893539428710938, -0.06013298034667969, -0.05133056640625, -0.04252815246582031, -0.033725738525390625, -0.024923324584960938, -0.01612091064453125, -0.0073184967041015625, 0.001483917236328125, 0.010286331176757812, 0.0190887451171875, 0.027891159057617188, 0.036693572998046875, 0.04549598693847656, 0.05429840087890625, 0.06310081481933594, 0.07190322875976562, 0.08070564270019531, 0.089508056640625, 0.09831047058105469, 0.10711288452148438, 0.11591529846191406, 0.12471771240234375, 0.13352012634277344, 0.14232254028320312, 0.1511249542236328, 0.1599273681640625, 0.1687297821044922, 0.17753219604492188, 0.18633460998535156, 0.19513702392578125, 0.20393943786621094, 0.21274185180664062, 0.2215442657470703, 0.2303466796875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 5.0, 8.0, 7.0, 18.0, 17.0, 30.0, 56.0, 57.0, 94.0, 156.0, 261.0, 472.0, 889.0, 2066.0, 6603.0, 51060.0, 837141.0, 133541.0, 10775.0, 2746.0, 1126.0, 605.0, 278.0, 198.0, 116.0, 66.0, 48.0, 35.0, 27.0, 21.0, 6.0, 8.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0234375, -1.9614715576171875, -1.899505615234375, -1.8375396728515625, -1.77557373046875, -1.7136077880859375, -1.651641845703125, -1.5896759033203125, -1.5277099609375, -1.4657440185546875, -1.403778076171875, -1.3418121337890625, -1.27984619140625, -1.2178802490234375, -1.155914306640625, -1.0939483642578125, -1.031982421875, -0.9700164794921875, -0.908050537109375, -0.8460845947265625, -0.78411865234375, -0.7221527099609375, -0.660186767578125, -0.5982208251953125, -0.5362548828125, -0.4742889404296875, -0.412322998046875, -0.3503570556640625, -0.28839111328125, -0.2264251708984375, -0.164459228515625, -0.1024932861328125, -0.04052734375, 0.0214385986328125, 0.083404541015625, 0.1453704833984375, 0.20733642578125, 0.2693023681640625, 0.331268310546875, 0.3932342529296875, 0.4552001953125, 0.5171661376953125, 0.579132080078125, 0.6410980224609375, 0.70306396484375, 0.7650299072265625, 0.826995849609375, 0.8889617919921875, 0.950927734375, 1.0128936767578125, 1.074859619140625, 1.1368255615234375, 1.19879150390625, 1.2607574462890625, 1.322723388671875, 1.3846893310546875, 1.4466552734375, 1.5086212158203125, 1.570587158203125, 1.6325531005859375, 1.69451904296875, 1.7564849853515625, 1.818450927734375, 1.8804168701171875, 1.9423828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 8.0, 12.0, 7.0, 16.0, 22.0, 21.0, 20.0, 22.0, 36.0, 40.0, 41.0, 50.0, 52.0, 39.0, 45.0, 63.0, 51.0, 54.0, 54.0, 48.0, 44.0, 44.0, 46.0, 28.0, 30.0, 21.0, 20.0, 10.0, 8.0, 11.0, 8.0, 3.0, 5.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6904296875, -1.640380859375, -1.59033203125, -1.540283203125, -1.490234375, -1.440185546875, -1.39013671875, -1.340087890625, -1.2900390625, -1.239990234375, -1.18994140625, -1.139892578125, -1.08984375, -1.039794921875, -0.98974609375, -0.939697265625, -0.8896484375, -0.839599609375, -0.78955078125, -0.739501953125, -0.689453125, -0.639404296875, -0.58935546875, -0.539306640625, -0.4892578125, -0.439208984375, -0.38916015625, -0.339111328125, -0.2890625, -0.239013671875, -0.18896484375, -0.138916015625, -0.0888671875, -0.038818359375, 0.01123046875, 0.061279296875, 0.111328125, 0.161376953125, 0.21142578125, 0.261474609375, 0.3115234375, 0.361572265625, 0.41162109375, 0.461669921875, 0.51171875, 0.561767578125, 0.61181640625, 0.661865234375, 0.7119140625, 0.761962890625, 0.81201171875, 0.862060546875, 0.912109375, 0.962158203125, 1.01220703125, 1.062255859375, 1.1123046875, 1.162353515625, 1.21240234375, 1.262451171875, 1.3125, 1.362548828125, 1.41259765625, 1.462646484375, 1.5126953125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 6.0, 5.0, 5.0, 5.0, 8.0, 14.0, 32.0, 31.0, 62.0, 86.0, 164.0, 298.0, 847.0, 2742.0, 14499.0, 233415.0, 761224.0, 28790.0, 4145.0, 1165.0, 484.0, 230.0, 109.0, 68.0, 33.0, 34.0, 9.0, 8.0, 8.0, 8.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.97119140625, -0.9443283081054688, -0.9174652099609375, -0.8906021118164062, -0.863739013671875, -0.8368759155273438, -0.8100128173828125, -0.7831497192382812, -0.75628662109375, -0.7294235229492188, -0.7025604248046875, -0.6756973266601562, -0.648834228515625, -0.6219711303710938, -0.5951080322265625, -0.5682449340820312, -0.5413818359375, -0.5145187377929688, -0.4876556396484375, -0.46079254150390625, -0.433929443359375, -0.40706634521484375, -0.3802032470703125, -0.35334014892578125, -0.32647705078125, -0.29961395263671875, -0.2727508544921875, -0.24588775634765625, -0.219024658203125, -0.19216156005859375, -0.1652984619140625, -0.13843536376953125, -0.111572265625, -0.08470916748046875, -0.0578460693359375, -0.03098297119140625, -0.004119873046875, 0.02274322509765625, 0.0496063232421875, 0.07646942138671875, 0.10333251953125, 0.13019561767578125, 0.1570587158203125, 0.18392181396484375, 0.210784912109375, 0.23764801025390625, 0.2645111083984375, 0.29137420654296875, 0.3182373046875, 0.34510040283203125, 0.3719635009765625, 0.39882659912109375, 0.425689697265625, 0.45255279541015625, 0.4794158935546875, 0.5062789916992188, 0.53314208984375, 0.5600051879882812, 0.5868682861328125, 0.6137313842773438, 0.640594482421875, 0.6674575805664062, 0.6943206787109375, 0.7211837768554688, 0.748046875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 0.0, 3.0, 4.0, 12.0, 13.0, 7.0, 10.0, 9.0, 31.0, 31.0, 26.0, 29.0, 44.0, 58.0, 75.0, 148.0, 142.0, 87.0, 60.0, 48.0, 41.0, 28.0, 23.0, 21.0, 14.0, 9.0, 11.0, 9.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001354217529296875, -0.0001307651400566101, -0.00012610852718353271, -0.00012145191431045532, -0.00011679530143737793, -0.00011213868856430054, -0.00010748207569122314, -0.00010282546281814575, -9.816884994506836e-05, -9.351223707199097e-05, -8.885562419891357e-05, -8.419901132583618e-05, -7.954239845275879e-05, -7.48857855796814e-05, -7.0229172706604e-05, -6.557255983352661e-05, -6.091594696044922e-05, -5.6259334087371826e-05, -5.1602721214294434e-05, -4.694610834121704e-05, -4.228949546813965e-05, -3.7632882595062256e-05, -3.297626972198486e-05, -2.831965684890747e-05, -2.3663043975830078e-05, -1.9006431102752686e-05, -1.4349818229675293e-05, -9.6932053565979e-06, -5.036592483520508e-06, -3.7997961044311523e-07, 4.276633262634277e-06, 8.93324613571167e-06, 1.3589859008789062e-05, 1.8246471881866455e-05, 2.2903084754943848e-05, 2.755969762802124e-05, 3.221631050109863e-05, 3.6872923374176025e-05, 4.152953624725342e-05, 4.618614912033081e-05, 5.08427619934082e-05, 5.5499374866485596e-05, 6.015598773956299e-05, 6.481260061264038e-05, 6.946921348571777e-05, 7.412582635879517e-05, 7.878243923187256e-05, 8.343905210494995e-05, 8.809566497802734e-05, 9.275227785110474e-05, 9.740889072418213e-05, 0.00010206550359725952, 0.00010672211647033691, 0.0001113787293434143, 0.0001160353422164917, 0.00012069195508956909, 0.00012534856796264648, 0.00013000518083572388, 0.00013466179370880127, 0.00013931840658187866, 0.00014397501945495605, 0.00014863163232803345, 0.00015328824520111084, 0.00015794485807418823, 0.00016260147094726562]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 7.0, 5.0, 10.0, 10.0, 20.0, 23.0, 33.0, 43.0, 35.0, 58.0, 107.0, 165.0, 238.0, 441.0, 847.0, 1721.0, 4450.0, 14745.0, 85763.0, 811543.0, 103182.0, 16225.0, 4827.0, 1839.0, 893.0, 460.0, 278.0, 178.0, 110.0, 76.0, 63.0, 39.0, 31.0, 18.0, 9.0, 14.0, 11.0, 10.0, 9.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.65478515625, -0.6358261108398438, -0.6168670654296875, -0.5979080200195312, -0.578948974609375, -0.5599899291992188, -0.5410308837890625, -0.5220718383789062, -0.50311279296875, -0.48415374755859375, -0.4651947021484375, -0.44623565673828125, -0.427276611328125, -0.40831756591796875, -0.3893585205078125, -0.37039947509765625, -0.3514404296875, -0.33248138427734375, -0.3135223388671875, -0.29456329345703125, -0.275604248046875, -0.25664520263671875, -0.2376861572265625, -0.21872711181640625, -0.19976806640625, -0.18080902099609375, -0.1618499755859375, -0.14289093017578125, -0.123931884765625, -0.10497283935546875, -0.0860137939453125, -0.06705474853515625, -0.048095703125, -0.02913665771484375, -0.0101776123046875, 0.00878143310546875, 0.027740478515625, 0.04669952392578125, 0.0656585693359375, 0.08461761474609375, 0.10357666015625, 0.12253570556640625, 0.1414947509765625, 0.16045379638671875, 0.179412841796875, 0.19837188720703125, 0.2173309326171875, 0.23628997802734375, 0.2552490234375, 0.27420806884765625, 0.2931671142578125, 0.31212615966796875, 0.331085205078125, 0.35004425048828125, 0.3690032958984375, 0.38796234130859375, 0.40692138671875, 0.42588043212890625, 0.4448394775390625, 0.46379852294921875, 0.482757568359375, 0.5017166137695312, 0.5206756591796875, 0.5396347045898438, 0.55859375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 7.0, 4.0, 3.0, 5.0, 7.0, 11.0, 13.0, 25.0, 32.0, 40.0, 61.0, 80.0, 93.0, 138.0, 113.0, 73.0, 69.0, 52.0, 40.0, 39.0, 24.0, 17.0, 10.0, 13.0, 6.0, 1.0, 7.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51806640625, -0.49810791015625, -0.4781494140625, -0.45819091796875, -0.438232421875, -0.41827392578125, -0.3983154296875, -0.37835693359375, -0.3583984375, -0.33843994140625, -0.3184814453125, -0.29852294921875, -0.278564453125, -0.25860595703125, -0.2386474609375, -0.21868896484375, -0.19873046875, -0.17877197265625, -0.1588134765625, -0.13885498046875, -0.118896484375, -0.09893798828125, -0.0789794921875, -0.05902099609375, -0.0390625, -0.01910400390625, 0.0008544921875, 0.02081298828125, 0.040771484375, 0.06072998046875, 0.0806884765625, 0.10064697265625, 0.12060546875, 0.14056396484375, 0.1605224609375, 0.18048095703125, 0.200439453125, 0.22039794921875, 0.2403564453125, 0.26031494140625, 0.2802734375, 0.30023193359375, 0.3201904296875, 0.34014892578125, 0.360107421875, 0.38006591796875, 0.4000244140625, 0.41998291015625, 0.43994140625, 0.45989990234375, 0.4798583984375, 0.49981689453125, 0.519775390625, 0.53973388671875, 0.5596923828125, 0.57965087890625, 0.599609375, 0.61956787109375, 0.6395263671875, 0.65948486328125, 0.679443359375, 0.69940185546875, 0.7193603515625, 0.73931884765625, 0.75927734375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 7.0, 14.0, 15.0, 35.0, 73.0, 126.0, 197.0, 203.0, 145.0, 83.0, 40.0, 19.0, 9.0, 8.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-10.508768081665039, -10.209827423095703, -9.910886764526367, -9.611946105957031, -9.313005447387695, -9.01406478881836, -8.715124130249023, -8.416183471679688, -8.117242813110352, -7.818302154541016, -7.51936149597168, -7.220420837402344, -6.921480178833008, -6.622539520263672, -6.323598384857178, -6.024657726287842, -5.725716590881348, -5.426775932312012, -5.127835273742676, -4.82889461517334, -4.529953956604004, -4.231013298034668, -3.932072162628174, -3.633131504058838, -3.334190845489502, -3.035250186920166, -2.73630952835083, -2.437368631362915, -2.138427972793579, -1.8394873142242432, -1.5405465364456177, -1.2416057586669922, -0.9426660537719727, -0.6437253355979919, -0.34478461742401123, -0.04584389925003052, 0.2530968189239502, 0.5520374774932861, 0.8509782552719116, 1.149919033050537, 1.448859691619873, 1.747800350189209, 2.046741008758545, 2.34568190574646, 2.644622564315796, 2.943563222885132, 3.242504119873047, 3.541444778442383, 3.8403854370117188, 4.139326095581055, 4.438266754150391, 4.737207412719727, 5.0361480712890625, 5.335088729858398, 5.634029865264893, 5.9329705238342285, 6.2319111824035645, 6.5308518409729, 6.829792499542236, 7.128733158111572, 7.427674293518066, 7.726614952087402, 8.025555610656738, 8.324496269226074, 8.62343692779541]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 13.0, 8.0, 5.0, 21.0, 11.0, 9.0, 8.0, 27.0, 18.0, 23.0, 24.0, 20.0, 31.0, 38.0, 36.0, 44.0, 49.0, 66.0, 43.0, 57.0, 51.0, 48.0, 38.0, 31.0, 31.0, 34.0, 24.0, 29.0, 20.0, 17.0, 12.0, 26.0, 18.0, 15.0, 8.0, 10.0, 5.0, 5.0, 5.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0], "bins": [-6.334390640258789, -6.159178256988525, -5.983965873718262, -5.808753967285156, -5.633541584014893, -5.458329200744629, -5.283117294311523, -5.10790491104126, -4.932692527770996, -4.757480144500732, -4.582267761230469, -4.407055854797363, -4.2318434715271, -4.056631088256836, -3.8814189434051514, -3.706206798553467, -3.530994415283203, -3.3557820320129395, -3.180569887161255, -3.0053577423095703, -2.8301453590393066, -2.654932975769043, -2.4797208309173584, -2.304508686065674, -2.12929630279541, -1.954084038734436, -1.778871774673462, -1.6036595106124878, -1.4284472465515137, -1.2532349824905396, -1.0780227184295654, -0.9028104543685913, -0.7275986671447754, -0.5523864030838013, -0.37717413902282715, -0.20196187496185303, -0.026749610900878906, 0.14846265316009521, 0.32367491722106934, 0.49888718128204346, 0.6740994453430176, 0.8493117094039917, 1.0245239734649658, 1.19973623752594, 1.374948501586914, 1.5501607656478882, 1.7253730297088623, 1.9005852937698364, 2.0757975578308105, 2.251009941101074, 2.426222085952759, 2.6014342308044434, 2.776646614074707, 2.9518589973449707, 3.1270711421966553, 3.30228328704834, 3.4774956703186035, 3.652708053588867, 3.8279201984405518, 4.003132343292236, 4.1783447265625, 4.353557109832764, 4.528769493103027, 4.703981399536133, 4.8791937828063965]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 7.0, 11.0, 12.0, 16.0, 32.0, 45.0, 52.0, 74.0, 148.0, 287.0, 506.0, 1036.0, 2584.0, 8136.0, 37478.0, 417761.0, 3380144.0, 302943.0, 31592.0, 7212.0, 2264.0, 934.0, 469.0, 213.0, 112.0, 83.0, 49.0, 27.0, 20.0, 7.0, 10.0, 2.0, 7.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.75244140625, -0.7317962646484375, -0.711151123046875, -0.6905059814453125, -0.66986083984375, -0.6492156982421875, -0.628570556640625, -0.6079254150390625, -0.5872802734375, -0.5666351318359375, -0.545989990234375, -0.5253448486328125, -0.50469970703125, -0.4840545654296875, -0.463409423828125, -0.4427642822265625, -0.422119140625, -0.4014739990234375, -0.380828857421875, -0.3601837158203125, -0.33953857421875, -0.3188934326171875, -0.298248291015625, -0.2776031494140625, -0.2569580078125, -0.2363128662109375, -0.215667724609375, -0.1950225830078125, -0.17437744140625, -0.1537322998046875, -0.133087158203125, -0.1124420166015625, -0.091796875, -0.0711517333984375, -0.050506591796875, -0.0298614501953125, -0.00921630859375, 0.0114288330078125, 0.032073974609375, 0.0527191162109375, 0.0733642578125, 0.0940093994140625, 0.114654541015625, 0.1352996826171875, 0.15594482421875, 0.1765899658203125, 0.197235107421875, 0.2178802490234375, 0.238525390625, 0.2591705322265625, 0.279815673828125, 0.3004608154296875, 0.32110595703125, 0.3417510986328125, 0.362396240234375, 0.3830413818359375, 0.4036865234375, 0.4243316650390625, 0.444976806640625, 0.4656219482421875, 0.48626708984375, 0.5069122314453125, 0.527557373046875, 0.5482025146484375, 0.56884765625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 8.0, 6.0, 6.0, 11.0, 11.0, 14.0, 16.0, 17.0, 26.0, 43.0, 35.0, 36.0, 52.0, 58.0, 38.0, 56.0, 67.0, 49.0, 57.0, 60.0, 46.0, 46.0, 49.0, 41.0, 33.0, 32.0, 23.0, 14.0, 13.0, 14.0, 7.0, 7.0, 5.0, 3.0, 8.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.404296875, -0.39418983459472656, -0.3840827941894531, -0.3739757537841797, -0.36386871337890625, -0.3537616729736328, -0.3436546325683594, -0.33354759216308594, -0.3234405517578125, -0.31333351135253906, -0.3032264709472656, -0.2931194305419922, -0.28301239013671875, -0.2729053497314453, -0.2627983093261719, -0.25269126892089844, -0.242584228515625, -0.23247718811035156, -0.22237014770507812, -0.2122631072998047, -0.20215606689453125, -0.1920490264892578, -0.18194198608398438, -0.17183494567871094, -0.1617279052734375, -0.15162086486816406, -0.14151382446289062, -0.1314067840576172, -0.12129974365234375, -0.11119270324707031, -0.10108566284179688, -0.09097862243652344, -0.08087158203125, -0.07076454162597656, -0.060657501220703125, -0.05055046081542969, -0.04044342041015625, -0.030336380004882812, -0.020229339599609375, -0.010122299194335938, -1.52587890625e-05, 0.010091781616210938, 0.020198822021484375, 0.030305862426757812, 0.04041290283203125, 0.05051994323730469, 0.060626983642578125, 0.07073402404785156, 0.080841064453125, 0.09094810485839844, 0.10105514526367188, 0.11116218566894531, 0.12126922607421875, 0.1313762664794922, 0.14148330688476562, 0.15159034729003906, 0.1616973876953125, 0.17180442810058594, 0.18191146850585938, 0.1920185089111328, 0.20212554931640625, 0.2122325897216797, 0.22233963012695312, 0.23244667053222656, 0.2425537109375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 11.0, 24.0, 37.0, 33.0, 75.0, 95.0, 111.0, 180.0, 209.0, 328.0, 1026.0, 10824.0, 4038097.0, 140462.0, 2040.0, 349.0, 151.0, 75.0, 53.0, 55.0, 24.0, 11.0, 8.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.3125, -3.2331390380859375, -3.153778076171875, -3.0744171142578125, -2.99505615234375, -2.9156951904296875, -2.836334228515625, -2.7569732666015625, -2.6776123046875, -2.5982513427734375, -2.518890380859375, -2.4395294189453125, -2.36016845703125, -2.2808074951171875, -2.201446533203125, -2.1220855712890625, -2.042724609375, -1.9633636474609375, -1.884002685546875, -1.8046417236328125, -1.72528076171875, -1.6459197998046875, -1.566558837890625, -1.4871978759765625, -1.4078369140625, -1.3284759521484375, -1.249114990234375, -1.1697540283203125, -1.09039306640625, -1.0110321044921875, -0.931671142578125, -0.8523101806640625, -0.77294921875, -0.6935882568359375, -0.614227294921875, -0.5348663330078125, -0.45550537109375, -0.3761444091796875, -0.296783447265625, -0.2174224853515625, -0.1380615234375, -0.0587005615234375, 0.020660400390625, 0.1000213623046875, 0.17938232421875, 0.2587432861328125, 0.338104248046875, 0.4174652099609375, 0.496826171875, 0.5761871337890625, 0.655548095703125, 0.7349090576171875, 0.81427001953125, 0.8936309814453125, 0.972991943359375, 1.0523529052734375, 1.1317138671875, 1.2110748291015625, 1.290435791015625, 1.3697967529296875, 1.44915771484375, 1.5285186767578125, 1.607879638671875, 1.6872406005859375, 1.7666015625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 9.0, 14.0, 29.0, 116.0, 274.0, 1130.0, 1798.0, 498.0, 141.0, 47.0, 14.0, 8.0, 4.0, 1.0, 2.0, 1.0], "bins": [-3.560546875, -3.4948577880859375, -3.429168701171875, -3.3634796142578125, -3.29779052734375, -3.2321014404296875, -3.166412353515625, -3.1007232666015625, -3.0350341796875, -2.9693450927734375, -2.903656005859375, -2.8379669189453125, -2.77227783203125, -2.7065887451171875, -2.640899658203125, -2.5752105712890625, -2.509521484375, -2.4438323974609375, -2.378143310546875, -2.3124542236328125, -2.24676513671875, -2.1810760498046875, -2.115386962890625, -2.0496978759765625, -1.9840087890625, -1.9183197021484375, -1.852630615234375, -1.7869415283203125, -1.72125244140625, -1.6555633544921875, -1.589874267578125, -1.5241851806640625, -1.45849609375, -1.3928070068359375, -1.327117919921875, -1.2614288330078125, -1.19573974609375, -1.1300506591796875, -1.064361572265625, -0.9986724853515625, -0.9329833984375, -0.8672943115234375, -0.801605224609375, -0.7359161376953125, -0.67022705078125, -0.6045379638671875, -0.538848876953125, -0.4731597900390625, -0.407470703125, -0.3417816162109375, -0.276092529296875, -0.2104034423828125, -0.14471435546875, -0.0790252685546875, -0.013336181640625, 0.0523529052734375, 0.1180419921875, 0.1837310791015625, 0.249420166015625, 0.3151092529296875, 0.38079833984375, 0.4464874267578125, 0.512176513671875, 0.5778656005859375, 0.6435546875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 14.0, 24.0, 49.0, 87.0, 171.0, 316.0, 196.0, 78.0, 23.0, 17.0, 6.0, 1.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.600770950317383, -13.183714866638184, -12.7666597366333, -12.349603652954102, -11.932547569274902, -11.515491485595703, -11.09843635559082, -10.681380271911621, -10.264324188232422, -9.847268104553223, -9.43021297454834, -9.01315689086914, -8.596100807189941, -8.179044723510742, -7.761989593505859, -7.34493350982666, -6.927878379821777, -6.510822772979736, -6.093766689300537, -5.676711082458496, -5.259654998779297, -4.842599391937256, -4.425543785095215, -4.008487701416016, -3.5914320945739746, -3.1743762493133545, -2.7573204040527344, -2.3402647972106934, -1.9232089519500732, -1.5061531066894531, -1.089097499847412, -0.672041654586792, -0.2549858093261719, 0.16206997632980347, 0.5791257619857788, 0.9961814880371094, 1.4132373332977295, 1.8302931785583496, 2.2473487854003906, 2.6644046306610107, 3.081460475921631, 3.498516321182251, 3.915572166442871, 4.332627773284912, 4.749683380126953, 5.166739463806152, 5.583795070648193, 6.000850677490234, 6.417906761169434, 6.834962368011475, 7.252018451690674, 7.669074058532715, 8.086130142211914, 8.503185272216797, 8.920241355895996, 9.337297439575195, 9.754352569580078, 10.171408653259277, 10.58846378326416, 11.00551986694336, 11.422575950622559, 11.839632034301758, 12.25668716430664, 12.67374324798584, 13.090799331665039]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 2.0, 4.0, 8.0, 6.0, 10.0, 7.0, 17.0, 19.0, 18.0, 22.0, 31.0, 34.0, 36.0, 44.0, 57.0, 54.0, 69.0, 71.0, 58.0, 51.0, 43.0, 46.0, 46.0, 44.0, 28.0, 27.0, 42.0, 20.0, 13.0, 18.0, 14.0, 8.0, 9.0, 6.0, 5.0, 4.0, 1.0, 4.0, 4.0, 0.0, 0.0, 2.0, 2.0], "bins": [-7.489697456359863, -7.2925801277160645, -7.095462799072266, -6.898344993591309, -6.70122766494751, -6.504110336303711, -6.306993007659912, -6.109875679016113, -5.912757873535156, -5.715640544891357, -5.518523216247559, -5.321405410766602, -5.124288082122803, -4.927170753479004, -4.730053424835205, -4.532936096191406, -4.335818767547607, -4.138701438903809, -3.9415838718414307, -3.744466543197632, -3.547348976135254, -3.350231647491455, -3.1531143188476562, -2.9559969902038574, -2.7588794231414795, -2.5617620944976807, -2.3646445274353027, -2.167527198791504, -1.9704097509384155, -1.7732923030853271, -1.5761749744415283, -1.37905752658844, -1.1819405555725098, -0.9848231077194214, -0.7877057194709778, -0.5905883312225342, -0.3934708833694458, -0.19635343551635742, 0.0007638931274414062, 0.19788134098052979, 0.39499878883361816, 0.5921162366867065, 0.7892336249351501, 0.9863510131835938, 1.1834684610366821, 1.3805859088897705, 1.5777032375335693, 1.7748206853866577, 1.971938133239746, 2.169055461883545, 2.366173028945923, 2.5632903575897217, 2.7604079246520996, 2.9575252532958984, 3.1546425819396973, 3.351759910583496, 3.548877477645874, 3.745994806289673, 3.943112373352051, 4.14022970199585, 4.337347030639648, 4.5344648361206055, 4.731581687927246, 4.928699493408203, 5.125816822052002]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 6.0, 7.0, 12.0, 19.0, 23.0, 29.0, 43.0, 61.0, 142.0, 246.0, 380.0, 788.0, 1743.0, 4388.0, 12962.0, 51212.0, 272822.0, 544561.0, 119873.0, 26431.0, 7518.0, 2755.0, 1251.0, 557.0, 275.0, 171.0, 97.0, 57.0, 39.0, 23.0, 15.0, 14.0, 10.0, 8.0, 7.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79443359375, -0.7616958618164062, -0.7289581298828125, -0.6962203979492188, -0.663482666015625, -0.6307449340820312, -0.5980072021484375, -0.5652694702148438, -0.53253173828125, -0.49979400634765625, -0.4670562744140625, -0.43431854248046875, -0.401580810546875, -0.36884307861328125, -0.3361053466796875, -0.30336761474609375, -0.2706298828125, -0.23789215087890625, -0.2051544189453125, -0.17241668701171875, -0.139678955078125, -0.10694122314453125, -0.0742034912109375, -0.04146575927734375, -0.00872802734375, 0.02400970458984375, 0.0567474365234375, 0.08948516845703125, 0.122222900390625, 0.15496063232421875, 0.1876983642578125, 0.22043609619140625, 0.253173828125, 0.28591156005859375, 0.3186492919921875, 0.35138702392578125, 0.384124755859375, 0.41686248779296875, 0.4496002197265625, 0.48233795166015625, 0.51507568359375, 0.5478134155273438, 0.5805511474609375, 0.6132888793945312, 0.646026611328125, 0.6787643432617188, 0.7115020751953125, 0.7442398071289062, 0.7769775390625, 0.8097152709960938, 0.8424530029296875, 0.8751907348632812, 0.907928466796875, 0.9406661987304688, 0.9734039306640625, 1.0061416625976562, 1.03887939453125, 1.0716171264648438, 1.1043548583984375, 1.1370925903320312, 1.169830322265625, 1.2025680541992188, 1.2353057861328125, 1.2680435180664062, 1.30078125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 8.0, 9.0, 2.0, 10.0, 15.0, 7.0, 20.0, 34.0, 37.0, 38.0, 52.0, 63.0, 68.0, 65.0, 58.0, 56.0, 77.0, 45.0, 58.0, 48.0, 47.0, 46.0, 29.0, 23.0, 25.0, 17.0, 17.0, 5.0, 10.0, 4.0, 3.0, 0.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.51416015625, -0.5016937255859375, -0.489227294921875, -0.4767608642578125, -0.46429443359375, -0.4518280029296875, -0.439361572265625, -0.4268951416015625, -0.4144287109375, -0.4019622802734375, -0.389495849609375, -0.3770294189453125, -0.36456298828125, -0.3520965576171875, -0.339630126953125, -0.3271636962890625, -0.314697265625, -0.3022308349609375, -0.289764404296875, -0.2772979736328125, -0.26483154296875, -0.2523651123046875, -0.239898681640625, -0.2274322509765625, -0.2149658203125, -0.2024993896484375, -0.190032958984375, -0.1775665283203125, -0.16510009765625, -0.1526336669921875, -0.140167236328125, -0.1277008056640625, -0.115234375, -0.1027679443359375, -0.090301513671875, -0.0778350830078125, -0.06536865234375, -0.0529022216796875, -0.040435791015625, -0.0279693603515625, -0.0155029296875, -0.0030364990234375, 0.009429931640625, 0.0218963623046875, 0.03436279296875, 0.0468292236328125, 0.059295654296875, 0.0717620849609375, 0.084228515625, 0.0966949462890625, 0.109161376953125, 0.1216278076171875, 0.13409423828125, 0.1465606689453125, 0.159027099609375, 0.1714935302734375, 0.1839599609375, 0.1964263916015625, 0.208892822265625, 0.2213592529296875, 0.23382568359375, 0.2462921142578125, 0.258758544921875, 0.2712249755859375, 0.28369140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 6.0, 6.0, 12.0, 12.0, 19.0, 27.0, 44.0, 60.0, 98.0, 176.0, 366.0, 793.0, 2147.0, 11123.0, 288690.0, 722398.0, 17685.0, 2941.0, 946.0, 428.0, 226.0, 131.0, 67.0, 50.0, 29.0, 24.0, 16.0, 9.0, 6.0, 5.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.845703125, -2.762237548828125, -2.67877197265625, -2.595306396484375, -2.5118408203125, -2.428375244140625, -2.34490966796875, -2.261444091796875, -2.177978515625, -2.094512939453125, -2.01104736328125, -1.927581787109375, -1.8441162109375, -1.760650634765625, -1.67718505859375, -1.593719482421875, -1.51025390625, -1.426788330078125, -1.34332275390625, -1.259857177734375, -1.1763916015625, -1.092926025390625, -1.00946044921875, -0.925994873046875, -0.842529296875, -0.759063720703125, -0.67559814453125, -0.592132568359375, -0.5086669921875, -0.425201416015625, -0.34173583984375, -0.258270263671875, -0.1748046875, -0.091339111328125, -0.00787353515625, 0.075592041015625, 0.1590576171875, 0.242523193359375, 0.32598876953125, 0.409454345703125, 0.492919921875, 0.576385498046875, 0.65985107421875, 0.743316650390625, 0.8267822265625, 0.910247802734375, 0.99371337890625, 1.077178955078125, 1.16064453125, 1.244110107421875, 1.32757568359375, 1.411041259765625, 1.4945068359375, 1.577972412109375, 1.66143798828125, 1.744903564453125, 1.828369140625, 1.911834716796875, 1.99530029296875, 2.078765869140625, 2.1622314453125, 2.245697021484375, 2.32916259765625, 2.412628173828125, 2.49609375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 9.0, 7.0, 5.0, 6.0, 19.0, 18.0, 34.0, 35.0, 38.0, 44.0, 48.0, 57.0, 68.0, 54.0, 53.0, 81.0, 63.0, 62.0, 53.0, 53.0, 36.0, 44.0, 27.0, 24.0, 13.0, 15.0, 12.0, 5.0, 4.0, 6.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1484375, -2.0902252197265625, -2.032012939453125, -1.9738006591796875, -1.91558837890625, -1.8573760986328125, -1.799163818359375, -1.7409515380859375, -1.6827392578125, -1.6245269775390625, -1.566314697265625, -1.5081024169921875, -1.44989013671875, -1.3916778564453125, -1.333465576171875, -1.2752532958984375, -1.217041015625, -1.1588287353515625, -1.100616455078125, -1.0424041748046875, -0.98419189453125, -0.9259796142578125, -0.867767333984375, -0.8095550537109375, -0.7513427734375, -0.6931304931640625, -0.634918212890625, -0.5767059326171875, -0.51849365234375, -0.4602813720703125, -0.402069091796875, -0.3438568115234375, -0.28564453125, -0.2274322509765625, -0.169219970703125, -0.1110076904296875, -0.05279541015625, 0.0054168701171875, 0.063629150390625, 0.1218414306640625, 0.1800537109375, 0.2382659912109375, 0.296478271484375, 0.3546905517578125, 0.41290283203125, 0.4711151123046875, 0.529327392578125, 0.5875396728515625, 0.645751953125, 0.7039642333984375, 0.762176513671875, 0.8203887939453125, 0.87860107421875, 0.9368133544921875, 0.995025634765625, 1.0532379150390625, 1.1114501953125, 1.1696624755859375, 1.227874755859375, 1.2860870361328125, 1.34429931640625, 1.4025115966796875, 1.460723876953125, 1.5189361572265625, 1.5771484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 7.0, 2.0, 5.0, 11.0, 10.0, 18.0, 34.0, 72.0, 141.0, 377.0, 1180.0, 7855.0, 267899.0, 756966.0, 11686.0, 1535.0, 403.0, 156.0, 83.0, 43.0, 29.0, 17.0, 6.0, 4.0, 9.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3427734375, -1.2995758056640625, -1.256378173828125, -1.2131805419921875, -1.16998291015625, -1.1267852783203125, -1.083587646484375, -1.0403900146484375, -0.9971923828125, -0.9539947509765625, -0.910797119140625, -0.8675994873046875, -0.82440185546875, -0.7812042236328125, -0.738006591796875, -0.6948089599609375, -0.651611328125, -0.6084136962890625, -0.565216064453125, -0.5220184326171875, -0.47882080078125, -0.4356231689453125, -0.392425537109375, -0.3492279052734375, -0.3060302734375, -0.2628326416015625, -0.219635009765625, -0.1764373779296875, -0.13323974609375, -0.0900421142578125, -0.046844482421875, -0.0036468505859375, 0.03955078125, 0.0827484130859375, 0.125946044921875, 0.1691436767578125, 0.21234130859375, 0.2555389404296875, 0.298736572265625, 0.3419342041015625, 0.3851318359375, 0.4283294677734375, 0.471527099609375, 0.5147247314453125, 0.55792236328125, 0.6011199951171875, 0.644317626953125, 0.6875152587890625, 0.730712890625, 0.7739105224609375, 0.817108154296875, 0.8603057861328125, 0.90350341796875, 0.9467010498046875, 0.989898681640625, 1.0330963134765625, 1.0762939453125, 1.1194915771484375, 1.162689208984375, 1.2058868408203125, 1.24908447265625, 1.2922821044921875, 1.335479736328125, 1.3786773681640625, 1.421875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 5.0, 7.0, 19.0, 12.0, 19.0, 28.0, 25.0, 40.0, 55.0, 87.0, 143.0, 159.0, 124.0, 58.0, 51.0, 40.0, 21.0, 20.0, 10.0, 9.0, 11.0, 8.0, 10.0, 5.0, 4.0, 3.0, 7.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.00019502639770507812, -0.0001905187964439392, -0.0001860111951828003, -0.00018150359392166138, -0.00017699599266052246, -0.00017248839139938354, -0.00016798079013824463, -0.0001634731888771057, -0.0001589655876159668, -0.00015445798635482788, -0.00014995038509368896, -0.00014544278383255005, -0.00014093518257141113, -0.00013642758131027222, -0.0001319199800491333, -0.00012741237878799438, -0.00012290477752685547, -0.00011839717626571655, -0.00011388957500457764, -0.00010938197374343872, -0.0001048743724822998, -0.00010036677122116089, -9.585916996002197e-05, -9.135156869888306e-05, -8.684396743774414e-05, -8.233636617660522e-05, -7.782876491546631e-05, -7.332116365432739e-05, -6.881356239318848e-05, -6.430596113204956e-05, -5.9798359870910645e-05, -5.529075860977173e-05, -5.078315734863281e-05, -4.6275556087493896e-05, -4.176795482635498e-05, -3.7260353565216064e-05, -3.275275230407715e-05, -2.8245151042938232e-05, -2.3737549781799316e-05, -1.92299485206604e-05, -1.4722347259521484e-05, -1.0214745998382568e-05, -5.707144737243652e-06, -1.1995434761047363e-06, 3.3080577850341797e-06, 7.815659046173096e-06, 1.2323260307312012e-05, 1.6830861568450928e-05, 2.1338462829589844e-05, 2.584606409072876e-05, 3.0353665351867676e-05, 3.486126661300659e-05, 3.936886787414551e-05, 4.3876469135284424e-05, 4.838407039642334e-05, 5.2891671657562256e-05, 5.739927291870117e-05, 6.190687417984009e-05, 6.6414475440979e-05, 7.092207670211792e-05, 7.542967796325684e-05, 7.993727922439575e-05, 8.444488048553467e-05, 8.895248174667358e-05, 9.34600830078125e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 7.0, 14.0, 20.0, 26.0, 39.0, 57.0, 85.0, 128.0, 252.0, 435.0, 1062.0, 2783.0, 9675.0, 64024.0, 865281.0, 88155.0, 11074.0, 3157.0, 1197.0, 464.0, 243.0, 137.0, 74.0, 57.0, 34.0, 22.0, 15.0, 9.0, 6.0, 2.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7109375, -0.6868820190429688, -0.6628265380859375, -0.6387710571289062, -0.614715576171875, -0.5906600952148438, -0.5666046142578125, -0.5425491333007812, -0.51849365234375, -0.49443817138671875, -0.4703826904296875, -0.44632720947265625, -0.422271728515625, -0.39821624755859375, -0.3741607666015625, -0.35010528564453125, -0.3260498046875, -0.30199432373046875, -0.2779388427734375, -0.25388336181640625, -0.229827880859375, -0.20577239990234375, -0.1817169189453125, -0.15766143798828125, -0.13360595703125, -0.10955047607421875, -0.0854949951171875, -0.06143951416015625, -0.037384033203125, -0.01332855224609375, 0.0107269287109375, 0.03478240966796875, 0.058837890625, 0.08289337158203125, 0.1069488525390625, 0.13100433349609375, 0.155059814453125, 0.17911529541015625, 0.2031707763671875, 0.22722625732421875, 0.25128173828125, 0.27533721923828125, 0.2993927001953125, 0.32344818115234375, 0.347503662109375, 0.37155914306640625, 0.3956146240234375, 0.41967010498046875, 0.4437255859375, 0.46778106689453125, 0.4918365478515625, 0.5158920288085938, 0.539947509765625, 0.5640029907226562, 0.5880584716796875, 0.6121139526367188, 0.63616943359375, 0.6602249145507812, 0.6842803955078125, 0.7083358764648438, 0.732391357421875, 0.7564468383789062, 0.7805023193359375, 0.8045578002929688, 0.82861328125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 3.0, 6.0, 3.0, 6.0, 5.0, 13.0, 21.0, 28.0, 41.0, 46.0, 101.0, 130.0, 137.0, 155.0, 92.0, 63.0, 45.0, 23.0, 25.0, 17.0, 6.0, 4.0, 7.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7392578125, -0.7179718017578125, -0.696685791015625, -0.6753997802734375, -0.65411376953125, -0.6328277587890625, -0.611541748046875, -0.5902557373046875, -0.5689697265625, -0.5476837158203125, -0.526397705078125, -0.5051116943359375, -0.48382568359375, -0.4625396728515625, -0.441253662109375, -0.4199676513671875, -0.398681640625, -0.3773956298828125, -0.356109619140625, -0.3348236083984375, -0.31353759765625, -0.2922515869140625, -0.270965576171875, -0.2496795654296875, -0.2283935546875, -0.2071075439453125, -0.185821533203125, -0.1645355224609375, -0.14324951171875, -0.1219635009765625, -0.100677490234375, -0.0793914794921875, -0.05810546875, -0.0368194580078125, -0.015533447265625, 0.0057525634765625, 0.02703857421875, 0.0483245849609375, 0.069610595703125, 0.0908966064453125, 0.1121826171875, 0.1334686279296875, 0.154754638671875, 0.1760406494140625, 0.19732666015625, 0.2186126708984375, 0.239898681640625, 0.2611846923828125, 0.282470703125, 0.3037567138671875, 0.325042724609375, 0.3463287353515625, 0.36761474609375, 0.3889007568359375, 0.410186767578125, 0.4314727783203125, 0.4527587890625, 0.4740447998046875, 0.495330810546875, 0.5166168212890625, 0.53790283203125, 0.5591888427734375, 0.580474853515625, 0.6017608642578125, 0.623046875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 9.0, 16.0, 17.0, 64.0, 136.0, 275.0, 251.0, 138.0, 42.0, 22.0, 11.0, 6.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.772589683532715, -13.339581489562988, -12.906572341918945, -12.473564147949219, -12.040555953979492, -11.60754680633545, -11.174538612365723, -10.74152946472168, -10.308521270751953, -9.875513076782227, -9.442503929138184, -9.009495735168457, -8.57648754119873, -8.143478393554688, -7.710470199584961, -7.277461528778076, -6.84445333480835, -6.411444664001465, -5.978436470031738, -5.5454277992248535, -5.112419128417969, -4.679410934448242, -4.246402263641357, -3.8133935928344727, -3.380385160446167, -2.9473767280578613, -2.5143680572509766, -2.081359624862671, -1.6483510732650757, -1.2153425216674805, -0.7823340892791748, -0.34932541847229004, 0.08368301391601562, 0.5166915655136108, 0.9497000575065613, 1.3827085494995117, 1.815717101097107, 2.248725652694702, 2.681734085083008, 3.1147427558898926, 3.5477511882781982, 3.980759620666504, 4.413768291473389, 4.846776962280273, 5.27978515625, 5.712793827056885, 6.1458024978637695, 6.578810691833496, 7.011819362640381, 7.444828033447266, 7.877836227416992, 8.310844421386719, 8.743853569030762, 9.176861763000488, 9.609870910644531, 10.042879104614258, 10.475887298583984, 10.908895492553711, 11.341904640197754, 11.77491283416748, 12.207921028137207, 12.64093017578125, 13.073938369750977, 13.506946563720703, 13.939955711364746]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 9.0, 5.0, 6.0, 8.0, 9.0, 13.0, 14.0, 18.0, 21.0, 26.0, 24.0, 24.0, 35.0, 35.0, 43.0, 51.0, 61.0, 57.0, 67.0, 60.0, 63.0, 56.0, 34.0, 31.0, 39.0, 25.0, 20.0, 17.0, 24.0, 27.0, 21.0, 14.0, 11.0, 7.0, 8.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.163899898529053, -6.953677654266357, -6.743455410003662, -6.533233165740967, -6.323010444641113, -6.112788200378418, -5.902565956115723, -5.692343711853027, -5.482121467590332, -5.271899223327637, -5.061676979064941, -4.851454734802246, -4.641232490539551, -4.4310102462768555, -4.220787525177002, -4.010565280914307, -3.8003430366516113, -3.590120792388916, -3.3798985481262207, -3.1696760654449463, -2.959453821182251, -2.7492315769195557, -2.5390090942382812, -2.328786849975586, -2.1185646057128906, -1.9083423614501953, -1.6981199979782104, -1.4878976345062256, -1.2776753902435303, -1.067453145980835, -0.8572307825088501, -0.6470084190368652, -0.4367856979370117, -0.22656339406967163, -0.016341090202331543, 0.19388121366500854, 0.40410351753234863, 0.614325761795044, 0.8245481252670288, 1.0347704887390137, 1.244992733001709, 1.4552149772644043, 1.6654373407363892, 1.875659704208374, 2.0858819484710693, 2.2961041927337646, 2.506326675415039, 2.7165489196777344, 2.9267711639404297, 3.136993408203125, 3.3472156524658203, 3.5574381351470947, 3.76766037940979, 3.9778826236724854, 4.18810510635376, 4.398327350616455, 4.60854959487915, 4.818771839141846, 5.028994083404541, 5.239216327667236, 5.44943904876709, 5.659661293029785, 5.8698835372924805, 6.080105781555176, 6.290328025817871]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 6.0, 8.0, 10.0, 16.0, 27.0, 36.0, 55.0, 78.0, 121.0, 206.0, 384.0, 680.0, 1525.0, 4489.0, 21623.0, 415345.0, 3628384.0, 104875.0, 11297.0, 2796.0, 982.0, 503.0, 282.0, 160.0, 110.0, 65.0, 46.0, 45.0, 29.0, 16.0, 16.0, 11.0, 8.0, 7.0, 7.0, 7.0, 2.0, 7.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0], "bins": [-0.85986328125, -0.8340530395507812, -0.8082427978515625, -0.7824325561523438, -0.756622314453125, -0.7308120727539062, -0.7050018310546875, -0.6791915893554688, -0.65338134765625, -0.6275711059570312, -0.6017608642578125, -0.5759506225585938, -0.550140380859375, -0.5243301391601562, -0.4985198974609375, -0.47270965576171875, -0.4468994140625, -0.42108917236328125, -0.3952789306640625, -0.36946868896484375, -0.343658447265625, -0.31784820556640625, -0.2920379638671875, -0.26622772216796875, -0.24041748046875, -0.21460723876953125, -0.1887969970703125, -0.16298675537109375, -0.137176513671875, -0.11136627197265625, -0.0855560302734375, -0.05974578857421875, -0.033935546875, -0.00812530517578125, 0.0176849365234375, 0.04349517822265625, 0.069305419921875, 0.09511566162109375, 0.1209259033203125, 0.14673614501953125, 0.17254638671875, 0.19835662841796875, 0.2241668701171875, 0.24997711181640625, 0.275787353515625, 0.30159759521484375, 0.3274078369140625, 0.35321807861328125, 0.3790283203125, 0.40483856201171875, 0.4306488037109375, 0.45645904541015625, 0.482269287109375, 0.5080795288085938, 0.5338897705078125, 0.5597000122070312, 0.58551025390625, 0.6113204956054688, 0.6371307373046875, 0.6629409790039062, 0.688751220703125, 0.7145614624023438, 0.7403717041015625, 0.7661819458007812, 0.7919921875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 3.0, 8.0, 7.0, 16.0, 24.0, 20.0, 44.0, 35.0, 52.0, 54.0, 68.0, 70.0, 75.0, 59.0, 67.0, 68.0, 76.0, 55.0, 59.0, 25.0, 30.0, 22.0, 22.0, 21.0, 11.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.373291015625, -0.3600883483886719, -0.34688568115234375, -0.3336830139160156, -0.3204803466796875, -0.3072776794433594, -0.29407501220703125, -0.2808723449707031, -0.267669677734375, -0.2544670104980469, -0.24126434326171875, -0.22806167602539062, -0.2148590087890625, -0.20165634155273438, -0.18845367431640625, -0.17525100708007812, -0.16204833984375, -0.14884567260742188, -0.13564300537109375, -0.12244033813476562, -0.1092376708984375, -0.09603500366210938, -0.08283233642578125, -0.06962966918945312, -0.056427001953125, -0.043224334716796875, -0.03002166748046875, -0.016819000244140625, -0.0036163330078125, 0.009586334228515625, 0.02278900146484375, 0.035991668701171875, 0.0491943359375, 0.062397003173828125, 0.07559967041015625, 0.08880233764648438, 0.1020050048828125, 0.11520767211914062, 0.12841033935546875, 0.14161300659179688, 0.154815673828125, 0.16801834106445312, 0.18122100830078125, 0.19442367553710938, 0.2076263427734375, 0.22082901000976562, 0.23403167724609375, 0.24723434448242188, 0.26043701171875, 0.2736396789550781, 0.28684234619140625, 0.3000450134277344, 0.3132476806640625, 0.3264503479003906, 0.33965301513671875, 0.3528556823730469, 0.366058349609375, 0.3792610168457031, 0.39246368408203125, 0.4056663513183594, 0.4188690185546875, 0.4320716857910156, 0.44527435302734375, 0.4584770202636719, 0.4716796875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 13.0, 26.0, 40.0, 51.0, 73.0, 92.0, 145.0, 298.0, 1036.0, 65808.0, 4123696.0, 2439.0, 307.0, 100.0, 51.0, 26.0, 33.0, 22.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75390625, -4.606201171875, -4.45849609375, -4.310791015625, -4.1630859375, -4.015380859375, -3.86767578125, -3.719970703125, -3.572265625, -3.424560546875, -3.27685546875, -3.129150390625, -2.9814453125, -2.833740234375, -2.68603515625, -2.538330078125, -2.390625, -2.242919921875, -2.09521484375, -1.947509765625, -1.7998046875, -1.652099609375, -1.50439453125, -1.356689453125, -1.208984375, -1.061279296875, -0.91357421875, -0.765869140625, -0.6181640625, -0.470458984375, -0.32275390625, -0.175048828125, -0.02734375, 0.120361328125, 0.26806640625, 0.415771484375, 0.5634765625, 0.711181640625, 0.85888671875, 1.006591796875, 1.154296875, 1.302001953125, 1.44970703125, 1.597412109375, 1.7451171875, 1.892822265625, 2.04052734375, 2.188232421875, 2.3359375, 2.483642578125, 2.63134765625, 2.779052734375, 2.9267578125, 3.074462890625, 3.22216796875, 3.369873046875, 3.517578125, 3.665283203125, 3.81298828125, 3.960693359375, 4.1083984375, 4.256103515625, 4.40380859375, 4.551513671875, 4.69921875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 13.0, 32.0, 223.0, 2623.0, 1068.0, 106.0, 14.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-5.93359375, -5.825370788574219, -5.7171478271484375, -5.608924865722656, -5.500701904296875, -5.392478942871094, -5.2842559814453125, -5.176033020019531, -5.06781005859375, -4.959587097167969, -4.8513641357421875, -4.743141174316406, -4.634918212890625, -4.526695251464844, -4.4184722900390625, -4.310249328613281, -4.2020263671875, -4.093803405761719, -3.9855804443359375, -3.8773574829101562, -3.769134521484375, -3.6609115600585938, -3.5526885986328125, -3.4444656372070312, -3.33624267578125, -3.2280197143554688, -3.1197967529296875, -3.0115737915039062, -2.903350830078125, -2.7951278686523438, -2.6869049072265625, -2.5786819458007812, -2.470458984375, -2.3622360229492188, -2.2540130615234375, -2.1457901000976562, -2.037567138671875, -1.9293441772460938, -1.8211212158203125, -1.7128982543945312, -1.60467529296875, -1.4964523315429688, -1.3882293701171875, -1.2800064086914062, -1.171783447265625, -1.0635604858398438, -0.9553375244140625, -0.8471145629882812, -0.7388916015625, -0.6306686401367188, -0.5224456787109375, -0.41422271728515625, -0.305999755859375, -0.19777679443359375, -0.0895538330078125, 0.01866912841796875, 0.12689208984375, 0.23511505126953125, 0.3433380126953125, 0.45156097412109375, 0.559783935546875, 0.6680068969726562, 0.7762298583984375, 0.8844528198242188, 0.99267578125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 12.0, 19.0, 39.0, 136.0, 490.0, 242.0, 39.0, 11.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.63571548461914, -22.935924530029297, -22.236133575439453, -21.536344528198242, -20.8365535736084, -20.136762619018555, -19.436973571777344, -18.7371826171875, -18.037391662597656, -17.337600708007812, -16.63780975341797, -15.938020706176758, -15.238229751586914, -14.53843879699707, -13.838648796081543, -13.138858795166016, -12.439067840576172, -11.739276885986328, -11.0394868850708, -10.339696884155273, -9.63990592956543, -8.940114974975586, -8.240324974060059, -7.540534496307373, -6.8407440185546875, -6.140953540802002, -5.441163063049316, -4.741372585296631, -4.041582107543945, -3.3417916297912598, -2.642001152038574, -1.9422106742858887, -1.2424201965332031, -0.5426297187805176, 0.15716075897216797, 0.8569512367248535, 1.556741714477539, 2.2565321922302246, 2.95632266998291, 3.6561131477355957, 4.355903625488281, 5.055694103240967, 5.755484580993652, 6.455275058746338, 7.155065536499023, 7.854856014251709, 8.554646492004395, 9.254436492919922, 9.954227447509766, 10.65401840209961, 11.353808403015137, 12.053598403930664, 12.753389358520508, 13.453180313110352, 14.152970314025879, 14.852760314941406, 15.55255126953125, 16.252342224121094, 16.952133178710938, 17.65192222595215, 18.351713180541992, 19.051504135131836, 19.751293182373047, 20.45108413696289, 21.150875091552734]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 9.0, 10.0, 20.0, 22.0, 26.0, 31.0, 46.0, 48.0, 49.0, 46.0, 65.0, 50.0, 63.0, 53.0, 75.0, 60.0, 47.0, 41.0, 41.0, 43.0, 29.0, 16.0, 21.0, 13.0, 13.0, 15.0, 9.0, 10.0, 4.0, 2.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.843503952026367, -5.640341758728027, -5.4371795654296875, -5.234017372131348, -5.030855178833008, -4.827692985534668, -4.624530792236328, -4.421368598937988, -4.218206405639648, -4.015044212341309, -3.8118820190429688, -3.608719825744629, -3.405557632446289, -3.202395439147949, -2.9992332458496094, -2.7960710525512695, -2.5929086208343506, -2.3897464275360107, -2.186584234237671, -1.983422040939331, -1.7802598476409912, -1.5770975351333618, -1.373935341835022, -1.1707731485366821, -0.9676109552383423, -0.7644487619400024, -0.5612865686416626, -0.358124315738678, -0.15496212244033813, 0.048200130462646484, 0.25136232376098633, 0.45452451705932617, 0.657686710357666, 0.8608489036560059, 1.0640110969543457, 1.2671732902526855, 1.4703354835510254, 1.6734977960586548, 1.8766599893569946, 2.079822063446045, 2.2829842567443848, 2.4861464500427246, 2.6893086433410645, 2.8924708366394043, 3.095633029937744, 3.298795223236084, 3.501957416534424, 3.7051196098327637, 3.9082820415496826, 4.111444473266602, 4.314606666564941, 4.517768859863281, 4.720931053161621, 4.924093246459961, 5.127255439758301, 5.330417633056641, 5.5335798263549805, 5.73674201965332, 5.93990421295166, 6.14306640625, 6.34622859954834, 6.54939079284668, 6.7525529861450195, 6.955715179443359, 7.158877372741699]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 8.0, 13.0, 13.0, 14.0, 19.0, 23.0, 43.0, 60.0, 102.0, 137.0, 224.0, 423.0, 822.0, 2333.0, 9484.0, 61004.0, 489585.0, 421932.0, 50258.0, 8125.0, 2140.0, 800.0, 389.0, 186.0, 135.0, 78.0, 53.0, 45.0, 28.0, 21.0, 11.0, 16.0, 9.0, 9.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.005859375, -0.96710205078125, -0.9283447265625, -0.88958740234375, -0.850830078125, -0.81207275390625, -0.7733154296875, -0.73455810546875, -0.69580078125, -0.65704345703125, -0.6182861328125, -0.57952880859375, -0.540771484375, -0.50201416015625, -0.4632568359375, -0.42449951171875, -0.3857421875, -0.34698486328125, -0.3082275390625, -0.26947021484375, -0.230712890625, -0.19195556640625, -0.1531982421875, -0.11444091796875, -0.07568359375, -0.03692626953125, 0.0018310546875, 0.04058837890625, 0.079345703125, 0.11810302734375, 0.1568603515625, 0.19561767578125, 0.234375, 0.27313232421875, 0.3118896484375, 0.35064697265625, 0.389404296875, 0.42816162109375, 0.4669189453125, 0.50567626953125, 0.54443359375, 0.58319091796875, 0.6219482421875, 0.66070556640625, 0.699462890625, 0.73822021484375, 0.7769775390625, 0.81573486328125, 0.8544921875, 0.89324951171875, 0.9320068359375, 0.97076416015625, 1.009521484375, 1.04827880859375, 1.0870361328125, 1.12579345703125, 1.16455078125, 1.20330810546875, 1.2420654296875, 1.28082275390625, 1.319580078125, 1.35833740234375, 1.3970947265625, 1.43585205078125, 1.474609375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 9.0, 13.0, 19.0, 24.0, 26.0, 38.0, 35.0, 41.0, 51.0, 50.0, 53.0, 47.0, 68.0, 53.0, 59.0, 69.0, 56.0, 44.0, 49.0, 39.0, 35.0, 30.0, 20.0, 18.0, 15.0, 12.0, 10.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.372802734375, -0.3595428466796875, -0.346282958984375, -0.3330230712890625, -0.31976318359375, -0.3065032958984375, -0.293243408203125, -0.2799835205078125, -0.2667236328125, -0.2534637451171875, -0.240203857421875, -0.2269439697265625, -0.21368408203125, -0.2004241943359375, -0.187164306640625, -0.1739044189453125, -0.16064453125, -0.1473846435546875, -0.134124755859375, -0.1208648681640625, -0.10760498046875, -0.0943450927734375, -0.081085205078125, -0.0678253173828125, -0.0545654296875, -0.0413055419921875, -0.028045654296875, -0.0147857666015625, -0.00152587890625, 0.0117340087890625, 0.024993896484375, 0.0382537841796875, 0.051513671875, 0.0647735595703125, 0.078033447265625, 0.0912933349609375, 0.10455322265625, 0.1178131103515625, 0.131072998046875, 0.1443328857421875, 0.1575927734375, 0.1708526611328125, 0.184112548828125, 0.1973724365234375, 0.21063232421875, 0.2238922119140625, 0.237152099609375, 0.2504119873046875, 0.263671875, 0.2769317626953125, 0.290191650390625, 0.3034515380859375, 0.31671142578125, 0.3299713134765625, 0.343231201171875, 0.3564910888671875, 0.3697509765625, 0.3830108642578125, 0.396270751953125, 0.4095306396484375, 0.42279052734375, 0.4360504150390625, 0.449310302734375, 0.4625701904296875, 0.475830078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 10.0, 9.0, 8.0, 15.0, 13.0, 21.0, 19.0, 40.0, 56.0, 88.0, 114.0, 228.0, 374.0, 757.0, 1685.0, 4252.0, 13280.0, 53742.0, 265612.0, 580649.0, 95005.0, 21566.0, 6329.0, 2382.0, 1036.0, 527.0, 257.0, 149.0, 90.0, 50.0, 50.0, 35.0, 23.0, 17.0, 17.0, 10.0, 8.0, 10.0, 5.0, 3.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.009765625, -0.980224609375, -0.95068359375, -0.921142578125, -0.8916015625, -0.862060546875, -0.83251953125, -0.802978515625, -0.7734375, -0.743896484375, -0.71435546875, -0.684814453125, -0.6552734375, -0.625732421875, -0.59619140625, -0.566650390625, -0.537109375, -0.507568359375, -0.47802734375, -0.448486328125, -0.4189453125, -0.389404296875, -0.35986328125, -0.330322265625, -0.30078125, -0.271240234375, -0.24169921875, -0.212158203125, -0.1826171875, -0.153076171875, -0.12353515625, -0.093994140625, -0.064453125, -0.034912109375, -0.00537109375, 0.024169921875, 0.0537109375, 0.083251953125, 0.11279296875, 0.142333984375, 0.171875, 0.201416015625, 0.23095703125, 0.260498046875, 0.2900390625, 0.319580078125, 0.34912109375, 0.378662109375, 0.408203125, 0.437744140625, 0.46728515625, 0.496826171875, 0.5263671875, 0.555908203125, 0.58544921875, 0.614990234375, 0.64453125, 0.674072265625, 0.70361328125, 0.733154296875, 0.7626953125, 0.792236328125, 0.82177734375, 0.851318359375, 0.880859375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 8.0, 5.0, 5.0, 9.0, 5.0, 5.0, 15.0, 14.0, 17.0, 21.0, 25.0, 21.0, 30.0, 36.0, 48.0, 31.0, 39.0, 48.0, 42.0, 64.0, 54.0, 53.0, 43.0, 42.0, 40.0, 39.0, 40.0, 29.0, 29.0, 29.0, 19.0, 14.0, 26.0, 17.0, 8.0, 8.0, 8.0, 5.0, 9.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.279296875, -1.2348480224609375, -1.190399169921875, -1.1459503173828125, -1.10150146484375, -1.0570526123046875, -1.012603759765625, -0.9681549072265625, -0.9237060546875, -0.8792572021484375, -0.834808349609375, -0.7903594970703125, -0.74591064453125, -0.7014617919921875, -0.657012939453125, -0.6125640869140625, -0.568115234375, -0.5236663818359375, -0.479217529296875, -0.4347686767578125, -0.39031982421875, -0.3458709716796875, -0.301422119140625, -0.2569732666015625, -0.2125244140625, -0.1680755615234375, -0.123626708984375, -0.0791778564453125, -0.03472900390625, 0.0097198486328125, 0.054168701171875, 0.0986175537109375, 0.14306640625, 0.1875152587890625, 0.231964111328125, 0.2764129638671875, 0.32086181640625, 0.3653106689453125, 0.409759521484375, 0.4542083740234375, 0.4986572265625, 0.5431060791015625, 0.587554931640625, 0.6320037841796875, 0.67645263671875, 0.7209014892578125, 0.765350341796875, 0.8097991943359375, 0.854248046875, 0.8986968994140625, 0.943145751953125, 0.9875946044921875, 1.03204345703125, 1.0764923095703125, 1.120941162109375, 1.1653900146484375, 1.2098388671875, 1.2542877197265625, 1.298736572265625, 1.3431854248046875, 1.38763427734375, 1.4320831298828125, 1.476531982421875, 1.5209808349609375, 1.5654296875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 5.0, 9.0, 5.0, 12.0, 12.0, 15.0, 21.0, 34.0, 63.0, 69.0, 124.0, 171.0, 324.0, 564.0, 1233.0, 2666.0, 6526.0, 17778.0, 55988.0, 220788.0, 580610.0, 110914.0, 31820.0, 10949.0, 4104.0, 1844.0, 825.0, 432.0, 221.0, 134.0, 110.0, 70.0, 24.0, 22.0, 16.0, 12.0, 5.0, 7.0, 5.0, 9.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.24365234375, -0.2350311279296875, -0.226409912109375, -0.2177886962890625, -0.20916748046875, -0.2005462646484375, -0.191925048828125, -0.1833038330078125, -0.1746826171875, -0.1660614013671875, -0.157440185546875, -0.1488189697265625, -0.14019775390625, -0.1315765380859375, -0.122955322265625, -0.1143341064453125, -0.105712890625, -0.0970916748046875, -0.088470458984375, -0.0798492431640625, -0.07122802734375, -0.0626068115234375, -0.053985595703125, -0.0453643798828125, -0.0367431640625, -0.0281219482421875, -0.019500732421875, -0.0108795166015625, -0.00225830078125, 0.0063629150390625, 0.014984130859375, 0.0236053466796875, 0.0322265625, 0.0408477783203125, 0.049468994140625, 0.0580902099609375, 0.06671142578125, 0.0753326416015625, 0.083953857421875, 0.0925750732421875, 0.1011962890625, 0.1098175048828125, 0.118438720703125, 0.1270599365234375, 0.13568115234375, 0.1443023681640625, 0.152923583984375, 0.1615447998046875, 0.170166015625, 0.1787872314453125, 0.187408447265625, 0.1960296630859375, 0.20465087890625, 0.2132720947265625, 0.221893310546875, 0.2305145263671875, 0.2391357421875, 0.2477569580078125, 0.256378173828125, 0.2649993896484375, 0.27362060546875, 0.2822418212890625, 0.290863037109375, 0.2994842529296875, 0.30810546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 3.0, 5.0, 0.0, 6.0, 3.0, 5.0, 4.0, 9.0, 7.0, 8.0, 9.0, 23.0, 15.0, 29.0, 36.0, 57.0, 101.0, 137.0, 151.0, 112.0, 79.0, 53.0, 56.0, 25.0, 21.0, 10.0, 10.0, 8.0, 4.0, 5.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.914138793945312e-05, -6.59450888633728e-05, -6.274878978729248e-05, -5.955249071121216e-05, -5.6356191635131836e-05, -5.3159892559051514e-05, -4.996359348297119e-05, -4.676729440689087e-05, -4.357099533081055e-05, -4.0374696254730225e-05, -3.71783971786499e-05, -3.398209810256958e-05, -3.078579902648926e-05, -2.7589499950408936e-05, -2.4393200874328613e-05, -2.119690179824829e-05, -1.800060272216797e-05, -1.4804303646087646e-05, -1.1608004570007324e-05, -8.411705493927002e-06, -5.21540641784668e-06, -2.0191073417663574e-06, 1.1771917343139648e-06, 4.373490810394287e-06, 7.569789886474609e-06, 1.0766088962554932e-05, 1.3962388038635254e-05, 1.7158687114715576e-05, 2.03549861907959e-05, 2.355128526687622e-05, 2.6747584342956543e-05, 2.9943883419036865e-05, 3.314018249511719e-05, 3.633648157119751e-05, 3.953278064727783e-05, 4.2729079723358154e-05, 4.5925378799438477e-05, 4.91216778755188e-05, 5.231797695159912e-05, 5.551427602767944e-05, 5.8710575103759766e-05, 6.190687417984009e-05, 6.510317325592041e-05, 6.829947233200073e-05, 7.149577140808105e-05, 7.469207048416138e-05, 7.78883695602417e-05, 8.108466863632202e-05, 8.428096771240234e-05, 8.747726678848267e-05, 9.067356586456299e-05, 9.386986494064331e-05, 9.706616401672363e-05, 0.00010026246309280396, 0.00010345876216888428, 0.0001066550612449646, 0.00010985136032104492, 0.00011304765939712524, 0.00011624395847320557, 0.00011944025754928589, 0.0001226365566253662, 0.00012583285570144653, 0.00012902915477752686, 0.00013222545385360718, 0.0001354217529296875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 8.0, 6.0, 7.0, 10.0, 16.0, 16.0, 35.0, 67.0, 114.0, 185.0, 352.0, 761.0, 1624.0, 4288.0, 13385.0, 50357.0, 248065.0, 602770.0, 92974.0, 22241.0, 6802.0, 2337.0, 1082.0, 460.0, 241.0, 140.0, 78.0, 48.0, 33.0, 13.0, 19.0, 15.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.43310546875, -0.4225940704345703, -0.4120826721191406, -0.40157127380371094, -0.39105987548828125, -0.38054847717285156, -0.3700370788574219, -0.3595256805419922, -0.3490142822265625, -0.3385028839111328, -0.3279914855957031, -0.31748008728027344, -0.30696868896484375, -0.29645729064941406, -0.2859458923339844, -0.2754344940185547, -0.264923095703125, -0.2544116973876953, -0.24390029907226562, -0.23338890075683594, -0.22287750244140625, -0.21236610412597656, -0.20185470581054688, -0.1913433074951172, -0.1808319091796875, -0.1703205108642578, -0.15980911254882812, -0.14929771423339844, -0.13878631591796875, -0.12827491760253906, -0.11776351928710938, -0.10725212097167969, -0.09674072265625, -0.08622932434082031, -0.07571792602539062, -0.06520652770996094, -0.05469512939453125, -0.04418373107910156, -0.033672332763671875, -0.023160934448242188, -0.0126495361328125, -0.0021381378173828125, 0.008373260498046875, 0.018884658813476562, 0.02939605712890625, 0.03990745544433594, 0.050418853759765625, 0.06093025207519531, 0.071441650390625, 0.08195304870605469, 0.09246444702148438, 0.10297584533691406, 0.11348724365234375, 0.12399864196777344, 0.13451004028320312, 0.1450214385986328, 0.1555328369140625, 0.1660442352294922, 0.17655563354492188, 0.18706703186035156, 0.19757843017578125, 0.20808982849121094, 0.21860122680664062, 0.2291126251220703, 0.2396240234375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 11.0, 5.0, 12.0, 20.0, 25.0, 45.0, 45.0, 87.0, 107.0, 124.0, 111.0, 107.0, 81.0, 76.0, 28.0, 28.0, 25.0, 16.0, 17.0, 12.0, 5.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5180549621582031, -0.5019302368164062, -0.4858055114746094, -0.4696807861328125, -0.4535560607910156, -0.43743133544921875, -0.4213066101074219, -0.405181884765625, -0.3890571594238281, -0.37293243408203125, -0.3568077087402344, -0.3406829833984375, -0.3245582580566406, -0.30843353271484375, -0.2923088073730469, -0.27618408203125, -0.2600593566894531, -0.24393463134765625, -0.22780990600585938, -0.2116851806640625, -0.19556045532226562, -0.17943572998046875, -0.16331100463867188, -0.147186279296875, -0.13106155395507812, -0.11493682861328125, -0.09881210327148438, -0.0826873779296875, -0.06656265258789062, -0.05043792724609375, -0.034313201904296875, -0.0181884765625, -0.002063751220703125, 0.01406097412109375, 0.030185699462890625, 0.0463104248046875, 0.062435150146484375, 0.07855987548828125, 0.09468460083007812, 0.110809326171875, 0.12693405151367188, 0.14305877685546875, 0.15918350219726562, 0.1753082275390625, 0.19143295288085938, 0.20755767822265625, 0.22368240356445312, 0.23980712890625, 0.2559318542480469, 0.27205657958984375, 0.2881813049316406, 0.3043060302734375, 0.3204307556152344, 0.33655548095703125, 0.3526802062988281, 0.368804931640625, 0.3849296569824219, 0.40105438232421875, 0.4171791076660156, 0.4333038330078125, 0.4494285583496094, 0.46555328369140625, 0.4816780090332031, 0.497802734375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 7.0, 5.0, 13.0, 20.0, 46.0, 119.0, 211.0, 284.0, 153.0, 76.0, 31.0, 13.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.921339988708496, -11.572976112365723, -11.22461223602295, -10.876248359680176, -10.527884483337402, -10.179520606994629, -9.831157684326172, -9.482793807983398, -9.134429931640625, -8.786066055297852, -8.437702178955078, -8.089338302612305, -7.740974426269531, -7.392610549926758, -7.044247150421143, -6.695883274078369, -6.3475189208984375, -5.999155044555664, -5.650791168212891, -5.302427291870117, -4.954063415527344, -4.60569953918457, -4.257336139678955, -3.9089722633361816, -3.560608386993408, -3.2122445106506348, -2.8638806343078613, -2.515516996383667, -2.1671531200408936, -1.8187892436981201, -1.4704256057739258, -1.1220617294311523, -0.7736978530883789, -0.42533403635025024, -0.07697021961212158, 0.2713935375213623, 0.6197574138641357, 0.9681212902069092, 1.3164849281311035, 1.664848804473877, 2.0132126808166504, 2.361576557159424, 2.7099404335021973, 3.0583040714263916, 3.406667947769165, 3.7550318241119385, 4.103395462036133, 4.451759338378906, 4.80012321472168, 5.148487091064453, 5.496850967407227, 5.84521484375, 6.193578720092773, 6.541942596435547, 6.890305995941162, 7.2386698722839355, 7.587033748626709, 7.935397624969482, 8.283761024475098, 8.632124900817871, 8.980488777160645, 9.328852653503418, 9.677216529846191, 10.025580406188965, 10.373944282531738]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 3.0, 7.0, 5.0, 10.0, 9.0, 12.0, 10.0, 13.0, 15.0, 23.0, 37.0, 22.0, 24.0, 26.0, 31.0, 29.0, 40.0, 50.0, 57.0, 70.0, 75.0, 77.0, 43.0, 43.0, 34.0, 39.0, 35.0, 21.0, 31.0, 17.0, 21.0, 13.0, 16.0, 10.0, 6.0, 9.0, 6.0, 2.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-8.065862655639648, -7.836196422576904, -7.606529712677002, -7.376863479614258, -7.147197246551514, -6.9175310134887695, -6.687864303588867, -6.458198070526123, -6.228531837463379, -5.998865604400635, -5.769198894500732, -5.539532661437988, -5.309866428375244, -5.0802001953125, -4.850533485412598, -4.6208672523498535, -4.391200542449951, -4.161534309387207, -3.931867837905884, -3.7022013664245605, -3.4725351333618164, -3.242868661880493, -3.01320219039917, -2.783535957336426, -2.5538694858551025, -2.3242030143737793, -2.094536781311035, -1.864870309829712, -1.6352039575576782, -1.4055376052856445, -1.1758711338043213, -0.9462047815322876, -0.7165389060974121, -0.48687252402305603, -0.25720614194869995, -0.027539730072021484, 0.2021266222000122, 0.4317929744720459, 0.6614594459533691, 0.8911257982254028, 1.1207921504974365, 1.3504585027694702, 1.580124855041504, 1.8097913265228271, 2.0394577980041504, 2.2691240310668945, 2.4987905025482178, 2.728456974029541, 2.958123207092285, 3.1877896785736084, 3.4174559116363525, 3.647122383117676, 3.87678861618042, 4.106454849243164, 4.336121559143066, 4.5657877922058105, 4.795454025268555, 5.025120258331299, 5.254786968231201, 5.484453201293945, 5.7141194343566895, 5.943785667419434, 6.173452377319336, 6.40311861038208, 6.632785320281982]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 11.0, 11.0, 6.0, 9.0, 31.0, 40.0, 64.0, 109.0, 283.0, 537.0, 1412.0, 4792.0, 26763.0, 573097.0, 3452605.0, 118450.0, 11821.0, 2592.0, 884.0, 339.0, 164.0, 94.0, 42.0, 29.0, 20.0, 16.0, 10.0, 12.0, 9.0, 6.0, 4.0, 4.0, 5.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.82177734375, -0.7955093383789062, -0.7692413330078125, -0.7429733276367188, -0.716705322265625, -0.6904373168945312, -0.6641693115234375, -0.6379013061523438, -0.61163330078125, -0.5853652954101562, -0.5590972900390625, -0.5328292846679688, -0.506561279296875, -0.48029327392578125, -0.4540252685546875, -0.42775726318359375, -0.4014892578125, -0.37522125244140625, -0.3489532470703125, -0.32268524169921875, -0.296417236328125, -0.27014923095703125, -0.2438812255859375, -0.21761322021484375, -0.19134521484375, -0.16507720947265625, -0.1388092041015625, -0.11254119873046875, -0.086273193359375, -0.06000518798828125, -0.0337371826171875, -0.00746917724609375, 0.018798828125, 0.04506683349609375, 0.0713348388671875, 0.09760284423828125, 0.123870849609375, 0.15013885498046875, 0.1764068603515625, 0.20267486572265625, 0.22894287109375, 0.25521087646484375, 0.2814788818359375, 0.30774688720703125, 0.334014892578125, 0.36028289794921875, 0.3865509033203125, 0.41281890869140625, 0.4390869140625, 0.46535491943359375, 0.4916229248046875, 0.5178909301757812, 0.544158935546875, 0.5704269409179688, 0.5966949462890625, 0.6229629516601562, 0.64923095703125, 0.6754989624023438, 0.7017669677734375, 0.7280349731445312, 0.754302978515625, 0.7805709838867188, 0.8068389892578125, 0.8331069946289062, 0.859375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 6.0, 7.0, 11.0, 6.0, 12.0, 18.0, 18.0, 35.0, 39.0, 32.0, 40.0, 64.0, 57.0, 64.0, 60.0, 53.0, 59.0, 62.0, 61.0, 43.0, 55.0, 39.0, 32.0, 27.0, 36.0, 17.0, 12.0, 10.0, 11.0, 10.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.389404296875, -0.3757972717285156, -0.36219024658203125, -0.3485832214355469, -0.3349761962890625, -0.3213691711425781, -0.30776214599609375, -0.2941551208496094, -0.280548095703125, -0.2669410705566406, -0.25333404541015625, -0.23972702026367188, -0.2261199951171875, -0.21251296997070312, -0.19890594482421875, -0.18529891967773438, -0.17169189453125, -0.15808486938476562, -0.14447784423828125, -0.13087081909179688, -0.1172637939453125, -0.10365676879882812, -0.09004974365234375, -0.07644271850585938, -0.062835693359375, -0.049228668212890625, -0.03562164306640625, -0.022014617919921875, -0.0084075927734375, 0.005199432373046875, 0.01880645751953125, 0.032413482666015625, 0.0460205078125, 0.059627532958984375, 0.07323455810546875, 0.08684158325195312, 0.1004486083984375, 0.11405563354492188, 0.12766265869140625, 0.14126968383789062, 0.154876708984375, 0.16848373413085938, 0.18209075927734375, 0.19569778442382812, 0.2093048095703125, 0.22291183471679688, 0.23651885986328125, 0.2501258850097656, 0.26373291015625, 0.2773399353027344, 0.29094696044921875, 0.3045539855957031, 0.3181610107421875, 0.3317680358886719, 0.34537506103515625, 0.3589820861816406, 0.372589111328125, 0.3861961364746094, 0.39980316162109375, 0.4134101867675781, 0.4270172119140625, 0.4406242370605469, 0.45423126220703125, 0.4678382873535156, 0.4814453125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 34.0, 39.0, 47.0, 77.0, 120.0, 216.0, 1441.0, 394313.0, 3794868.0, 2590.0, 241.0, 100.0, 80.0, 50.0, 22.0, 16.0, 13.0, 10.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.845703125, -2.740692138671875, -2.63568115234375, -2.530670166015625, -2.4256591796875, -2.320648193359375, -2.21563720703125, -2.110626220703125, -2.005615234375, -1.900604248046875, -1.79559326171875, -1.690582275390625, -1.5855712890625, -1.480560302734375, -1.37554931640625, -1.270538330078125, -1.16552734375, -1.060516357421875, -0.95550537109375, -0.850494384765625, -0.7454833984375, -0.640472412109375, -0.53546142578125, -0.430450439453125, -0.325439453125, -0.220428466796875, -0.11541748046875, -0.010406494140625, 0.0946044921875, 0.199615478515625, 0.30462646484375, 0.409637451171875, 0.5146484375, 0.619659423828125, 0.72467041015625, 0.829681396484375, 0.9346923828125, 1.039703369140625, 1.14471435546875, 1.249725341796875, 1.354736328125, 1.459747314453125, 1.56475830078125, 1.669769287109375, 1.7747802734375, 1.879791259765625, 1.98480224609375, 2.089813232421875, 2.19482421875, 2.299835205078125, 2.40484619140625, 2.509857177734375, 2.6148681640625, 2.719879150390625, 2.82489013671875, 2.929901123046875, 3.034912109375, 3.139923095703125, 3.24493408203125, 3.349945068359375, 3.4549560546875, 3.559967041015625, 3.66497802734375, 3.769989013671875, 3.875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0, 11.0, 14.0, 31.0, 100.0, 293.0, 1263.0, 1723.0, 408.0, 129.0, 70.0, 19.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.01171875, -2.9528350830078125, -2.893951416015625, -2.8350677490234375, -2.77618408203125, -2.7173004150390625, -2.658416748046875, -2.5995330810546875, -2.5406494140625, -2.4817657470703125, -2.422882080078125, -2.3639984130859375, -2.30511474609375, -2.2462310791015625, -2.187347412109375, -2.1284637451171875, -2.069580078125, -2.0106964111328125, -1.951812744140625, -1.8929290771484375, -1.83404541015625, -1.7751617431640625, -1.716278076171875, -1.6573944091796875, -1.5985107421875, -1.5396270751953125, -1.480743408203125, -1.4218597412109375, -1.36297607421875, -1.3040924072265625, -1.245208740234375, -1.1863250732421875, -1.12744140625, -1.0685577392578125, -1.009674072265625, -0.9507904052734375, -0.89190673828125, -0.8330230712890625, -0.774139404296875, -0.7152557373046875, -0.6563720703125, -0.5974884033203125, -0.538604736328125, -0.4797210693359375, -0.42083740234375, -0.3619537353515625, -0.303070068359375, -0.2441864013671875, -0.185302734375, -0.1264190673828125, -0.067535400390625, -0.0086517333984375, 0.05023193359375, 0.1091156005859375, 0.167999267578125, 0.2268829345703125, 0.2857666015625, 0.3446502685546875, 0.403533935546875, 0.4624176025390625, 0.52130126953125, 0.5801849365234375, 0.639068603515625, 0.6979522705078125, 0.7568359375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 4.0, 17.0, 36.0, 77.0, 202.0, 286.0, 218.0, 85.0, 32.0, 18.0, 10.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.529682159423828, -8.208880424499512, -7.888078212738037, -7.567276477813721, -7.246474266052246, -6.92567253112793, -6.604870796203613, -6.284068584442139, -5.963266372680664, -5.642464637756348, -5.321662425994873, -5.000860691070557, -4.680058479309082, -4.359256744384766, -4.038455009460449, -3.7176527976989746, -3.396851062774658, -3.0760490894317627, -2.755247116088867, -2.434445381164551, -2.113643169403076, -1.7928413152694702, -1.4720394611358643, -1.1512374877929688, -0.8304355144500732, -0.5096335411071777, -0.188831627368927, 0.13197028636932373, 0.45277225971221924, 0.7735742330551147, 1.0943760871887207, 1.4151780605316162, 1.7359800338745117, 2.0567820072174072, 2.3775839805603027, 2.698385715484619, 3.0191879272460938, 3.33998966217041, 3.6607916355133057, 3.981593608856201, 4.302395820617676, 4.623197555541992, 4.943999767303467, 5.264801502227783, 5.585603713989258, 5.906405448913574, 6.227207183837891, 6.548009395599365, 6.868811130523682, 7.189612865447998, 7.510415077209473, 7.831216812133789, 8.152018547058105, 8.472821235656738, 8.793622970581055, 9.114424705505371, 9.435226440429688, 9.756028175354004, 10.07682991027832, 10.397632598876953, 10.71843433380127, 11.039236068725586, 11.360037803649902, 11.680839538574219, 12.001642227172852]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 8.0, 4.0, 5.0, 8.0, 11.0, 12.0, 10.0, 16.0, 13.0, 22.0, 32.0, 31.0, 33.0, 39.0, 44.0, 48.0, 62.0, 48.0, 54.0, 61.0, 46.0, 61.0, 50.0, 46.0, 37.0, 32.0, 28.0, 25.0, 21.0, 20.0, 14.0, 17.0, 9.0, 9.0, 7.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.90915846824646, -3.790902614593506, -3.672646999359131, -3.5543911457061768, -3.4361355304718018, -3.3178796768188477, -3.1996240615844727, -3.0813682079315186, -2.9631123542785645, -2.8448565006256104, -2.7266008853912354, -2.6083450317382812, -2.4900894165039062, -2.371833562850952, -2.253577709197998, -2.135322093963623, -2.017066478729248, -1.8988107442855835, -1.780555009841919, -1.6622991561889648, -1.5440435409545898, -1.4257876873016357, -1.3075319528579712, -1.1892762184143066, -1.071020483970642, -0.9527647495269775, -0.834509015083313, -0.7162532210350037, -0.5979974865913391, -0.47974175214767456, -0.36148595809936523, -0.24323022365570068, -0.12497425079345703, -0.006718501448631287, 0.11153724789619446, 0.2297930121421814, 0.34804874658584595, 0.4663044810295105, 0.5845602750778198, 0.7028160095214844, 0.8210717439651489, 0.9393274784088135, 1.057583212852478, 1.1758389472961426, 1.2940948009490967, 1.4123504161834717, 1.5306062698364258, 1.6488620042800903, 1.7671177387237549, 1.8853734731674194, 2.003629207611084, 2.121885061264038, 2.240140676498413, 2.358396530151367, 2.476652145385742, 2.5949079990386963, 2.7131638526916504, 2.8314197063446045, 2.9496753215789795, 3.0679311752319336, 3.1861867904663086, 3.3044426441192627, 3.422698497772217, 3.540954113006592, 3.659209728240967]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 8.0, 9.0, 1.0, 8.0, 17.0, 19.0, 36.0, 45.0, 74.0, 118.0, 193.0, 329.0, 628.0, 1419.0, 3558.0, 10062.0, 36328.0, 163397.0, 526175.0, 234194.0, 50286.0, 13864.0, 4389.0, 1654.0, 726.0, 373.0, 238.0, 157.0, 74.0, 64.0, 34.0, 24.0, 15.0, 11.0, 9.0, 5.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.03515625, -1.0076370239257812, -0.9801177978515625, -0.9525985717773438, -0.925079345703125, -0.8975601196289062, -0.8700408935546875, -0.8425216674804688, -0.81500244140625, -0.7874832153320312, -0.7599639892578125, -0.7324447631835938, -0.704925537109375, -0.6774063110351562, -0.6498870849609375, -0.6223678588867188, -0.5948486328125, -0.5673294067382812, -0.5398101806640625, -0.5122909545898438, -0.484771728515625, -0.45725250244140625, -0.4297332763671875, -0.40221405029296875, -0.37469482421875, -0.34717559814453125, -0.3196563720703125, -0.29213714599609375, -0.264617919921875, -0.23709869384765625, -0.2095794677734375, -0.18206024169921875, -0.154541015625, -0.12702178955078125, -0.0995025634765625, -0.07198333740234375, -0.044464111328125, -0.01694488525390625, 0.0105743408203125, 0.03809356689453125, 0.06561279296875, 0.09313201904296875, 0.1206512451171875, 0.14817047119140625, 0.175689697265625, 0.20320892333984375, 0.2307281494140625, 0.25824737548828125, 0.2857666015625, 0.31328582763671875, 0.3408050537109375, 0.36832427978515625, 0.395843505859375, 0.42336273193359375, 0.4508819580078125, 0.47840118408203125, 0.50592041015625, 0.5334396362304688, 0.5609588623046875, 0.5884780883789062, 0.615997314453125, 0.6435165405273438, 0.6710357666015625, 0.6985549926757812, 0.72607421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 4.0, 1.0, 8.0, 7.0, 16.0, 5.0, 12.0, 19.0, 18.0, 28.0, 19.0, 30.0, 31.0, 31.0, 64.0, 58.0, 49.0, 44.0, 40.0, 53.0, 55.0, 42.0, 63.0, 44.0, 41.0, 37.0, 38.0, 31.0, 29.0, 24.0, 8.0, 19.0, 9.0, 11.0, 5.0, 2.0, 5.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.317138671875, -0.30498504638671875, -0.2928314208984375, -0.28067779541015625, -0.268524169921875, -0.25637054443359375, -0.2442169189453125, -0.23206329345703125, -0.21990966796875, -0.20775604248046875, -0.1956024169921875, -0.18344879150390625, -0.171295166015625, -0.15914154052734375, -0.1469879150390625, -0.13483428955078125, -0.1226806640625, -0.11052703857421875, -0.0983734130859375, -0.08621978759765625, -0.074066162109375, -0.06191253662109375, -0.0497589111328125, -0.03760528564453125, -0.02545166015625, -0.01329803466796875, -0.0011444091796875, 0.01100921630859375, 0.023162841796875, 0.03531646728515625, 0.0474700927734375, 0.05962371826171875, 0.07177734375, 0.08393096923828125, 0.0960845947265625, 0.10823822021484375, 0.120391845703125, 0.13254547119140625, 0.1446990966796875, 0.15685272216796875, 0.16900634765625, 0.18115997314453125, 0.1933135986328125, 0.20546722412109375, 0.217620849609375, 0.22977447509765625, 0.2419281005859375, 0.25408172607421875, 0.2662353515625, 0.27838897705078125, 0.2905426025390625, 0.30269622802734375, 0.314849853515625, 0.32700347900390625, 0.3391571044921875, 0.35131072998046875, 0.36346435546875, 0.37561798095703125, 0.3877716064453125, 0.39992523193359375, 0.412078857421875, 0.42423248291015625, 0.4363861083984375, 0.44853973388671875, 0.460693359375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 3.0, 5.0, 11.0, 15.0, 19.0, 27.0, 44.0, 68.0, 101.0, 228.0, 449.0, 1130.0, 3972.0, 26355.0, 618393.0, 369456.0, 22588.0, 3650.0, 1083.0, 459.0, 205.0, 117.0, 50.0, 40.0, 20.0, 16.0, 12.0, 9.0, 7.0, 2.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.666015625, -1.612213134765625, -1.55841064453125, -1.504608154296875, -1.4508056640625, -1.397003173828125, -1.34320068359375, -1.289398193359375, -1.235595703125, -1.181793212890625, -1.12799072265625, -1.074188232421875, -1.0203857421875, -0.966583251953125, -0.91278076171875, -0.858978271484375, -0.80517578125, -0.751373291015625, -0.69757080078125, -0.643768310546875, -0.5899658203125, -0.536163330078125, -0.48236083984375, -0.428558349609375, -0.374755859375, -0.320953369140625, -0.26715087890625, -0.213348388671875, -0.1595458984375, -0.105743408203125, -0.05194091796875, 0.001861572265625, 0.0556640625, 0.109466552734375, 0.16326904296875, 0.217071533203125, 0.2708740234375, 0.324676513671875, 0.37847900390625, 0.432281494140625, 0.486083984375, 0.539886474609375, 0.59368896484375, 0.647491455078125, 0.7012939453125, 0.755096435546875, 0.80889892578125, 0.862701416015625, 0.91650390625, 0.970306396484375, 1.02410888671875, 1.077911376953125, 1.1317138671875, 1.185516357421875, 1.23931884765625, 1.293121337890625, 1.346923828125, 1.400726318359375, 1.45452880859375, 1.508331298828125, 1.5621337890625, 1.615936279296875, 1.66973876953125, 1.723541259765625, 1.77734375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 10.0, 7.0, 11.0, 11.0, 19.0, 10.0, 18.0, 26.0, 25.0, 34.0, 41.0, 41.0, 50.0, 43.0, 59.0, 55.0, 63.0, 63.0, 57.0, 39.0, 53.0, 40.0, 30.0, 40.0, 23.0, 30.0, 19.0, 19.0, 12.0, 9.0, 12.0, 6.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7099609375, -1.6599578857421875, -1.609954833984375, -1.5599517822265625, -1.50994873046875, -1.4599456787109375, -1.409942626953125, -1.3599395751953125, -1.3099365234375, -1.2599334716796875, -1.209930419921875, -1.1599273681640625, -1.10992431640625, -1.0599212646484375, -1.009918212890625, -0.9599151611328125, -0.909912109375, -0.8599090576171875, -0.809906005859375, -0.7599029541015625, -0.70989990234375, -0.6598968505859375, -0.609893798828125, -0.5598907470703125, -0.5098876953125, -0.4598846435546875, -0.409881591796875, -0.3598785400390625, -0.30987548828125, -0.2598724365234375, -0.209869384765625, -0.1598663330078125, -0.10986328125, -0.0598602294921875, -0.009857177734375, 0.0401458740234375, 0.09014892578125, 0.1401519775390625, 0.190155029296875, 0.2401580810546875, 0.2901611328125, 0.3401641845703125, 0.390167236328125, 0.4401702880859375, 0.49017333984375, 0.5401763916015625, 0.590179443359375, 0.6401824951171875, 0.690185546875, 0.7401885986328125, 0.790191650390625, 0.8401947021484375, 0.89019775390625, 0.9402008056640625, 0.990203857421875, 1.0402069091796875, 1.0902099609375, 1.1402130126953125, 1.190216064453125, 1.2402191162109375, 1.29022216796875, 1.3402252197265625, 1.390228271484375, 1.4402313232421875, 1.490234375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 8.0, 8.0, 9.0, 11.0, 11.0, 14.0, 25.0, 25.0, 59.0, 68.0, 111.0, 151.0, 238.0, 432.0, 829.0, 1736.0, 3897.0, 10238.0, 33654.0, 167629.0, 708562.0, 86643.0, 21340.0, 7060.0, 2789.0, 1349.0, 667.0, 346.0, 223.0, 136.0, 95.0, 47.0, 41.0, 30.0, 12.0, 17.0, 14.0, 6.0, 4.0, 3.0, 5.0, 2.0, 1.0, 7.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.297607421875, -0.2877922058105469, -0.27797698974609375, -0.2681617736816406, -0.2583465576171875, -0.24853134155273438, -0.23871612548828125, -0.22890090942382812, -0.219085693359375, -0.20927047729492188, -0.19945526123046875, -0.18964004516601562, -0.1798248291015625, -0.17000961303710938, -0.16019439697265625, -0.15037918090820312, -0.14056396484375, -0.13074874877929688, -0.12093353271484375, -0.11111831665039062, -0.1013031005859375, -0.09148788452148438, -0.08167266845703125, -0.07185745239257812, -0.062042236328125, -0.052227020263671875, -0.04241180419921875, -0.032596588134765625, -0.0227813720703125, -0.012966156005859375, -0.00315093994140625, 0.006664276123046875, 0.0164794921875, 0.026294708251953125, 0.03610992431640625, 0.045925140380859375, 0.0557403564453125, 0.06555557250976562, 0.07537078857421875, 0.08518600463867188, 0.095001220703125, 0.10481643676757812, 0.11463165283203125, 0.12444686889648438, 0.1342620849609375, 0.14407730102539062, 0.15389251708984375, 0.16370773315429688, 0.17352294921875, 0.18333816528320312, 0.19315338134765625, 0.20296859741210938, 0.2127838134765625, 0.22259902954101562, 0.23241424560546875, 0.24222946166992188, 0.252044677734375, 0.2618598937988281, 0.27167510986328125, 0.2814903259277344, 0.2913055419921875, 0.3011207580566406, 0.31093597412109375, 0.3207511901855469, 0.33056640625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 12.0, 10.0, 14.0, 14.0, 11.0, 26.0, 34.0, 33.0, 61.0, 74.0, 108.0, 156.0, 126.0, 90.0, 65.0, 39.0, 22.0, 23.0, 19.0, 9.0, 12.0, 10.0, 5.0, 2.0, 7.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.548664093017578e-05, -9.265542030334473e-05, -8.982419967651367e-05, -8.699297904968262e-05, -8.416175842285156e-05, -8.133053779602051e-05, -7.849931716918945e-05, -7.56680965423584e-05, -7.283687591552734e-05, -7.000565528869629e-05, -6.717443466186523e-05, -6.434321403503418e-05, -6.151199340820312e-05, -5.868077278137207e-05, -5.5849552154541016e-05, -5.301833152770996e-05, -5.0187110900878906e-05, -4.735589027404785e-05, -4.45246696472168e-05, -4.169344902038574e-05, -3.886222839355469e-05, -3.603100776672363e-05, -3.319978713989258e-05, -3.0368566513061523e-05, -2.753734588623047e-05, -2.4706125259399414e-05, -2.187490463256836e-05, -1.9043684005737305e-05, -1.621246337890625e-05, -1.3381242752075195e-05, -1.055002212524414e-05, -7.718801498413086e-06, -4.887580871582031e-06, -2.0563602447509766e-06, 7.748603820800781e-07, 3.606081008911133e-06, 6.4373016357421875e-06, 9.268522262573242e-06, 1.2099742889404297e-05, 1.4930963516235352e-05, 1.7762184143066406e-05, 2.059340476989746e-05, 2.3424625396728516e-05, 2.625584602355957e-05, 2.9087066650390625e-05, 3.191828727722168e-05, 3.4749507904052734e-05, 3.758072853088379e-05, 4.0411949157714844e-05, 4.32431697845459e-05, 4.607439041137695e-05, 4.890561103820801e-05, 5.173683166503906e-05, 5.456805229187012e-05, 5.739927291870117e-05, 6.0230493545532227e-05, 6.306171417236328e-05, 6.589293479919434e-05, 6.872415542602539e-05, 7.155537605285645e-05, 7.43865966796875e-05, 7.721781730651855e-05, 8.004903793334961e-05, 8.288025856018066e-05, 8.571147918701172e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 5.0, 3.0, 2.0, 8.0, 4.0, 10.0, 8.0, 20.0, 23.0, 33.0, 69.0, 89.0, 131.0, 194.0, 361.0, 767.0, 1589.0, 3750.0, 12035.0, 50514.0, 579118.0, 337556.0, 44416.0, 11128.0, 3600.0, 1499.0, 702.0, 351.0, 212.0, 120.0, 86.0, 45.0, 33.0, 20.0, 22.0, 11.0, 9.0, 3.0, 4.0, 0.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.304443359375, -0.29315185546875, -0.2818603515625, -0.27056884765625, -0.25927734375, -0.24798583984375, -0.2366943359375, -0.22540283203125, -0.214111328125, -0.20281982421875, -0.1915283203125, -0.18023681640625, -0.1689453125, -0.15765380859375, -0.1463623046875, -0.13507080078125, -0.123779296875, -0.11248779296875, -0.1011962890625, -0.08990478515625, -0.07861328125, -0.06732177734375, -0.0560302734375, -0.04473876953125, -0.033447265625, -0.02215576171875, -0.0108642578125, 0.00042724609375, 0.01171875, 0.02301025390625, 0.0343017578125, 0.04559326171875, 0.056884765625, 0.06817626953125, 0.0794677734375, 0.09075927734375, 0.10205078125, 0.11334228515625, 0.1246337890625, 0.13592529296875, 0.147216796875, 0.15850830078125, 0.1697998046875, 0.18109130859375, 0.1923828125, 0.20367431640625, 0.2149658203125, 0.22625732421875, 0.237548828125, 0.24884033203125, 0.2601318359375, 0.27142333984375, 0.28271484375, 0.29400634765625, 0.3052978515625, 0.31658935546875, 0.327880859375, 0.33917236328125, 0.3504638671875, 0.36175537109375, 0.373046875, 0.38433837890625, 0.3956298828125, 0.40692138671875, 0.418212890625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 5.0, 7.0, 10.0, 8.0, 5.0, 12.0, 19.0, 24.0, 26.0, 39.0, 53.0, 72.0, 88.0, 113.0, 109.0, 107.0, 82.0, 68.0, 38.0, 21.0, 19.0, 15.0, 17.0, 9.0, 8.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.464599609375, -0.4529609680175781, -0.44132232666015625, -0.4296836853027344, -0.4180450439453125, -0.4064064025878906, -0.39476776123046875, -0.3831291198730469, -0.371490478515625, -0.3598518371582031, -0.34821319580078125, -0.3365745544433594, -0.3249359130859375, -0.3132972717285156, -0.30165863037109375, -0.2900199890136719, -0.27838134765625, -0.2667427062988281, -0.25510406494140625, -0.24346542358398438, -0.2318267822265625, -0.22018814086914062, -0.20854949951171875, -0.19691085815429688, -0.185272216796875, -0.17363357543945312, -0.16199493408203125, -0.15035629272460938, -0.1387176513671875, -0.12707901000976562, -0.11544036865234375, -0.10380172729492188, -0.0921630859375, -0.08052444458007812, -0.06888580322265625, -0.057247161865234375, -0.0456085205078125, -0.033969879150390625, -0.02233123779296875, -0.010692596435546875, 0.000946044921875, 0.012584686279296875, 0.02422332763671875, 0.035861968994140625, 0.0475006103515625, 0.059139251708984375, 0.07077789306640625, 0.08241653442382812, 0.09405517578125, 0.10569381713867188, 0.11733245849609375, 0.12897109985351562, 0.1406097412109375, 0.15224838256835938, 0.16388702392578125, 0.17552566528320312, 0.187164306640625, 0.19880294799804688, 0.21044158935546875, 0.22208023071289062, 0.2337188720703125, 0.24535751342773438, 0.25699615478515625, 0.2686347961425781, 0.2802734375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 13.0, 10.0, 21.0, 27.0, 68.0, 112.0, 222.0, 266.0, 129.0, 68.0, 27.0, 16.0, 9.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.044835090637207, -8.753379821777344, -8.46192455291748, -8.1704683303833, -7.8790130615234375, -7.587557792663574, -7.296102523803711, -7.004647254943848, -6.713191509246826, -6.421736240386963, -6.130280494689941, -5.838825225830078, -5.547369956970215, -5.255914211273193, -4.96445894241333, -4.673003196716309, -4.381547927856445, -4.090092658996582, -3.7986369132995605, -3.5071816444396973, -3.215726137161255, -2.9242706298828125, -2.632815361022949, -2.341359853744507, -2.0499043464660645, -1.758448839187622, -1.4669934511184692, -1.1755380630493164, -0.884082555770874, -0.5926270484924316, -0.3011716604232788, -0.009716272354125977, 0.28173828125, 0.5731937289237976, 0.8646491765975952, 1.156104564666748, 1.4475600719451904, 1.7390155792236328, 2.030470848083496, 2.3219263553619385, 2.613381862640381, 2.9048373699188232, 3.1962928771972656, 3.487748146057129, 3.7792036533355713, 4.070659160614014, 4.362114429473877, 4.653570175170898, 4.945025444030762, 5.236480712890625, 5.5279364585876465, 5.81939172744751, 6.110847473144531, 6.4023027420043945, 6.693758010864258, 6.985213279724121, 7.276669025421143, 7.568124294281006, 7.859580039978027, 8.15103530883789, 8.442490577697754, 8.733945846557617, 9.025402069091797, 9.31685733795166, 9.608312606811523]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 3.0, 3.0, 11.0, 8.0, 12.0, 17.0, 16.0, 20.0, 18.0, 27.0, 29.0, 27.0, 31.0, 33.0, 49.0, 67.0, 76.0, 72.0, 74.0, 68.0, 53.0, 35.0, 20.0, 24.0, 32.0, 15.0, 22.0, 19.0, 22.0, 11.0, 11.0, 13.0, 9.0, 10.0, 8.0, 3.0, 7.0, 4.0, 5.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.7383294105529785, -6.555067539215088, -6.3718061447143555, -6.188544273376465, -6.005282402038574, -5.822020530700684, -5.638759136199951, -5.4554972648620605, -5.272235870361328, -5.0889739990234375, -4.905712604522705, -4.7224507331848145, -4.539188861846924, -4.355927467346191, -4.172665596008301, -3.98940372467041, -3.8061418533325195, -3.622880220413208, -3.4396183490753174, -3.256356716156006, -3.0730948448181152, -2.8898332118988037, -2.706571578979492, -2.5233097076416016, -2.34004807472229, -2.1567864418029785, -1.973524570465088, -1.7902629375457764, -1.6070011854171753, -1.4237394332885742, -1.2404778003692627, -1.0572160482406616, -0.8739538192749023, -0.6906920671463013, -0.507430374622345, -0.32416868209838867, -0.1409069299697876, 0.04235482215881348, 0.225616455078125, 0.4088782072067261, 0.5921399593353271, 0.7754017114639282, 0.9586634039878845, 1.1419250965118408, 1.325186848640442, 1.508448600769043, 1.6917102336883545, 1.8749719858169556, 2.0582337379455566, 2.241495370864868, 2.424757242202759, 2.6080188751220703, 2.791280746459961, 2.9745423793792725, 3.157804012298584, 3.3410658836364746, 3.524327516555786, 3.7075891494750977, 3.8908510208129883, 4.074112892150879, 4.257374286651611, 4.440636157989502, 4.623897552490234, 4.807159423828125, 4.990421295166016]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 8.0, 15.0, 22.0, 32.0, 48.0, 101.0, 257.0, 714.0, 2600.0, 16300.0, 639654.0, 3481664.0, 46445.0, 4606.0, 1020.0, 391.0, 146.0, 86.0, 45.0, 41.0, 30.0, 12.0, 8.0, 7.0, 9.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.240234375, -1.19775390625, -1.1552734375, -1.11279296875, -1.0703125, -1.02783203125, -0.9853515625, -0.94287109375, -0.900390625, -0.85791015625, -0.8154296875, -0.77294921875, -0.73046875, -0.68798828125, -0.6455078125, -0.60302734375, -0.560546875, -0.51806640625, -0.4755859375, -0.43310546875, -0.390625, -0.34814453125, -0.3056640625, -0.26318359375, -0.220703125, -0.17822265625, -0.1357421875, -0.09326171875, -0.05078125, -0.00830078125, 0.0341796875, 0.07666015625, 0.119140625, 0.16162109375, 0.2041015625, 0.24658203125, 0.2890625, 0.33154296875, 0.3740234375, 0.41650390625, 0.458984375, 0.50146484375, 0.5439453125, 0.58642578125, 0.62890625, 0.67138671875, 0.7138671875, 0.75634765625, 0.798828125, 0.84130859375, 0.8837890625, 0.92626953125, 0.96875, 1.01123046875, 1.0537109375, 1.09619140625, 1.138671875, 1.18115234375, 1.2236328125, 1.26611328125, 1.30859375, 1.35107421875, 1.3935546875, 1.43603515625, 1.478515625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 13.0, 8.0, 17.0, 25.0, 19.0, 22.0, 27.0, 29.0, 32.0, 48.0, 56.0, 44.0, 62.0, 51.0, 47.0, 41.0, 55.0, 52.0, 52.0, 49.0, 35.0, 38.0, 43.0, 28.0, 21.0, 10.0, 12.0, 16.0, 15.0, 3.0, 7.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.343017578125, -0.33060455322265625, -0.3181915283203125, -0.30577850341796875, -0.293365478515625, -0.28095245361328125, -0.2685394287109375, -0.25612640380859375, -0.24371337890625, -0.23130035400390625, -0.2188873291015625, -0.20647430419921875, -0.194061279296875, -0.18164825439453125, -0.1692352294921875, -0.15682220458984375, -0.1444091796875, -0.13199615478515625, -0.1195831298828125, -0.10717010498046875, -0.094757080078125, -0.08234405517578125, -0.0699310302734375, -0.05751800537109375, -0.04510498046875, -0.03269195556640625, -0.0202789306640625, -0.00786590576171875, 0.004547119140625, 0.01696014404296875, 0.0293731689453125, 0.04178619384765625, 0.05419921875, 0.06661224365234375, 0.0790252685546875, 0.09143829345703125, 0.103851318359375, 0.11626434326171875, 0.1286773681640625, 0.14109039306640625, 0.15350341796875, 0.16591644287109375, 0.1783294677734375, 0.19074249267578125, 0.203155517578125, 0.21556854248046875, 0.2279815673828125, 0.24039459228515625, 0.2528076171875, 0.26522064208984375, 0.2776336669921875, 0.29004669189453125, 0.302459716796875, 0.31487274169921875, 0.3272857666015625, 0.33969879150390625, 0.35211181640625, 0.36452484130859375, 0.3769378662109375, 0.38935089111328125, 0.401763916015625, 0.41417694091796875, 0.4265899658203125, 0.43900299072265625, 0.451416015625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 6.0, 22.0, 38.0, 58.0, 80.0, 124.0, 267.0, 4189.0, 4160283.0, 28274.0, 601.0, 137.0, 87.0, 59.0, 25.0, 18.0, 8.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.23046875, -6.06939697265625, -5.9083251953125, -5.74725341796875, -5.586181640625, -5.42510986328125, -5.2640380859375, -5.10296630859375, -4.94189453125, -4.78082275390625, -4.6197509765625, -4.45867919921875, -4.297607421875, -4.13653564453125, -3.9754638671875, -3.81439208984375, -3.6533203125, -3.49224853515625, -3.3311767578125, -3.17010498046875, -3.009033203125, -2.84796142578125, -2.6868896484375, -2.52581787109375, -2.36474609375, -2.20367431640625, -2.0426025390625, -1.88153076171875, -1.720458984375, -1.55938720703125, -1.3983154296875, -1.23724365234375, -1.076171875, -0.91510009765625, -0.7540283203125, -0.59295654296875, -0.431884765625, -0.27081298828125, -0.1097412109375, 0.05133056640625, 0.21240234375, 0.37347412109375, 0.5345458984375, 0.69561767578125, 0.856689453125, 1.01776123046875, 1.1788330078125, 1.33990478515625, 1.5009765625, 1.66204833984375, 1.8231201171875, 1.98419189453125, 2.145263671875, 2.30633544921875, 2.4674072265625, 2.62847900390625, 2.78955078125, 2.95062255859375, 3.1116943359375, 3.27276611328125, 3.433837890625, 3.59490966796875, 3.7559814453125, 3.91705322265625, 4.078125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 8.0, 20.0, 55.0, 186.0, 901.0, 2146.0, 548.0, 131.0, 40.0, 24.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.40625, -4.322021484375, -4.23779296875, -4.153564453125, -4.0693359375, -3.985107421875, -3.90087890625, -3.816650390625, -3.732421875, -3.648193359375, -3.56396484375, -3.479736328125, -3.3955078125, -3.311279296875, -3.22705078125, -3.142822265625, -3.05859375, -2.974365234375, -2.89013671875, -2.805908203125, -2.7216796875, -2.637451171875, -2.55322265625, -2.468994140625, -2.384765625, -2.300537109375, -2.21630859375, -2.132080078125, -2.0478515625, -1.963623046875, -1.87939453125, -1.795166015625, -1.7109375, -1.626708984375, -1.54248046875, -1.458251953125, -1.3740234375, -1.289794921875, -1.20556640625, -1.121337890625, -1.037109375, -0.952880859375, -0.86865234375, -0.784423828125, -0.7001953125, -0.615966796875, -0.53173828125, -0.447509765625, -0.36328125, -0.279052734375, -0.19482421875, -0.110595703125, -0.0263671875, 0.057861328125, 0.14208984375, 0.226318359375, 0.310546875, 0.394775390625, 0.47900390625, 0.563232421875, 0.6474609375, 0.731689453125, 0.81591796875, 0.900146484375, 0.984375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 5.0, 15.0, 14.0, 63.0, 168.0, 322.0, 261.0, 87.0, 41.0, 17.0, 5.0, 9.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0472211837768555, -4.522011756896973, -3.99680233001709, -3.471592903137207, -2.946383476257324, -2.4211740493774414, -1.8959646224975586, -1.3707551956176758, -0.845545768737793, -0.32033634185791016, 0.20487308502197266, 0.7300825119018555, 1.2552919387817383, 1.780501365661621, 2.305710792541504, 2.8309202194213867, 3.3561296463012695, 3.8813390731811523, 4.406548500061035, 4.931757926940918, 5.456967353820801, 5.982176780700684, 6.507386207580566, 7.032595634460449, 7.557805061340332, 8.083014488220215, 8.608223915100098, 9.13343334197998, 9.658642768859863, 10.183852195739746, 10.709061622619629, 11.234271049499512, 11.759479522705078, 12.284688949584961, 12.809898376464844, 13.335107803344727, 13.86031723022461, 14.385526657104492, 14.910736083984375, 15.435945510864258, 15.96115493774414, 16.486364364624023, 17.011573791503906, 17.53678321838379, 18.061992645263672, 18.587202072143555, 19.112411499023438, 19.63762092590332, 20.162830352783203, 20.688039779663086, 21.21324920654297, 21.73845863342285, 22.263668060302734, 22.788877487182617, 23.3140869140625, 23.839296340942383, 24.364505767822266, 24.88971519470215, 25.41492462158203, 25.940134048461914, 26.465343475341797, 26.99055290222168, 27.515762329101562, 28.040971755981445, 28.566181182861328]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 6.0, 11.0, 11.0, 19.0, 19.0, 16.0, 27.0, 31.0, 32.0, 35.0, 39.0, 40.0, 63.0, 50.0, 48.0, 54.0, 50.0, 44.0, 60.0, 53.0, 48.0, 39.0, 29.0, 36.0, 27.0, 24.0, 26.0, 16.0, 8.0, 11.0, 9.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1863203048706055, -5.015599727630615, -4.844879150390625, -4.674158573150635, -4.5034379959106445, -4.332717418670654, -4.161996841430664, -3.991276502609253, -3.8205559253692627, -3.6498353481292725, -3.4791147708892822, -3.308394432067871, -3.137673854827881, -2.9669532775878906, -2.7962327003479004, -2.62551212310791, -2.45479154586792, -2.2840709686279297, -2.1133503913879395, -1.9426299333572388, -1.7719093561172485, -1.6011887788772583, -1.4304683208465576, -1.2597477436065674, -1.0890271663665771, -0.9183065891265869, -0.7475860714912415, -0.576865553855896, -0.40614497661590576, -0.23542439937591553, -0.06470394134521484, 0.10601663589477539, 0.2767372131347656, 0.44745776057243347, 0.6181783080101013, 0.7888988256454468, 0.959619402885437, 1.1303399801254272, 1.301060438156128, 1.4717810153961182, 1.6425015926361084, 1.8132221698760986, 1.9839427471160889, 2.1546630859375, 2.3253836631774902, 2.4961042404174805, 2.6668248176574707, 2.837545394897461, 3.008265972137451, 3.1789865493774414, 3.3497071266174316, 3.520427703857422, 3.691148281097412, 3.8618688583374023, 4.032588958740234, 4.203310012817383, 4.374030113220215, 4.544750690460205, 4.715471267700195, 4.8861918449401855, 5.056912422180176, 5.227632999420166, 5.398353576660156, 5.569073677062988, 5.739794731140137]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 6.0, 5.0, 2.0, 7.0, 17.0, 16.0, 28.0, 51.0, 66.0, 82.0, 135.0, 230.0, 341.0, 578.0, 1038.0, 1883.0, 3425.0, 7360.0, 17229.0, 46453.0, 146403.0, 426777.0, 268070.0, 79212.0, 27340.0, 10957.0, 5062.0, 2454.0, 1366.0, 704.0, 455.0, 285.0, 169.0, 110.0, 74.0, 60.0, 37.0, 19.0, 21.0, 10.0, 8.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.8984375, -0.8739852905273438, -0.8495330810546875, -0.8250808715820312, -0.800628662109375, -0.7761764526367188, -0.7517242431640625, -0.7272720336914062, -0.70281982421875, -0.6783676147460938, -0.6539154052734375, -0.6294631958007812, -0.605010986328125, -0.5805587768554688, -0.5561065673828125, -0.5316543579101562, -0.5072021484375, -0.48274993896484375, -0.4582977294921875, -0.43384552001953125, -0.409393310546875, -0.38494110107421875, -0.3604888916015625, -0.33603668212890625, -0.31158447265625, -0.28713226318359375, -0.2626800537109375, -0.23822784423828125, -0.213775634765625, -0.18932342529296875, -0.1648712158203125, -0.14041900634765625, -0.115966796875, -0.09151458740234375, -0.0670623779296875, -0.04261016845703125, -0.018157958984375, 0.00629425048828125, 0.0307464599609375, 0.05519866943359375, 0.07965087890625, 0.10410308837890625, 0.1285552978515625, 0.15300750732421875, 0.177459716796875, 0.20191192626953125, 0.2263641357421875, 0.25081634521484375, 0.2752685546875, 0.29972076416015625, 0.3241729736328125, 0.34862518310546875, 0.373077392578125, 0.39752960205078125, 0.4219818115234375, 0.44643402099609375, 0.47088623046875, 0.49533843994140625, 0.5197906494140625, 0.5442428588867188, 0.568695068359375, 0.5931472778320312, 0.6175994873046875, 0.6420516967773438, 0.66650390625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 7.0, 2.0, 5.0, 7.0, 15.0, 12.0, 12.0, 20.0, 20.0, 25.0, 24.0, 40.0, 41.0, 55.0, 51.0, 48.0, 52.0, 47.0, 47.0, 55.0, 49.0, 51.0, 52.0, 46.0, 41.0, 24.0, 32.0, 30.0, 16.0, 20.0, 10.0, 18.0, 10.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.371826171875, -0.3586578369140625, -0.345489501953125, -0.3323211669921875, -0.31915283203125, -0.3059844970703125, -0.292816162109375, -0.2796478271484375, -0.2664794921875, -0.2533111572265625, -0.240142822265625, -0.2269744873046875, -0.21380615234375, -0.2006378173828125, -0.187469482421875, -0.1743011474609375, -0.1611328125, -0.1479644775390625, -0.134796142578125, -0.1216278076171875, -0.10845947265625, -0.0952911376953125, -0.082122802734375, -0.0689544677734375, -0.0557861328125, -0.0426177978515625, -0.029449462890625, -0.0162811279296875, -0.00311279296875, 0.0100555419921875, 0.023223876953125, 0.0363922119140625, 0.049560546875, 0.0627288818359375, 0.075897216796875, 0.0890655517578125, 0.10223388671875, 0.1154022216796875, 0.128570556640625, 0.1417388916015625, 0.1549072265625, 0.1680755615234375, 0.181243896484375, 0.1944122314453125, 0.20758056640625, 0.2207489013671875, 0.233917236328125, 0.2470855712890625, 0.26025390625, 0.2734222412109375, 0.286590576171875, 0.2997589111328125, 0.31292724609375, 0.3260955810546875, 0.339263916015625, 0.3524322509765625, 0.3656005859375, 0.3787689208984375, 0.391937255859375, 0.4051055908203125, 0.41827392578125, 0.4314422607421875, 0.444610595703125, 0.4577789306640625, 0.470947265625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 7.0, 11.0, 13.0, 12.0, 23.0, 43.0, 51.0, 77.0, 132.0, 246.0, 451.0, 756.0, 1685.0, 4669.0, 20962.0, 178005.0, 770202.0, 56233.0, 9681.0, 2780.0, 1114.0, 556.0, 292.0, 198.0, 118.0, 79.0, 41.0, 34.0, 25.0, 16.0, 11.0, 11.0, 1.0, 5.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2822265625, -1.236846923828125, -1.19146728515625, -1.146087646484375, -1.1007080078125, -1.055328369140625, -1.00994873046875, -0.964569091796875, -0.919189453125, -0.873809814453125, -0.82843017578125, -0.783050537109375, -0.7376708984375, -0.692291259765625, -0.64691162109375, -0.601531982421875, -0.55615234375, -0.510772705078125, -0.46539306640625, -0.420013427734375, -0.3746337890625, -0.329254150390625, -0.28387451171875, -0.238494873046875, -0.193115234375, -0.147735595703125, -0.10235595703125, -0.056976318359375, -0.0115966796875, 0.033782958984375, 0.07916259765625, 0.124542236328125, 0.169921875, 0.215301513671875, 0.26068115234375, 0.306060791015625, 0.3514404296875, 0.396820068359375, 0.44219970703125, 0.487579345703125, 0.532958984375, 0.578338623046875, 0.62371826171875, 0.669097900390625, 0.7144775390625, 0.759857177734375, 0.80523681640625, 0.850616455078125, 0.89599609375, 0.941375732421875, 0.98675537109375, 1.032135009765625, 1.0775146484375, 1.122894287109375, 1.16827392578125, 1.213653564453125, 1.259033203125, 1.304412841796875, 1.34979248046875, 1.395172119140625, 1.4405517578125, 1.485931396484375, 1.53131103515625, 1.576690673828125, 1.6220703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 8.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 14.0, 17.0, 11.0, 23.0, 14.0, 15.0, 18.0, 22.0, 31.0, 38.0, 39.0, 32.0, 37.0, 34.0, 45.0, 49.0, 58.0, 44.0, 36.0, 48.0, 41.0, 41.0, 37.0, 30.0, 29.0, 23.0, 9.0, 26.0, 21.0, 16.0, 13.0, 20.0, 11.0, 6.0, 5.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-1.142578125, -1.1016693115234375, -1.060760498046875, -1.0198516845703125, -0.97894287109375, -0.9380340576171875, -0.897125244140625, -0.8562164306640625, -0.8153076171875, -0.7743988037109375, -0.733489990234375, -0.6925811767578125, -0.65167236328125, -0.6107635498046875, -0.569854736328125, -0.5289459228515625, -0.488037109375, -0.4471282958984375, -0.406219482421875, -0.3653106689453125, -0.32440185546875, -0.2834930419921875, -0.242584228515625, -0.2016754150390625, -0.1607666015625, -0.1198577880859375, -0.078948974609375, -0.0380401611328125, 0.00286865234375, 0.0437774658203125, 0.084686279296875, 0.1255950927734375, 0.16650390625, 0.2074127197265625, 0.248321533203125, 0.2892303466796875, 0.33013916015625, 0.3710479736328125, 0.411956787109375, 0.4528656005859375, 0.4937744140625, 0.5346832275390625, 0.575592041015625, 0.6165008544921875, 0.65740966796875, 0.6983184814453125, 0.739227294921875, 0.7801361083984375, 0.821044921875, 0.8619537353515625, 0.902862548828125, 0.9437713623046875, 0.98468017578125, 1.0255889892578125, 1.066497802734375, 1.1074066162109375, 1.1483154296875, 1.1892242431640625, 1.230133056640625, 1.2710418701171875, 1.31195068359375, 1.3528594970703125, 1.393768310546875, 1.4346771240234375, 1.4755859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 6.0, 13.0, 8.0, 16.0, 25.0, 38.0, 46.0, 91.0, 173.0, 397.0, 1073.0, 4610.0, 31167.0, 887756.0, 110097.0, 9812.0, 2107.0, 595.0, 236.0, 98.0, 67.0, 32.0, 23.0, 22.0, 7.0, 6.0, 8.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.666015625, -0.64501953125, -0.6240234375, -0.60302734375, -0.58203125, -0.56103515625, -0.5400390625, -0.51904296875, -0.498046875, -0.47705078125, -0.4560546875, -0.43505859375, -0.4140625, -0.39306640625, -0.3720703125, -0.35107421875, -0.330078125, -0.30908203125, -0.2880859375, -0.26708984375, -0.24609375, -0.22509765625, -0.2041015625, -0.18310546875, -0.162109375, -0.14111328125, -0.1201171875, -0.09912109375, -0.078125, -0.05712890625, -0.0361328125, -0.01513671875, 0.005859375, 0.02685546875, 0.0478515625, 0.06884765625, 0.08984375, 0.11083984375, 0.1318359375, 0.15283203125, 0.173828125, 0.19482421875, 0.2158203125, 0.23681640625, 0.2578125, 0.27880859375, 0.2998046875, 0.32080078125, 0.341796875, 0.36279296875, 0.3837890625, 0.40478515625, 0.42578125, 0.44677734375, 0.4677734375, 0.48876953125, 0.509765625, 0.53076171875, 0.5517578125, 0.57275390625, 0.59375, 0.61474609375, 0.6357421875, 0.65673828125, 0.677734375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 6.0, 5.0, 16.0, 16.0, 11.0, 37.0, 53.0, 77.0, 180.0, 261.0, 157.0, 72.0, 27.0, 15.0, 16.0, 14.0, 9.0, 5.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00021958351135253906, -0.0002137012779712677, -0.00020781904458999634, -0.00020193681120872498, -0.0001960545778274536, -0.00019017234444618225, -0.0001842901110649109, -0.00017840787768363953, -0.00017252564430236816, -0.0001666434109210968, -0.00016076117753982544, -0.00015487894415855408, -0.00014899671077728271, -0.00014311447739601135, -0.00013723224401474, -0.00013135001063346863, -0.00012546777725219727, -0.0001195855438709259, -0.00011370331048965454, -0.00010782107710838318, -0.00010193884372711182, -9.605661034584045e-05, -9.017437696456909e-05, -8.429214358329773e-05, -7.840991020202637e-05, -7.2527676820755e-05, -6.664544343948364e-05, -6.076321005821228e-05, -5.488097667694092e-05, -4.8998743295669556e-05, -4.311650991439819e-05, -3.723427653312683e-05, -3.135204315185547e-05, -2.5469809770584106e-05, -1.9587576389312744e-05, -1.3705343008041382e-05, -7.82310962677002e-06, -1.9408762454986572e-06, 3.941357135772705e-06, 9.823590517044067e-06, 1.570582389831543e-05, 2.1588057279586792e-05, 2.7470290660858154e-05, 3.3352524042129517e-05, 3.923475742340088e-05, 4.511699080467224e-05, 5.0999224185943604e-05, 5.6881457567214966e-05, 6.276369094848633e-05, 6.864592432975769e-05, 7.452815771102905e-05, 8.041039109230042e-05, 8.629262447357178e-05, 9.217485785484314e-05, 9.80570912361145e-05, 0.00010393932461738586, 0.00010982155799865723, 0.00011570379137992859, 0.00012158602476119995, 0.0001274682581424713, 0.00013335049152374268, 0.00013923272490501404, 0.0001451149582862854, 0.00015099719166755676, 0.00015687942504882812]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 0.0, 9.0, 5.0, 7.0, 16.0, 23.0, 25.0, 51.0, 72.0, 115.0, 248.0, 473.0, 993.0, 2643.0, 8416.0, 36158.0, 664892.0, 293493.0, 29753.0, 7087.0, 2227.0, 882.0, 418.0, 221.0, 136.0, 69.0, 41.0, 33.0, 16.0, 13.0, 7.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.418701171875, -0.4042320251464844, -0.38976287841796875, -0.3752937316894531, -0.3608245849609375, -0.3463554382324219, -0.33188629150390625, -0.3174171447753906, -0.302947998046875, -0.2884788513183594, -0.27400970458984375, -0.2595405578613281, -0.2450714111328125, -0.23060226440429688, -0.21613311767578125, -0.20166397094726562, -0.18719482421875, -0.17272567749023438, -0.15825653076171875, -0.14378738403320312, -0.1293182373046875, -0.11484909057617188, -0.10037994384765625, -0.08591079711914062, -0.071441650390625, -0.056972503662109375, -0.04250335693359375, -0.028034210205078125, -0.0135650634765625, 0.000904083251953125, 0.01537322998046875, 0.029842376708984375, 0.0443115234375, 0.058780670166015625, 0.07324981689453125, 0.08771896362304688, 0.1021881103515625, 0.11665725708007812, 0.13112640380859375, 0.14559555053710938, 0.160064697265625, 0.17453384399414062, 0.18900299072265625, 0.20347213745117188, 0.2179412841796875, 0.23241043090820312, 0.24687957763671875, 0.2613487243652344, 0.27581787109375, 0.2902870178222656, 0.30475616455078125, 0.3192253112792969, 0.3336944580078125, 0.3481636047363281, 0.36263275146484375, 0.3771018981933594, 0.391571044921875, 0.4060401916503906, 0.42050933837890625, 0.4349784851074219, 0.4494476318359375, 0.4639167785644531, 0.47838592529296875, 0.4928550720214844, 0.50732421875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 6.0, 4.0, 3.0, 3.0, 3.0, 6.0, 2.0, 4.0, 13.0, 10.0, 15.0, 10.0, 17.0, 21.0, 30.0, 32.0, 59.0, 61.0, 77.0, 77.0, 94.0, 88.0, 77.0, 56.0, 61.0, 30.0, 26.0, 15.0, 18.0, 16.0, 13.0, 13.0, 11.0, 2.0, 7.0, 7.0, 2.0, 7.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.365478515625, -0.35546875, -0.345458984375, -0.33544921875, -0.325439453125, -0.3154296875, -0.305419921875, -0.29541015625, -0.285400390625, -0.275390625, -0.265380859375, -0.25537109375, -0.245361328125, -0.2353515625, -0.225341796875, -0.21533203125, -0.205322265625, -0.1953125, -0.185302734375, -0.17529296875, -0.165283203125, -0.1552734375, -0.145263671875, -0.13525390625, -0.125244140625, -0.115234375, -0.105224609375, -0.09521484375, -0.085205078125, -0.0751953125, -0.065185546875, -0.05517578125, -0.045166015625, -0.03515625, -0.025146484375, -0.01513671875, -0.005126953125, 0.0048828125, 0.014892578125, 0.02490234375, 0.034912109375, 0.044921875, 0.054931640625, 0.06494140625, 0.074951171875, 0.0849609375, 0.094970703125, 0.10498046875, 0.114990234375, 0.125, 0.135009765625, 0.14501953125, 0.155029296875, 0.1650390625, 0.175048828125, 0.18505859375, 0.195068359375, 0.205078125, 0.215087890625, 0.22509765625, 0.235107421875, 0.2451171875, 0.255126953125, 0.26513671875, 0.275146484375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 7.0, 6.0, 14.0, 14.0, 62.0, 83.0, 259.0, 304.0, 131.0, 53.0, 41.0, 18.0, 8.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.180699348449707, -14.828330039978027, -14.475959777832031, -14.123590469360352, -13.771220207214355, -13.418850898742676, -13.06648063659668, -12.714111328125, -12.36174201965332, -12.00937271118164, -11.657002449035645, -11.304633140563965, -10.952262878417969, -10.599893569946289, -10.24752426147461, -9.895153999328613, -9.542783737182617, -9.190414428710938, -8.838044166564941, -8.485674858093262, -8.133304595947266, -7.780935287475586, -7.428565502166748, -7.07619571685791, -6.723825931549072, -6.371456146240234, -6.0190863609313965, -5.666716575622559, -5.314347267150879, -4.961977005004883, -4.609607696533203, -4.257237911224365, -3.904867172241211, -3.552497386932373, -3.200127601623535, -2.8477580547332764, -2.4953882694244385, -2.1430184841156006, -1.7906489372253418, -1.438279151916504, -1.085909366607666, -0.7335396409034729, -0.3811699151992798, -0.028800249099731445, 0.32356953620910645, 0.6759393215179443, 1.0283088684082031, 1.380678653717041, 1.733048439025879, 2.085418224334717, 2.4377880096435547, 2.7901575565338135, 3.1425273418426514, 3.4948971271514893, 3.847266674041748, 4.199636459350586, 4.552006244659424, 4.904376029968262, 5.2567458152771, 5.6091156005859375, 5.961484909057617, 6.313855171203613, 6.666224479675293, 7.018594264984131, 7.370964050292969]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 7.0, 4.0, 6.0, 13.0, 11.0, 9.0, 18.0, 15.0, 18.0, 26.0, 16.0, 36.0, 31.0, 30.0, 65.0, 71.0, 67.0, 63.0, 67.0, 83.0, 71.0, 48.0, 33.0, 34.0, 22.0, 23.0, 20.0, 12.0, 19.0, 14.0, 12.0, 6.0, 10.0, 4.0, 3.0, 3.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.743718147277832, -6.538629055023193, -6.333540439605713, -6.128451347351074, -5.9233622550964355, -5.718273162841797, -5.513184547424316, -5.308095455169678, -5.103006362915039, -4.8979172706604, -4.69282865524292, -4.487739562988281, -4.282650470733643, -4.077561378479004, -3.8724727630615234, -3.6673836708068848, -3.4622950553894043, -3.2572062015533447, -3.052117109298706, -2.8470282554626465, -2.641939163208008, -2.4368503093719482, -2.2317614555358887, -2.02667236328125, -1.8215835094451904, -1.6164945363998413, -1.4114055633544922, -1.2063167095184326, -1.0012277364730835, -0.7961387634277344, -0.5910499095916748, -0.3859609365463257, -0.18087148666381836, 0.024217456579208374, 0.2293063998222351, 0.43439531326293945, 0.6394842863082886, 0.8445732593536377, 1.0496621131896973, 1.2547510862350464, 1.4598400592803955, 1.6649290323257446, 1.8700180053710938, 2.0751068592071533, 2.280195713043213, 2.4852848052978516, 2.690373659133911, 2.8954625129699707, 3.1005516052246094, 3.305640459060669, 3.5107295513153076, 3.715818405151367, 3.920907497406006, 4.1259965896606445, 4.331085205078125, 4.536174297332764, 4.741263389587402, 4.946352481842041, 5.1514410972595215, 5.35653018951416, 5.561619281768799, 5.7667083740234375, 5.971796989440918, 6.176886081695557, 6.381974697113037]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 9.0, 10.0, 11.0, 20.0, 24.0, 45.0, 81.0, 122.0, 251.0, 429.0, 869.0, 1721.0, 4017.0, 10872.0, 37081.0, 194090.0, 1855969.0, 1837738.0, 196283.0, 36192.0, 10661.0, 4011.0, 1723.0, 887.0, 469.0, 262.0, 163.0, 84.0, 61.0, 36.0, 28.0, 20.0, 14.0, 5.0, 5.0, 5.0, 3.0, 8.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92333984375, -0.8935546875, -0.86376953125, -0.833984375, -0.80419921875, -0.7744140625, -0.74462890625, -0.71484375, -0.68505859375, -0.6552734375, -0.62548828125, -0.595703125, -0.56591796875, -0.5361328125, -0.50634765625, -0.4765625, -0.44677734375, -0.4169921875, -0.38720703125, -0.357421875, -0.32763671875, -0.2978515625, -0.26806640625, -0.23828125, -0.20849609375, -0.1787109375, -0.14892578125, -0.119140625, -0.08935546875, -0.0595703125, -0.02978515625, 0.0, 0.02978515625, 0.0595703125, 0.08935546875, 0.119140625, 0.14892578125, 0.1787109375, 0.20849609375, 0.23828125, 0.26806640625, 0.2978515625, 0.32763671875, 0.357421875, 0.38720703125, 0.4169921875, 0.44677734375, 0.4765625, 0.50634765625, 0.5361328125, 0.56591796875, 0.595703125, 0.62548828125, 0.6552734375, 0.68505859375, 0.71484375, 0.74462890625, 0.7744140625, 0.80419921875, 0.833984375, 0.86376953125, 0.8935546875, 0.92333984375, 0.953125, 0.98291015625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 2.0, 4.0, 6.0, 5.0, 14.0, 11.0, 12.0, 17.0, 26.0, 14.0, 25.0, 34.0, 37.0, 31.0, 47.0, 47.0, 47.0, 37.0, 41.0, 52.0, 54.0, 46.0, 46.0, 44.0, 46.0, 43.0, 36.0, 39.0, 24.0, 24.0, 20.0, 15.0, 9.0, 11.0, 9.0, 13.0, 6.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.37060546875, -0.3587989807128906, -0.34699249267578125, -0.3351860046386719, -0.3233795166015625, -0.3115730285644531, -0.29976654052734375, -0.2879600524902344, -0.276153564453125, -0.2643470764160156, -0.25254058837890625, -0.24073410034179688, -0.2289276123046875, -0.21712112426757812, -0.20531463623046875, -0.19350814819335938, -0.18170166015625, -0.16989517211914062, -0.15808868408203125, -0.14628219604492188, -0.1344757080078125, -0.12266921997070312, -0.11086273193359375, -0.09905624389648438, -0.087249755859375, -0.07544326782226562, -0.06363677978515625, -0.051830291748046875, -0.0400238037109375, -0.028217315673828125, -0.01641082763671875, -0.004604339599609375, 0.0072021484375, 0.019008636474609375, 0.03081512451171875, 0.042621612548828125, 0.0544281005859375, 0.06623458862304688, 0.07804107666015625, 0.08984756469726562, 0.101654052734375, 0.11346054077148438, 0.12526702880859375, 0.13707351684570312, 0.1488800048828125, 0.16068649291992188, 0.17249298095703125, 0.18429946899414062, 0.19610595703125, 0.20791244506835938, 0.21971893310546875, 0.23152542114257812, 0.2433319091796875, 0.2551383972167969, 0.26694488525390625, 0.2787513732910156, 0.290557861328125, 0.3023643493652344, 0.31417083740234375, 0.3259773254394531, 0.3377838134765625, 0.3495903015136719, 0.36139678955078125, 0.3732032775878906, 0.385009765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 10.0, 16.0, 27.0, 62.0, 135.0, 385.0, 1338.0, 13730.0, 4127094.0, 48648.0, 2005.0, 499.0, 153.0, 90.0, 36.0, 21.0, 15.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16796875, -3.9915771484375, -3.815185546875, -3.6387939453125, -3.46240234375, -3.2860107421875, -3.109619140625, -2.9332275390625, -2.7568359375, -2.5804443359375, -2.404052734375, -2.2276611328125, -2.05126953125, -1.8748779296875, -1.698486328125, -1.5220947265625, -1.345703125, -1.1693115234375, -0.992919921875, -0.8165283203125, -0.64013671875, -0.4637451171875, -0.287353515625, -0.1109619140625, 0.0654296875, 0.2418212890625, 0.418212890625, 0.5946044921875, 0.77099609375, 0.9473876953125, 1.123779296875, 1.3001708984375, 1.4765625, 1.6529541015625, 1.829345703125, 2.0057373046875, 2.18212890625, 2.3585205078125, 2.534912109375, 2.7113037109375, 2.8876953125, 3.0640869140625, 3.240478515625, 3.4168701171875, 3.59326171875, 3.7696533203125, 3.946044921875, 4.1224365234375, 4.298828125, 4.4752197265625, 4.651611328125, 4.8280029296875, 5.00439453125, 5.1807861328125, 5.357177734375, 5.5335693359375, 5.7099609375, 5.8863525390625, 6.062744140625, 6.2391357421875, 6.41552734375, 6.5919189453125, 6.768310546875, 6.9447021484375, 7.12109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 9.0, 27.0, 47.0, 74.0, 156.0, 306.0, 644.0, 1190.0, 888.0, 380.0, 174.0, 85.0, 49.0, 23.0, 11.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.763671875, -3.670989990234375, -3.57830810546875, -3.485626220703125, -3.3929443359375, -3.300262451171875, -3.20758056640625, -3.114898681640625, -3.022216796875, -2.929534912109375, -2.83685302734375, -2.744171142578125, -2.6514892578125, -2.558807373046875, -2.46612548828125, -2.373443603515625, -2.28076171875, -2.188079833984375, -2.09539794921875, -2.002716064453125, -1.9100341796875, -1.817352294921875, -1.72467041015625, -1.631988525390625, -1.539306640625, -1.446624755859375, -1.35394287109375, -1.261260986328125, -1.1685791015625, -1.075897216796875, -0.98321533203125, -0.890533447265625, -0.7978515625, -0.705169677734375, -0.61248779296875, -0.519805908203125, -0.4271240234375, -0.334442138671875, -0.24176025390625, -0.149078369140625, -0.056396484375, 0.036285400390625, 0.12896728515625, 0.221649169921875, 0.3143310546875, 0.407012939453125, 0.49969482421875, 0.592376708984375, 0.68505859375, 0.777740478515625, 0.87042236328125, 0.963104248046875, 1.0557861328125, 1.148468017578125, 1.24114990234375, 1.333831787109375, 1.426513671875, 1.519195556640625, 1.61187744140625, 1.704559326171875, 1.7972412109375, 1.889923095703125, 1.98260498046875, 2.075286865234375, 2.16796875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 5.0, 9.0, 8.0, 10.0, 25.0, 55.0, 83.0, 172.0, 184.0, 173.0, 91.0, 70.0, 41.0, 27.0, 8.0, 15.0, 4.0, 5.0, 4.0, 4.0, 3.0, 0.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.804410934448242, -22.21473503112793, -21.62506103515625, -21.035385131835938, -20.445709228515625, -19.856033325195312, -19.266357421875, -18.67668342590332, -18.087007522583008, -17.497331619262695, -16.907657623291016, -16.317981719970703, -15.72830581665039, -15.138629913330078, -14.548954963684082, -13.959280014038086, -13.369604110717773, -12.779928207397461, -12.190253257751465, -11.600578308105469, -11.010902404785156, -10.421226501464844, -9.831551551818848, -9.241876602172852, -8.652200698852539, -8.062524795532227, -7.4728498458862305, -6.883174419403076, -6.293498992919922, -5.703823566436768, -5.114148139953613, -4.524472713470459, -3.934795379638672, -3.3451199531555176, -2.7554445266723633, -2.165769100189209, -1.5760936737060547, -0.9864182472229004, -0.3967428207397461, 0.1929326057434082, 0.7826080322265625, 1.3722834587097168, 1.961958885192871, 2.5516343116760254, 3.1413097381591797, 3.730985164642334, 4.320660591125488, 4.910336017608643, 5.500011444091797, 6.089686870574951, 6.6793622970581055, 7.26903772354126, 7.858713150024414, 8.448389053344727, 9.038064002990723, 9.627738952636719, 10.217414855957031, 10.807090759277344, 11.39676570892334, 11.986440658569336, 12.576116561889648, 13.165792465209961, 13.755467414855957, 14.345142364501953, 14.934818267822266]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 4.0, 8.0, 7.0, 19.0, 18.0, 24.0, 29.0, 39.0, 58.0, 57.0, 77.0, 118.0, 90.0, 102.0, 82.0, 64.0, 48.0, 42.0, 35.0, 28.0, 24.0, 15.0, 7.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.61494255065918, -16.147159576416016, -15.679378509521484, -15.211596488952637, -14.743814468383789, -14.276032447814941, -13.808250427246094, -13.34046745300293, -12.872686386108398, -12.40490436553955, -11.937122344970703, -11.469340324401855, -11.001558303833008, -10.53377628326416, -10.065994262695312, -9.598211288452148, -9.1304292678833, -8.662647247314453, -8.194865226745605, -7.727083206176758, -7.25930118560791, -6.7915191650390625, -6.323736667633057, -5.855954647064209, -5.388172626495361, -4.920390605926514, -4.452608585357666, -3.9848263263702393, -3.5170443058013916, -3.049262285232544, -2.581480026245117, -2.1136980056762695, -1.6459150314331055, -1.1781330108642578, -0.7103508710861206, -0.2425687313079834, 0.22521328926086426, 0.6929953098297119, 1.1607775688171387, 1.6285595893859863, 2.096341609954834, 2.5641236305236816, 3.0319056510925293, 3.499687910079956, 3.9674699306488037, 4.4352521896362305, 4.903034210205078, 5.370816230773926, 5.838598251342773, 6.306380271911621, 6.774162292480469, 7.241944313049316, 7.709726333618164, 8.177508354187012, 8.64529037475586, 9.113073348999023, 9.580854415893555, 10.048636436462402, 10.51641845703125, 10.984200477600098, 11.451982498168945, 11.919764518737793, 12.38754653930664, 12.855329513549805, 13.323111534118652]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 6.0, 4.0, 8.0, 10.0, 20.0, 32.0, 50.0, 86.0, 179.0, 301.0, 604.0, 1472.0, 4139.0, 14445.0, 81976.0, 702673.0, 205189.0, 26918.0, 6488.0, 2200.0, 871.0, 393.0, 206.0, 97.0, 67.0, 39.0, 22.0, 22.0, 11.0, 9.0, 6.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0537109375, -1.0182342529296875, -0.982757568359375, -0.9472808837890625, -0.91180419921875, -0.8763275146484375, -0.840850830078125, -0.8053741455078125, -0.7698974609375, -0.7344207763671875, -0.698944091796875, -0.6634674072265625, -0.62799072265625, -0.5925140380859375, -0.557037353515625, -0.5215606689453125, -0.486083984375, -0.4506072998046875, -0.415130615234375, -0.3796539306640625, -0.34417724609375, -0.3087005615234375, -0.273223876953125, -0.2377471923828125, -0.2022705078125, -0.1667938232421875, -0.131317138671875, -0.0958404541015625, -0.06036376953125, -0.0248870849609375, 0.010589599609375, 0.0460662841796875, 0.08154296875, 0.1170196533203125, 0.152496337890625, 0.1879730224609375, 0.22344970703125, 0.2589263916015625, 0.294403076171875, 0.3298797607421875, 0.3653564453125, 0.4008331298828125, 0.436309814453125, 0.4717864990234375, 0.50726318359375, 0.5427398681640625, 0.578216552734375, 0.6136932373046875, 0.649169921875, 0.6846466064453125, 0.720123291015625, 0.7555999755859375, 0.79107666015625, 0.8265533447265625, 0.862030029296875, 0.8975067138671875, 0.9329833984375, 0.9684600830078125, 1.003936767578125, 1.0394134521484375, 1.07489013671875, 1.1103668212890625, 1.145843505859375, 1.1813201904296875, 1.216796875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 13.0, 14.0, 21.0, 34.0, 45.0, 61.0, 105.0, 95.0, 120.0, 113.0, 115.0, 95.0, 58.0, 46.0, 26.0, 21.0, 16.0, 5.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4228515625, -1.38629150390625, -1.3497314453125, -1.31317138671875, -1.276611328125, -1.24005126953125, -1.2034912109375, -1.16693115234375, -1.13037109375, -1.09381103515625, -1.0572509765625, -1.02069091796875, -0.984130859375, -0.94757080078125, -0.9110107421875, -0.87445068359375, -0.837890625, -0.80133056640625, -0.7647705078125, -0.72821044921875, -0.691650390625, -0.65509033203125, -0.6185302734375, -0.58197021484375, -0.54541015625, -0.50885009765625, -0.4722900390625, -0.43572998046875, -0.399169921875, -0.36260986328125, -0.3260498046875, -0.28948974609375, -0.2529296875, -0.21636962890625, -0.1798095703125, -0.14324951171875, -0.106689453125, -0.07012939453125, -0.0335693359375, 0.00299072265625, 0.03955078125, 0.07611083984375, 0.1126708984375, 0.14923095703125, 0.185791015625, 0.22235107421875, 0.2589111328125, 0.29547119140625, 0.33203125, 0.36859130859375, 0.4051513671875, 0.44171142578125, 0.478271484375, 0.51483154296875, 0.5513916015625, 0.58795166015625, 0.62451171875, 0.66107177734375, 0.6976318359375, 0.73419189453125, 0.770751953125, 0.80731201171875, 0.8438720703125, 0.88043212890625, 0.9169921875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 6.0, 7.0, 8.0, 13.0, 18.0, 17.0, 26.0, 27.0, 35.0, 60.0, 100.0, 144.0, 238.0, 438.0, 853.0, 1975.0, 6507.0, 34324.0, 817026.0, 162298.0, 17340.0, 4071.0, 1422.0, 632.0, 343.0, 193.0, 126.0, 80.0, 53.0, 37.0, 27.0, 14.0, 19.0, 16.0, 14.0, 12.0, 10.0, 4.0, 3.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.1650390625, -1.130584716796875, -1.09613037109375, -1.061676025390625, -1.0272216796875, -0.992767333984375, -0.95831298828125, -0.923858642578125, -0.889404296875, -0.854949951171875, -0.82049560546875, -0.786041259765625, -0.7515869140625, -0.717132568359375, -0.68267822265625, -0.648223876953125, -0.61376953125, -0.579315185546875, -0.54486083984375, -0.510406494140625, -0.4759521484375, -0.441497802734375, -0.40704345703125, -0.372589111328125, -0.338134765625, -0.303680419921875, -0.26922607421875, -0.234771728515625, -0.2003173828125, -0.165863037109375, -0.13140869140625, -0.096954345703125, -0.0625, -0.028045654296875, 0.00640869140625, 0.040863037109375, 0.0753173828125, 0.109771728515625, 0.14422607421875, 0.178680419921875, 0.213134765625, 0.247589111328125, 0.28204345703125, 0.316497802734375, 0.3509521484375, 0.385406494140625, 0.41986083984375, 0.454315185546875, 0.48876953125, 0.523223876953125, 0.55767822265625, 0.592132568359375, 0.6265869140625, 0.661041259765625, 0.69549560546875, 0.729949951171875, 0.764404296875, 0.798858642578125, 0.83331298828125, 0.867767333984375, 0.9022216796875, 0.936676025390625, 0.97113037109375, 1.005584716796875, 1.0400390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 7.0, 11.0, 9.0, 13.0, 20.0, 16.0, 20.0, 27.0, 35.0, 35.0, 37.0, 41.0, 53.0, 58.0, 85.0, 81.0, 62.0, 68.0, 36.0, 50.0, 38.0, 30.0, 20.0, 28.0, 12.0, 15.0, 9.0, 12.0, 18.0, 7.0, 9.0, 6.0, 8.0, 2.0, 4.0, 2.0, 1.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.24609375, -2.17864990234375, -2.1112060546875, -2.04376220703125, -1.976318359375, -1.90887451171875, -1.8414306640625, -1.77398681640625, -1.70654296875, -1.63909912109375, -1.5716552734375, -1.50421142578125, -1.436767578125, -1.36932373046875, -1.3018798828125, -1.23443603515625, -1.1669921875, -1.09954833984375, -1.0321044921875, -0.96466064453125, -0.897216796875, -0.82977294921875, -0.7623291015625, -0.69488525390625, -0.62744140625, -0.55999755859375, -0.4925537109375, -0.42510986328125, -0.357666015625, -0.29022216796875, -0.2227783203125, -0.15533447265625, -0.087890625, -0.02044677734375, 0.0469970703125, 0.11444091796875, 0.181884765625, 0.24932861328125, 0.3167724609375, 0.38421630859375, 0.45166015625, 0.51910400390625, 0.5865478515625, 0.65399169921875, 0.721435546875, 0.78887939453125, 0.8563232421875, 0.92376708984375, 0.9912109375, 1.05865478515625, 1.1260986328125, 1.19354248046875, 1.260986328125, 1.32843017578125, 1.3958740234375, 1.46331787109375, 1.53076171875, 1.59820556640625, 1.6656494140625, 1.73309326171875, 1.800537109375, 1.86798095703125, 1.9354248046875, 2.00286865234375, 2.0703125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 2.0, 2.0, 5.0, 6.0, 8.0, 7.0, 10.0, 9.0, 17.0, 13.0, 21.0, 32.0, 33.0, 34.0, 57.0, 86.0, 137.0, 197.0, 341.0, 498.0, 996.0, 1765.0, 3751.0, 9124.0, 28469.0, 165787.0, 767752.0, 46214.0, 13038.0, 4979.0, 2226.0, 1118.0, 658.0, 375.0, 236.0, 151.0, 100.0, 79.0, 58.0, 35.0, 29.0, 14.0, 16.0, 15.0, 7.0, 2.0, 6.0, 7.0, 6.0, 7.0, 5.0, 3.0, 1.0, 3.0, 3.0, 5.0, 3.0], "bins": [-0.1251220703125, -0.12134933471679688, -0.11757659912109375, -0.11380386352539062, -0.1100311279296875, -0.10625839233398438, -0.10248565673828125, -0.09871292114257812, -0.094940185546875, -0.09116744995117188, -0.08739471435546875, -0.08362197875976562, -0.0798492431640625, -0.07607650756835938, -0.07230377197265625, -0.06853103637695312, -0.06475830078125, -0.060985565185546875, -0.05721282958984375, -0.053440093994140625, -0.0496673583984375, -0.045894622802734375, -0.04212188720703125, -0.038349151611328125, -0.034576416015625, -0.030803680419921875, -0.02703094482421875, -0.023258209228515625, -0.0194854736328125, -0.015712738037109375, -0.01194000244140625, -0.008167266845703125, -0.00439453125, -0.000621795654296875, 0.00315093994140625, 0.006923675537109375, 0.0106964111328125, 0.014469146728515625, 0.01824188232421875, 0.022014617919921875, 0.025787353515625, 0.029560089111328125, 0.03333282470703125, 0.037105560302734375, 0.0408782958984375, 0.044651031494140625, 0.04842376708984375, 0.052196502685546875, 0.05596923828125, 0.059741973876953125, 0.06351470947265625, 0.06728744506835938, 0.0710601806640625, 0.07483291625976562, 0.07860565185546875, 0.08237838745117188, 0.086151123046875, 0.08992385864257812, 0.09369659423828125, 0.09746932983398438, 0.1012420654296875, 0.10501480102539062, 0.10878753662109375, 0.11256027221679688, 0.1163330078125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 4.0, 6.0, 5.0, 4.0, 8.0, 11.0, 17.0, 18.0, 23.0, 19.0, 42.0, 44.0, 48.0, 77.0, 81.0, 99.0, 94.0, 103.0, 65.0, 53.0, 38.0, 30.0, 21.0, 13.0, 10.0, 17.0, 11.0, 7.0, 6.0, 2.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.933906555175781e-05, -3.825034946203232e-05, -3.7161633372306824e-05, -3.607291728258133e-05, -3.4984201192855835e-05, -3.389548510313034e-05, -3.2806769013404846e-05, -3.171805292367935e-05, -3.062933683395386e-05, -2.9540620744228363e-05, -2.845190465450287e-05, -2.7363188564777374e-05, -2.627447247505188e-05, -2.5185756385326385e-05, -2.409704029560089e-05, -2.3008324205875397e-05, -2.1919608116149902e-05, -2.0830892026424408e-05, -1.9742175936698914e-05, -1.865345984697342e-05, -1.7564743757247925e-05, -1.647602766752243e-05, -1.5387311577796936e-05, -1.4298595488071442e-05, -1.3209879398345947e-05, -1.2121163308620453e-05, -1.1032447218894958e-05, -9.943731129169464e-06, -8.85501503944397e-06, -7.766298949718475e-06, -6.677582859992981e-06, -5.5888667702674866e-06, -4.500150680541992e-06, -3.411434590816498e-06, -2.3227185010910034e-06, -1.234002411365509e-06, -1.4528632164001465e-07, 9.434297680854797e-07, 2.032145857810974e-06, 3.1208619475364685e-06, 4.209578037261963e-06, 5.298294126987457e-06, 6.387010216712952e-06, 7.475726306438446e-06, 8.56444239616394e-06, 9.653158485889435e-06, 1.074187457561493e-05, 1.1830590665340424e-05, 1.2919306755065918e-05, 1.4008022844791412e-05, 1.5096738934516907e-05, 1.61854550242424e-05, 1.7274171113967896e-05, 1.836288720369339e-05, 1.9451603293418884e-05, 2.054031938314438e-05, 2.1629035472869873e-05, 2.2717751562595367e-05, 2.3806467652320862e-05, 2.4895183742046356e-05, 2.598389983177185e-05, 2.7072615921497345e-05, 2.816133201122284e-05, 2.9250048100948334e-05, 3.0338764190673828e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 0.0, 4.0, 6.0, 11.0, 11.0, 10.0, 19.0, 32.0, 36.0, 53.0, 80.0, 102.0, 155.0, 260.0, 434.0, 787.0, 1351.0, 2306.0, 4573.0, 9862.0, 24107.0, 83287.0, 762770.0, 107502.0, 28373.0, 11285.0, 5140.0, 2476.0, 1399.0, 806.0, 465.0, 302.0, 174.0, 116.0, 86.0, 42.0, 37.0, 27.0, 25.0, 8.0, 8.0, 10.0, 9.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.102294921875, -0.09905529022216797, -0.09581565856933594, -0.0925760269165039, -0.08933639526367188, -0.08609676361083984, -0.08285713195800781, -0.07961750030517578, -0.07637786865234375, -0.07313823699951172, -0.06989860534667969, -0.06665897369384766, -0.06341934204101562, -0.060179710388183594, -0.05694007873535156, -0.05370044708251953, -0.0504608154296875, -0.04722118377685547, -0.04398155212402344, -0.040741920471191406, -0.037502288818359375, -0.034262657165527344, -0.031023025512695312, -0.02778339385986328, -0.02454376220703125, -0.02130413055419922, -0.018064498901367188, -0.014824867248535156, -0.011585235595703125, -0.008345603942871094, -0.0051059722900390625, -0.0018663406372070312, 0.001373291015625, 0.004612922668457031, 0.007852554321289062, 0.011092185974121094, 0.014331817626953125, 0.017571449279785156, 0.020811080932617188, 0.02405071258544922, 0.02729034423828125, 0.03052997589111328, 0.03376960754394531, 0.037009239196777344, 0.040248870849609375, 0.043488502502441406, 0.04672813415527344, 0.04996776580810547, 0.0532073974609375, 0.05644702911376953, 0.05968666076660156, 0.0629262924194336, 0.06616592407226562, 0.06940555572509766, 0.07264518737792969, 0.07588481903076172, 0.07912445068359375, 0.08236408233642578, 0.08560371398925781, 0.08884334564208984, 0.09208297729492188, 0.0953226089477539, 0.09856224060058594, 0.10180187225341797, 0.10504150390625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 4.0, 11.0, 8.0, 10.0, 11.0, 10.0, 12.0, 22.0, 31.0, 29.0, 24.0, 56.0, 72.0, 103.0, 99.0, 95.0, 88.0, 86.0, 47.0, 49.0, 28.0, 14.0, 21.0, 13.0, 9.0, 7.0, 13.0, 6.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2066650390625, -0.20105552673339844, -0.19544601440429688, -0.1898365020751953, -0.18422698974609375, -0.1786174774169922, -0.17300796508789062, -0.16739845275878906, -0.1617889404296875, -0.15617942810058594, -0.15056991577148438, -0.1449604034423828, -0.13935089111328125, -0.1337413787841797, -0.12813186645507812, -0.12252235412597656, -0.116912841796875, -0.11130332946777344, -0.10569381713867188, -0.10008430480957031, -0.09447479248046875, -0.08886528015136719, -0.08325576782226562, -0.07764625549316406, -0.0720367431640625, -0.06642723083496094, -0.060817718505859375, -0.05520820617675781, -0.04959869384765625, -0.04398918151855469, -0.038379669189453125, -0.03277015686035156, -0.02716064453125, -0.021551132202148438, -0.015941619873046875, -0.010332107543945312, -0.00472259521484375, 0.0008869171142578125, 0.006496429443359375, 0.012105941772460938, 0.0177154541015625, 0.023324966430664062, 0.028934478759765625, 0.03454399108886719, 0.04015350341796875, 0.04576301574707031, 0.051372528076171875, 0.05698204040527344, 0.062591552734375, 0.06820106506347656, 0.07381057739257812, 0.07942008972167969, 0.08502960205078125, 0.09063911437988281, 0.09624862670898438, 0.10185813903808594, 0.1074676513671875, 0.11307716369628906, 0.11868667602539062, 0.12429618835449219, 0.12990570068359375, 0.1355152130126953, 0.14112472534179688, 0.14673423767089844, 0.15234375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 19.0, 38.0, 82.0, 271.0, 464.0, 75.0, 30.0, 11.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.785268783569336, -19.27933120727539, -18.773391723632812, -18.267452239990234, -17.76151466369629, -17.255577087402344, -16.749637603759766, -16.243698120117188, -15.737760543823242, -15.23182201385498, -14.725883483886719, -14.219944953918457, -13.714006423950195, -13.208067893981934, -12.702129364013672, -12.19619083404541, -11.690252304077148, -11.184313774108887, -10.678375244140625, -10.172436714172363, -9.666498184204102, -9.16055965423584, -8.654621124267578, -8.148682594299316, -7.642744064331055, -7.136805534362793, -6.630867004394531, -6.1249284744262695, -5.618989944458008, -5.113051414489746, -4.607112884521484, -4.101174354553223, -3.595235824584961, -3.089297294616699, -2.5833587646484375, -2.077420234680176, -1.571481704711914, -1.0655431747436523, -0.5596046447753906, -0.053666114807128906, 0.4522724151611328, 0.9582109451293945, 1.4641494750976562, 1.970088005065918, 2.4760265350341797, 2.9819650650024414, 3.487903594970703, 3.993842124938965, 4.499780654907227, 5.005719184875488, 5.51165771484375, 6.017596244812012, 6.523534774780273, 7.029473304748535, 7.535411834716797, 8.041350364685059, 8.54728889465332, 9.053227424621582, 9.559165954589844, 10.065104484558105, 10.571043014526367, 11.076981544494629, 11.58292007446289, 12.088858604431152, 12.594797134399414]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 10.0, 7.0, 11.0, 10.0, 15.0, 17.0, 26.0, 19.0, 24.0, 37.0, 37.0, 62.0, 107.0, 168.0, 130.0, 69.0, 44.0, 38.0, 20.0, 20.0, 22.0, 15.0, 14.0, 13.0, 9.0, 8.0, 6.0, 5.0, 6.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.757657051086426, -5.540931701660156, -5.324206352233887, -5.107481002807617, -4.8907551765441895, -4.67402982711792, -4.45730447769165, -4.240579128265381, -4.023853302001953, -3.8071279525756836, -3.590402364730835, -3.3736770153045654, -3.156951427459717, -2.9402260780334473, -2.7235007286071777, -2.506775379180908, -2.2900500297546387, -2.073324680328369, -1.8565990924835205, -1.639873743057251, -1.423148274421692, -1.2064228057861328, -0.9896974563598633, -0.7729719877243042, -0.5562465190887451, -0.3395210802555084, -0.12279564142227173, 0.09392976760864258, 0.31065523624420166, 0.5273807048797607, 0.7441060543060303, 0.9608315229415894, 1.1775569915771484, 1.3942824602127075, 1.6110079288482666, 1.8277332782745361, 2.0444588661193848, 2.2611842155456543, 2.477909564971924, 2.6946349143981934, 2.911360502243042, 3.1280858516693115, 3.34481143951416, 3.5615367889404297, 3.778262138366699, 3.994987726211548, 4.211712837219238, 4.428438663482666, 4.6451640129089355, 4.861889362335205, 5.078614711761475, 5.295340538024902, 5.512065887451172, 5.728791236877441, 5.945516586303711, 6.1622419357299805, 6.37896728515625, 6.5956926345825195, 6.812417984008789, 7.029143333435059, 7.245869159698486, 7.462594509124756, 7.679319858551025, 7.896045207977295, 8.112771034240723]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 1.0, 2.0, 3.0, 10.0, 10.0, 6.0, 9.0, 16.0, 13.0, 15.0, 13.0, 19.0, 18.0, 28.0, 26.0, 30.0, 35.0, 59.0, 235.0, 127.0, 48.0, 35.0, 31.0, 27.0, 20.0, 19.0, 27.0, 17.0, 10.0, 17.0, 13.0, 10.0, 8.0, 9.0, 10.0, 3.0, 6.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.446533203125, -0.43294525146484375, -0.4193572998046875, -0.40576934814453125, -0.392181396484375, -0.37859344482421875, -0.3650054931640625, -0.35141754150390625, -0.33782958984375, -0.32424163818359375, -0.3106536865234375, -0.29706573486328125, -0.283477783203125, -0.26988983154296875, -0.2563018798828125, -0.24271392822265625, -0.2291259765625, -0.21553802490234375, -0.2019500732421875, -0.18836212158203125, -0.174774169921875, -0.16118621826171875, -0.1475982666015625, -0.13401031494140625, -0.12042236328125, -0.10683441162109375, -0.0932464599609375, -0.07965850830078125, -0.066070556640625, -0.05248260498046875, -0.0388946533203125, -0.02530670166015625, -0.01171875, 0.00186920166015625, 0.0154571533203125, 0.02904510498046875, 0.042633056640625, 0.05622100830078125, 0.0698089599609375, 0.08339691162109375, 0.09698486328125, 0.11057281494140625, 0.1241607666015625, 0.13774871826171875, 0.151336669921875, 0.16492462158203125, 0.1785125732421875, 0.19210052490234375, 0.2056884765625, 0.21927642822265625, 0.2328643798828125, 0.24645233154296875, 0.260040283203125, 0.27362823486328125, 0.2872161865234375, 0.30080413818359375, 0.31439208984375, 0.32798004150390625, 0.3415679931640625, 0.35515594482421875, 0.368743896484375, 0.38233184814453125, 0.3959197998046875, 0.40950775146484375, 0.423095703125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 9.0, 7.0, 1.0, 2.0, 3.0, 5.0, 6.0, 11.0, 17.0, 30.0, 63.0, 131.0, 307.0, 1012.0, 6654.0, 8359688.0, 18215.0, 1716.0, 384.0, 171.0, 77.0, 26.0, 15.0, 14.0, 8.0, 5.0, 7.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.210654258728027, -5.9687347412109375, -5.726815223693848, -5.484895706176758, -5.242976188659668, -5.001056671142578, -4.759137153625488, -4.51721715927124, -4.27529764175415, -4.0333781242370605, -3.7914586067199707, -3.549539089202881, -3.307619333267212, -3.065699815750122, -2.8237802982330322, -2.5818605422973633, -2.3399412631988525, -2.0980217456817627, -1.8561021089553833, -1.6141825914382935, -1.372262954711914, -1.1303434371948242, -0.8884239196777344, -0.646504282951355, -0.40458476543426514, -0.1626652032136917, 0.07925435900688171, 0.32117390632629395, 0.5630934834480286, 0.8050130605697632, 1.046932578086853, 1.2888522148132324, 1.5307717323303223, 1.772691249847412, 2.014610767364502, 2.256530284881592, 2.4984500408172607, 2.7403695583343506, 2.9822890758514404, 3.2242088317871094, 3.466128349304199, 3.708047866821289, 3.949967384338379, 4.191886901855469, 4.433806419372559, 4.675725936889648, 4.917645454406738, 5.159565448760986, 5.401484489440918, 5.643404006958008, 5.885323524475098, 6.1272430419921875, 6.369162559509277, 6.611082077026367, 6.853001594543457, 7.094921588897705, 7.336841106414795, 7.578760623931885, 7.820680141448975, 8.062600135803223, 8.304519653320312, 8.546439170837402, 8.788358688354492, 9.030278205871582, 9.272197723388672]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 4.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 5.0, 3.0, 2.0, 7.0, 4.0, 6.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.100747108459473, -6.846602916717529, -6.592458724975586, -6.338314533233643, -6.084170341491699, -5.830026149749756, -5.5758819580078125, -5.321737766265869, -5.067593574523926, -4.813449382781982, -4.559305191040039, -4.305160999298096, -4.051016807556152, -3.796872615814209, -3.5427284240722656, -3.2885842323303223, -3.034440040588379, -2.7802958488464355, -2.526151657104492, -2.272007465362549, -2.0178632736206055, -1.763719081878662, -1.5095748901367188, -1.2554306983947754, -1.001286506652832, -0.7471423149108887, -0.4929981231689453, -0.23885393142700195, 0.015290260314941406, 0.26943445205688477, 0.5235786437988281, 0.7777228355407715, 1.0318660736083984, 1.2860102653503418, 1.5401544570922852, 1.7942986488342285, 2.048442840576172, 2.3025870323181152, 2.5567312240600586, 2.810875415802002, 3.0650196075439453, 3.3191637992858887, 3.573307991027832, 3.8274521827697754, 4.081596374511719, 4.335740566253662, 4.5898847579956055, 4.844028949737549, 5.098173141479492, 5.3523173332214355, 5.606461524963379, 5.860605716705322, 6.114749908447266, 6.368894100189209, 6.623038291931152, 6.877182483673096, 7.131326675415039, 7.385470867156982, 7.639615058898926, 7.893759250640869, 8.147903442382812, 8.402048110961914, 8.6561918258667, 8.910335540771484, 9.164480209350586]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 9.0, 25.0, 23.0, 34.0, 54.0, 96.0, 200.0, 372.0, 1043.0, 3369.0, 15236.0, 83808.0, 292086.0, 103736.0, 18331.0, 3932.0, 1080.0, 387.0, 178.0, 100.0, 67.0, 41.0, 30.0, 13.0, 8.0, 5.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.41015625, -6.22467041015625, -6.0391845703125, -5.85369873046875, -5.668212890625, -5.48272705078125, -5.2972412109375, -5.11175537109375, -4.92626953125, -4.74078369140625, -4.5552978515625, -4.36981201171875, -4.184326171875, -3.99884033203125, -3.8133544921875, -3.62786865234375, -3.4423828125, -3.25689697265625, -3.0714111328125, -2.88592529296875, -2.700439453125, -2.51495361328125, -2.3294677734375, -2.14398193359375, -1.95849609375, -1.77301025390625, -1.5875244140625, -1.40203857421875, -1.216552734375, -1.03106689453125, -0.8455810546875, -0.66009521484375, -0.474609375, -0.28912353515625, -0.1036376953125, 0.08184814453125, 0.267333984375, 0.45281982421875, 0.6383056640625, 0.82379150390625, 1.00927734375, 1.19476318359375, 1.3802490234375, 1.56573486328125, 1.751220703125, 1.93670654296875, 2.1221923828125, 2.30767822265625, 2.4931640625, 2.67864990234375, 2.8641357421875, 3.04962158203125, 3.235107421875, 3.42059326171875, 3.6060791015625, 3.79156494140625, 3.97705078125, 4.16253662109375, 4.3480224609375, 4.53350830078125, 4.718994140625, 4.90447998046875, 5.0899658203125, 5.27545166015625, 5.4609375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 6.0, 13.0, 25.0, 30.0, 31.0, 38.0, 60.0, 72.0, 100.0, 110.0, 104.0, 92.0, 77.0, 59.0, 59.0, 38.0, 18.0, 17.0, 20.0, 12.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89794921875, -0.8699569702148438, -0.8419647216796875, -0.8139724731445312, -0.785980224609375, -0.7579879760742188, -0.7299957275390625, -0.7020034790039062, -0.67401123046875, -0.6460189819335938, -0.6180267333984375, -0.5900344848632812, -0.562042236328125, -0.5340499877929688, -0.5060577392578125, -0.47806549072265625, -0.4500732421875, -0.42208099365234375, -0.3940887451171875, -0.36609649658203125, -0.338104248046875, -0.31011199951171875, -0.2821197509765625, -0.25412750244140625, -0.22613525390625, -0.19814300537109375, -0.1701507568359375, -0.14215850830078125, -0.114166259765625, -0.08617401123046875, -0.0581817626953125, -0.03018951416015625, -0.002197265625, 0.02579498291015625, 0.0537872314453125, 0.08177947998046875, 0.109771728515625, 0.13776397705078125, 0.1657562255859375, 0.19374847412109375, 0.22174072265625, 0.24973297119140625, 0.2777252197265625, 0.30571746826171875, 0.333709716796875, 0.36170196533203125, 0.3896942138671875, 0.41768646240234375, 0.4456787109375, 0.47367095947265625, 0.5016632080078125, 0.5296554565429688, 0.557647705078125, 0.5856399536132812, 0.6136322021484375, 0.6416244506835938, 0.66961669921875, 0.6976089477539062, 0.7256011962890625, 0.7535934448242188, 0.781585693359375, 0.8095779418945312, 0.8375701904296875, 0.8655624389648438, 0.8935546875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 5.0, 4.0, 5.0, 12.0, 16.0, 29.0, 56.0, 83.0, 91.0, 61.0, 45.0, 24.0, 15.0, 6.0, 5.0, 7.0, 8.0, 7.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.62237548828125, -3.473726749420166, -3.325077772140503, -3.176429033279419, -3.027780055999756, -2.879131317138672, -2.730482578277588, -2.581833839416504, -2.433184862136841, -2.284536123275757, -2.1358871459960938, -1.9872384071350098, -1.8385895490646362, -1.6899406909942627, -1.5412919521331787, -1.3926430940628052, -1.2439942359924316, -1.095345377922058, -0.9466965794563293, -0.7980477809906006, -0.649398922920227, -0.5007500648498535, -0.35210126638412476, -0.203452467918396, -0.05480360984802246, 0.09384521842002869, 0.24249404668807983, 0.391142874956131, 0.5397917032241821, 0.6884405612945557, 0.8370893597602844, 0.9857381582260132, 1.1343865394592285, 1.283035397529602, 1.4316842555999756, 1.5803329944610596, 1.728981852531433, 1.8776307106018066, 2.0262794494628906, 2.1749281883239746, 2.3235771656036377, 2.4722259044647217, 2.6208748817443848, 2.7695236206054688, 2.9181723594665527, 3.066821336746216, 3.2154700756073, 3.364119052886963, 3.512767791748047, 3.661416530609131, 3.810065507888794, 3.958714246749878, 4.107363224029541, 4.256011962890625, 4.404660701751709, 4.553309440612793, 4.701958656311035, 4.850607395172119, 4.999256134033203, 5.147905349731445, 5.296554088592529, 5.445202827453613, 5.593851566314697, 5.742500305175781, 5.891149044036865]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 9.0, 3.0, 5.0, 3.0, 4.0, 8.0, 12.0, 24.0, 50.0, 67.0, 79.0, 71.0, 55.0, 23.0, 15.0, 6.0, 1.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2175278663635254, -3.1092283725738525, -3.0009288787841797, -2.892629384994507, -2.784329891204834, -2.676030397415161, -2.5677309036254883, -2.4594314098358154, -2.3511319160461426, -2.2428324222564697, -2.134532928466797, -2.026233434677124, -1.9179339408874512, -1.8096344470977783, -1.7013349533081055, -1.5930354595184326, -1.4847360849380493, -1.3764365911483765, -1.2681370973587036, -1.1598376035690308, -1.051538109779358, -0.9432386755943298, -0.834939181804657, -0.7266396880149841, -0.6183401942253113, -0.5100407004356384, -0.4017412066459656, -0.2934417426586151, -0.18514224886894226, -0.0768427848815918, 0.031456708908081055, 0.1397562026977539, 0.24805569648742676, 0.3563551902770996, 0.46465468406677246, 0.5729541778564453, 0.6812536716461182, 0.7895531058311462, 0.8978525996208191, 1.0061521530151367, 1.1144516468048096, 1.2227511405944824, 1.3310506343841553, 1.4393501281738281, 1.547649621963501, 1.6559491157531738, 1.7642486095428467, 1.8725481033325195, 1.9808474779129028, 2.089146852493286, 2.197446346282959, 2.305745840072632, 2.4140453338623047, 2.5223448276519775, 2.6306443214416504, 2.7389438152313232, 2.847243309020996, 2.955542802810669, 3.063842296600342, 3.1721417903900146, 3.2804412841796875, 3.3887407779693604, 3.497040271759033, 3.605339765548706, 3.713639259338379]}, "eval/loss": 4.476690292358398, "eval/wer": 2.426160253867513, "eval/runtime": 1110.5914, "eval/samples_per_second": 2.379, "eval/steps_per_second": 0.298, "train/train_runtime": 6254.5702, "train/train_samples_per_second": 4.563, "train/train_steps_per_second": 0.143, "train/total_flos": 0.0, "train/train_loss": 4.602872911590097} \ No newline at end of file